{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.96, "eval_steps": 500, "global_step": 153600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 2.1875e-06, "loss": 3.7908, "step": 8 }, { "epoch": 0.0, "learning_rate": 4.6875000000000004e-06, "loss": 3.244, "step": 16 }, { "epoch": 0.0, "learning_rate": 7.187499999999999e-06, "loss": 2.6806, "step": 24 }, { "epoch": 0.0, "learning_rate": 9.6875e-06, "loss": 2.5457, "step": 32 }, { "epoch": 0.0, "learning_rate": 1.21875e-05, "loss": 2.5046, "step": 40 }, { "epoch": 0.0, "learning_rate": 1.4687500000000001e-05, "loss": 2.4884, "step": 48 }, { "epoch": 0.0, "learning_rate": 1.71875e-05, "loss": 2.4491, "step": 56 }, { "epoch": 0.0, "learning_rate": 1.96875e-05, "loss": 2.459, "step": 64 }, { "epoch": 0.0, "learning_rate": 2.21875e-05, "loss": 2.4546, "step": 72 }, { "epoch": 0.0, "learning_rate": 2.4687500000000004e-05, "loss": 2.4491, "step": 80 }, { "epoch": 0.0, "learning_rate": 2.71875e-05, "loss": 2.431, "step": 88 }, { "epoch": 0.0, "learning_rate": 2.96875e-05, "loss": 2.4526, "step": 96 }, { "epoch": 0.0, "learning_rate": 3.21875e-05, "loss": 2.4363, "step": 104 }, { "epoch": 0.0, "learning_rate": 3.46875e-05, "loss": 2.4337, "step": 112 }, { "epoch": 0.0, "learning_rate": 3.71875e-05, "loss": 2.437, "step": 120 }, { "epoch": 0.0, "learning_rate": 3.96875e-05, "loss": 2.43, "step": 128 }, { "epoch": 0.0, "learning_rate": 4.21875e-05, "loss": 2.4237, "step": 136 }, { "epoch": 0.0, "learning_rate": 4.46875e-05, "loss": 2.4397, "step": 144 }, { "epoch": 0.0, "learning_rate": 4.71875e-05, "loss": 2.4258, "step": 152 }, { "epoch": 0.0, "learning_rate": 4.96875e-05, "loss": 2.4191, "step": 160 }, { "epoch": 0.0, "learning_rate": 5.21875e-05, "loss": 2.4195, "step": 168 }, { "epoch": 0.0, "learning_rate": 5.46875e-05, "loss": 2.4165, "step": 176 }, { "epoch": 0.0, "learning_rate": 5.718750000000001e-05, "loss": 2.4126, "step": 184 }, { "epoch": 0.0, "learning_rate": 5.968750000000001e-05, "loss": 2.4364, "step": 192 }, { "epoch": 0.0, "learning_rate": 6.21875e-05, "loss": 2.4099, "step": 200 }, { "epoch": 0.0, "learning_rate": 6.468750000000001e-05, "loss": 2.4278, "step": 208 }, { "epoch": 0.0, "learning_rate": 6.71875e-05, "loss": 2.4437, "step": 216 }, { "epoch": 0.0, "learning_rate": 6.96875e-05, "loss": 2.4319, "step": 224 }, { "epoch": 0.0, "learning_rate": 7.218750000000001e-05, "loss": 2.4429, "step": 232 }, { "epoch": 0.0, "learning_rate": 7.468749999999999e-05, "loss": 2.4255, "step": 240 }, { "epoch": 0.0, "learning_rate": 7.71875e-05, "loss": 2.4345, "step": 248 }, { "epoch": 0.0, "learning_rate": 7.96875e-05, "loss": 2.4152, "step": 256 }, { "epoch": 0.0, "learning_rate": 8.218750000000001e-05, "loss": 2.4331, "step": 264 }, { "epoch": 0.0, "learning_rate": 8.46875e-05, "loss": 2.4294, "step": 272 }, { "epoch": 0.0, "learning_rate": 8.71875e-05, "loss": 2.4323, "step": 280 }, { "epoch": 0.0, "learning_rate": 8.96875e-05, "loss": 2.4397, "step": 288 }, { "epoch": 0.0, "learning_rate": 9.21875e-05, "loss": 2.4432, "step": 296 }, { "epoch": 0.0, "learning_rate": 9.46875e-05, "loss": 2.4435, "step": 304 }, { "epoch": 0.0, "learning_rate": 9.718750000000001e-05, "loss": 2.4259, "step": 312 }, { "epoch": 0.0, "learning_rate": 9.96875e-05, "loss": 2.433, "step": 320 }, { "epoch": 0.0, "learning_rate": 0.00010218750000000001, "loss": 2.4046, "step": 328 }, { "epoch": 0.0, "learning_rate": 0.0001046875, "loss": 2.4232, "step": 336 }, { "epoch": 0.0, "learning_rate": 0.0001071875, "loss": 2.4301, "step": 344 }, { "epoch": 0.0, "learning_rate": 0.0001096875, "loss": 2.4404, "step": 352 }, { "epoch": 0.0, "learning_rate": 0.0001121875, "loss": 2.4471, "step": 360 }, { "epoch": 0.0, "learning_rate": 0.00011468750000000002, "loss": 2.4418, "step": 368 }, { "epoch": 0.0, "learning_rate": 0.00011718750000000001, "loss": 2.4427, "step": 376 }, { "epoch": 0.0, "learning_rate": 0.0001196875, "loss": 2.4383, "step": 384 }, { "epoch": 0.0, "learning_rate": 0.0001221875, "loss": 2.4211, "step": 392 }, { "epoch": 0.01, "learning_rate": 0.0001246875, "loss": 2.4363, "step": 400 }, { "epoch": 0.01, "learning_rate": 0.00012718750000000002, "loss": 2.4359, "step": 408 }, { "epoch": 0.01, "learning_rate": 0.0001296875, "loss": 2.4287, "step": 416 }, { "epoch": 0.01, "learning_rate": 0.0001321875, "loss": 2.4371, "step": 424 }, { "epoch": 0.01, "learning_rate": 0.00013468750000000001, "loss": 2.4317, "step": 432 }, { "epoch": 0.01, "learning_rate": 0.0001371875, "loss": 2.4417, "step": 440 }, { "epoch": 0.01, "learning_rate": 0.00013968750000000003, "loss": 2.4406, "step": 448 }, { "epoch": 0.01, "learning_rate": 0.0001421875, "loss": 2.448, "step": 456 }, { "epoch": 0.01, "learning_rate": 0.0001446875, "loss": 2.4444, "step": 464 }, { "epoch": 0.01, "learning_rate": 0.00014718750000000002, "loss": 2.4265, "step": 472 }, { "epoch": 0.01, "learning_rate": 0.0001496875, "loss": 2.4423, "step": 480 }, { "epoch": 0.01, "learning_rate": 0.0001521875, "loss": 2.4551, "step": 488 }, { "epoch": 0.01, "learning_rate": 0.0001546875, "loss": 2.4311, "step": 496 }, { "epoch": 0.01, "learning_rate": 0.0001571875, "loss": 2.4289, "step": 504 }, { "epoch": 0.01, "learning_rate": 0.0001596875, "loss": 2.4416, "step": 512 }, { "epoch": 0.01, "learning_rate": 0.0001621875, "loss": 2.4463, "step": 520 }, { "epoch": 0.01, "learning_rate": 0.0001646875, "loss": 2.4513, "step": 528 }, { "epoch": 0.01, "learning_rate": 0.00016718750000000002, "loss": 2.4543, "step": 536 }, { "epoch": 0.01, "learning_rate": 0.0001696875, "loss": 2.4493, "step": 544 }, { "epoch": 0.01, "learning_rate": 0.0001721875, "loss": 2.4445, "step": 552 }, { "epoch": 0.01, "learning_rate": 0.0001746875, "loss": 2.4467, "step": 560 }, { "epoch": 0.01, "learning_rate": 0.00017718750000000002, "loss": 2.4626, "step": 568 }, { "epoch": 0.01, "learning_rate": 0.0001796875, "loss": 2.4415, "step": 576 }, { "epoch": 0.01, "learning_rate": 0.0001821875, "loss": 2.4567, "step": 584 }, { "epoch": 0.01, "learning_rate": 0.0001846875, "loss": 2.4502, "step": 592 }, { "epoch": 0.01, "learning_rate": 0.00018718750000000002, "loss": 2.4515, "step": 600 }, { "epoch": 0.01, "learning_rate": 0.00018968750000000002, "loss": 2.4469, "step": 608 }, { "epoch": 0.01, "learning_rate": 0.0001921875, "loss": 2.4481, "step": 616 }, { "epoch": 0.01, "learning_rate": 0.0001946875, "loss": 2.4434, "step": 624 }, { "epoch": 0.01, "learning_rate": 0.00019718750000000002, "loss": 2.4621, "step": 632 }, { "epoch": 0.01, "learning_rate": 0.0001996875, "loss": 2.4592, "step": 640 }, { "epoch": 0.01, "learning_rate": 0.00019999999548675498, "loss": 2.4773, "step": 648 }, { "epoch": 0.01, "learning_rate": 0.00019999998194702038, "loss": 2.4694, "step": 656 }, { "epoch": 0.01, "learning_rate": 0.00019999995938079756, "loss": 2.4468, "step": 664 }, { "epoch": 0.01, "learning_rate": 0.0001999999277880888, "loss": 2.4647, "step": 672 }, { "epoch": 0.01, "learning_rate": 0.00019999988716889723, "loss": 2.4333, "step": 680 }, { "epoch": 0.01, "learning_rate": 0.00019999983752322698, "loss": 2.4634, "step": 688 }, { "epoch": 0.01, "learning_rate": 0.00019999977885108293, "loss": 2.462, "step": 696 }, { "epoch": 0.01, "learning_rate": 0.00019999971115247108, "loss": 2.4678, "step": 704 }, { "epoch": 0.01, "learning_rate": 0.00019999963442739814, "loss": 2.4698, "step": 712 }, { "epoch": 0.01, "learning_rate": 0.00019999954867587185, "loss": 2.4364, "step": 720 }, { "epoch": 0.01, "learning_rate": 0.00019999945389790079, "loss": 2.4617, "step": 728 }, { "epoch": 0.01, "learning_rate": 0.0001999993500934945, "loss": 2.46, "step": 736 }, { "epoch": 0.01, "learning_rate": 0.00019999923726266329, "loss": 2.4694, "step": 744 }, { "epoch": 0.01, "learning_rate": 0.0001999991154054186, "loss": 2.4677, "step": 752 }, { "epoch": 0.01, "learning_rate": 0.00019999898452177257, "loss": 2.4403, "step": 760 }, { "epoch": 0.01, "learning_rate": 0.00019999884461173836, "loss": 2.4546, "step": 768 }, { "epoch": 0.01, "learning_rate": 0.00019999869567533, "loss": 2.4709, "step": 776 }, { "epoch": 0.01, "learning_rate": 0.00019999853771256242, "loss": 2.4434, "step": 784 }, { "epoch": 0.01, "learning_rate": 0.00019999837072345148, "loss": 2.456, "step": 792 }, { "epoch": 0.01, "learning_rate": 0.0001999981947080139, "loss": 2.4698, "step": 800 }, { "epoch": 0.01, "learning_rate": 0.00019999800966626736, "loss": 2.4417, "step": 808 }, { "epoch": 0.01, "learning_rate": 0.00019999781559823044, "loss": 2.4621, "step": 816 }, { "epoch": 0.01, "learning_rate": 0.0001999976125039225, "loss": 2.4566, "step": 824 }, { "epoch": 0.01, "learning_rate": 0.000199997400383364, "loss": 2.4626, "step": 832 }, { "epoch": 0.01, "learning_rate": 0.00019999717923657623, "loss": 2.4658, "step": 840 }, { "epoch": 0.01, "learning_rate": 0.0001999969490635813, "loss": 2.452, "step": 848 }, { "epoch": 0.01, "learning_rate": 0.00019999670986440234, "loss": 2.4648, "step": 856 }, { "epoch": 0.01, "learning_rate": 0.00019999646163906335, "loss": 2.4578, "step": 864 }, { "epoch": 0.01, "learning_rate": 0.00019999620438758918, "loss": 2.4739, "step": 872 }, { "epoch": 0.01, "learning_rate": 0.0001999959381100057, "loss": 2.4797, "step": 880 }, { "epoch": 0.01, "learning_rate": 0.00019999566280633953, "loss": 2.4588, "step": 888 }, { "epoch": 0.01, "learning_rate": 0.00019999537847661833, "loss": 2.4708, "step": 896 }, { "epoch": 0.01, "learning_rate": 0.00019999508512087062, "loss": 2.4584, "step": 904 }, { "epoch": 0.01, "learning_rate": 0.0001999947827391258, "loss": 2.4612, "step": 912 }, { "epoch": 0.01, "learning_rate": 0.00019999447133141422, "loss": 2.4454, "step": 920 }, { "epoch": 0.01, "learning_rate": 0.00019999415089776712, "loss": 2.4417, "step": 928 }, { "epoch": 0.01, "learning_rate": 0.00019999382143821658, "loss": 2.452, "step": 936 }, { "epoch": 0.01, "learning_rate": 0.0001999934829527957, "loss": 2.4647, "step": 944 }, { "epoch": 0.01, "learning_rate": 0.00019999313544153844, "loss": 2.4687, "step": 952 }, { "epoch": 0.01, "learning_rate": 0.0001999927789044796, "loss": 2.4574, "step": 960 }, { "epoch": 0.01, "learning_rate": 0.00019999241334165495, "loss": 2.4513, "step": 968 }, { "epoch": 0.01, "learning_rate": 0.00019999203875310117, "loss": 2.4372, "step": 976 }, { "epoch": 0.01, "learning_rate": 0.00019999165513885582, "loss": 2.4729, "step": 984 }, { "epoch": 0.01, "learning_rate": 0.00019999126249895742, "loss": 2.4827, "step": 992 }, { "epoch": 0.01, "learning_rate": 0.00019999086083344526, "loss": 2.4509, "step": 1000 }, { "epoch": 0.01, "learning_rate": 0.0001999904501423597, "loss": 2.4499, "step": 1008 }, { "epoch": 0.01, "learning_rate": 0.0001999900304257419, "loss": 2.4495, "step": 1016 }, { "epoch": 0.01, "learning_rate": 0.00019998960168363396, "loss": 2.4493, "step": 1024 }, { "epoch": 0.01, "learning_rate": 0.00019998916391607892, "loss": 2.4783, "step": 1032 }, { "epoch": 0.01, "learning_rate": 0.0001999887171231206, "loss": 2.4696, "step": 1040 }, { "epoch": 0.01, "learning_rate": 0.00019998826130480387, "loss": 2.458, "step": 1048 }, { "epoch": 0.01, "learning_rate": 0.00019998779646117443, "loss": 2.4689, "step": 1056 }, { "epoch": 0.01, "learning_rate": 0.0001999873225922789, "loss": 2.4648, "step": 1064 }, { "epoch": 0.01, "learning_rate": 0.00019998683969816482, "loss": 2.4683, "step": 1072 }, { "epoch": 0.01, "learning_rate": 0.00019998634777888062, "loss": 2.4603, "step": 1080 }, { "epoch": 0.01, "learning_rate": 0.00019998584683447558, "loss": 2.4625, "step": 1088 }, { "epoch": 0.01, "learning_rate": 0.00019998533686500005, "loss": 2.4614, "step": 1096 }, { "epoch": 0.01, "learning_rate": 0.0001999848178705051, "loss": 2.4478, "step": 1104 }, { "epoch": 0.01, "learning_rate": 0.00019998428985104277, "loss": 2.4685, "step": 1112 }, { "epoch": 0.01, "learning_rate": 0.00019998375280666606, "loss": 2.4549, "step": 1120 }, { "epoch": 0.01, "learning_rate": 0.00019998320673742884, "loss": 2.4505, "step": 1128 }, { "epoch": 0.01, "learning_rate": 0.00019998265164338584, "loss": 2.4779, "step": 1136 }, { "epoch": 0.01, "learning_rate": 0.00019998208752459274, "loss": 2.4484, "step": 1144 }, { "epoch": 0.01, "learning_rate": 0.00019998151438110616, "loss": 2.4654, "step": 1152 }, { "epoch": 0.01, "learning_rate": 0.00019998093221298356, "loss": 2.4586, "step": 1160 }, { "epoch": 0.01, "learning_rate": 0.00019998034102028327, "loss": 2.4604, "step": 1168 }, { "epoch": 0.01, "learning_rate": 0.00019997974080306465, "loss": 2.4624, "step": 1176 }, { "epoch": 0.01, "learning_rate": 0.0001999791315613879, "loss": 2.4584, "step": 1184 }, { "epoch": 0.01, "learning_rate": 0.00019997851329531406, "loss": 2.4749, "step": 1192 }, { "epoch": 0.01, "learning_rate": 0.00019997788600490524, "loss": 2.4656, "step": 1200 }, { "epoch": 0.02, "learning_rate": 0.00019997724969022428, "loss": 2.47, "step": 1208 }, { "epoch": 0.02, "learning_rate": 0.000199976604351335, "loss": 2.4712, "step": 1216 }, { "epoch": 0.02, "learning_rate": 0.00019997594998830216, "loss": 2.4586, "step": 1224 }, { "epoch": 0.02, "learning_rate": 0.00019997528660119134, "loss": 2.4565, "step": 1232 }, { "epoch": 0.02, "learning_rate": 0.00019997461419006914, "loss": 2.4474, "step": 1240 }, { "epoch": 0.02, "learning_rate": 0.00019997393275500292, "loss": 2.4615, "step": 1248 }, { "epoch": 0.02, "learning_rate": 0.00019997324229606108, "loss": 2.4584, "step": 1256 }, { "epoch": 0.02, "learning_rate": 0.00019997254281331283, "loss": 2.4601, "step": 1264 }, { "epoch": 0.02, "learning_rate": 0.00019997183430682836, "loss": 2.4461, "step": 1272 }, { "epoch": 0.02, "learning_rate": 0.00019997111677667875, "loss": 2.4616, "step": 1280 }, { "epoch": 0.02, "learning_rate": 0.0001999703902229359, "loss": 2.4537, "step": 1288 }, { "epoch": 0.02, "learning_rate": 0.00019996965464567278, "loss": 2.4584, "step": 1296 }, { "epoch": 0.02, "learning_rate": 0.000199968910044963, "loss": 2.4498, "step": 1304 }, { "epoch": 0.02, "learning_rate": 0.00019996815642088137, "loss": 2.4746, "step": 1312 }, { "epoch": 0.02, "learning_rate": 0.00019996739377350345, "loss": 2.4598, "step": 1320 }, { "epoch": 0.02, "learning_rate": 0.0001999666221029057, "loss": 2.4702, "step": 1328 }, { "epoch": 0.02, "learning_rate": 0.00019996584140916557, "loss": 2.4624, "step": 1336 }, { "epoch": 0.02, "learning_rate": 0.00019996505169236125, "loss": 2.447, "step": 1344 }, { "epoch": 0.02, "learning_rate": 0.0001999642529525721, "loss": 2.472, "step": 1352 }, { "epoch": 0.02, "learning_rate": 0.0001999634451898781, "loss": 2.4599, "step": 1360 }, { "epoch": 0.02, "learning_rate": 0.00019996262840436032, "loss": 2.4628, "step": 1368 }, { "epoch": 0.02, "learning_rate": 0.00019996180259610063, "loss": 2.4446, "step": 1376 }, { "epoch": 0.02, "learning_rate": 0.0001999609677651819, "loss": 2.4503, "step": 1384 }, { "epoch": 0.02, "learning_rate": 0.0001999601239116879, "loss": 2.4448, "step": 1392 }, { "epoch": 0.02, "learning_rate": 0.00019995927103570317, "loss": 2.4539, "step": 1400 }, { "epoch": 0.02, "learning_rate": 0.00019995840913731333, "loss": 2.4493, "step": 1408 }, { "epoch": 0.02, "learning_rate": 0.00019995753821660473, "loss": 2.4523, "step": 1416 }, { "epoch": 0.02, "learning_rate": 0.00019995665827366482, "loss": 2.4513, "step": 1424 }, { "epoch": 0.02, "learning_rate": 0.0001999557693085818, "loss": 2.4701, "step": 1432 }, { "epoch": 0.02, "learning_rate": 0.0001999548713214448, "loss": 2.4596, "step": 1440 }, { "epoch": 0.02, "learning_rate": 0.00019995396431234395, "loss": 2.4566, "step": 1448 }, { "epoch": 0.02, "learning_rate": 0.0001999530482813702, "loss": 2.4461, "step": 1456 }, { "epoch": 0.02, "learning_rate": 0.0001999521232286154, "loss": 2.4557, "step": 1464 }, { "epoch": 0.02, "learning_rate": 0.00019995118915417233, "loss": 2.4603, "step": 1472 }, { "epoch": 0.02, "learning_rate": 0.00019995024605813468, "loss": 2.4615, "step": 1480 }, { "epoch": 0.02, "learning_rate": 0.00019994929394059706, "loss": 2.4428, "step": 1488 }, { "epoch": 0.02, "learning_rate": 0.0001999483328016549, "loss": 2.4484, "step": 1496 }, { "epoch": 0.02, "learning_rate": 0.00019994736264140466, "loss": 2.4419, "step": 1504 }, { "epoch": 0.02, "learning_rate": 0.00019994638345994362, "loss": 2.4678, "step": 1512 }, { "epoch": 0.02, "learning_rate": 0.00019994539525736998, "loss": 2.4551, "step": 1520 }, { "epoch": 0.02, "learning_rate": 0.00019994439803378282, "loss": 2.4575, "step": 1528 }, { "epoch": 0.02, "learning_rate": 0.0001999433917892822, "loss": 2.4426, "step": 1536 }, { "epoch": 0.02, "learning_rate": 0.00019994237652396909, "loss": 2.4511, "step": 1544 }, { "epoch": 0.02, "learning_rate": 0.0001999413522379452, "loss": 2.4538, "step": 1552 }, { "epoch": 0.02, "learning_rate": 0.00019994031893131334, "loss": 2.4625, "step": 1560 }, { "epoch": 0.02, "learning_rate": 0.0001999392766041771, "loss": 2.4645, "step": 1568 }, { "epoch": 0.02, "learning_rate": 0.00019993822525664107, "loss": 2.4668, "step": 1576 }, { "epoch": 0.02, "learning_rate": 0.00019993716488881063, "loss": 2.4399, "step": 1584 }, { "epoch": 0.02, "learning_rate": 0.00019993609550079217, "loss": 2.4444, "step": 1592 }, { "epoch": 0.02, "learning_rate": 0.00019993501709269295, "loss": 2.4504, "step": 1600 }, { "epoch": 0.02, "learning_rate": 0.00019993392966462112, "loss": 2.4444, "step": 1608 }, { "epoch": 0.02, "learning_rate": 0.00019993283321668572, "loss": 2.457, "step": 1616 }, { "epoch": 0.02, "learning_rate": 0.00019993172774899676, "loss": 2.4689, "step": 1624 }, { "epoch": 0.02, "learning_rate": 0.0001999306132616651, "loss": 2.4495, "step": 1632 }, { "epoch": 0.02, "learning_rate": 0.00019992948975480244, "loss": 2.4523, "step": 1640 }, { "epoch": 0.02, "learning_rate": 0.0001999283572285216, "loss": 2.4741, "step": 1648 }, { "epoch": 0.02, "learning_rate": 0.00019992721568293606, "loss": 2.4476, "step": 1656 }, { "epoch": 0.02, "learning_rate": 0.0001999260651181603, "loss": 2.4605, "step": 1664 }, { "epoch": 0.02, "learning_rate": 0.00019992490553430981, "loss": 2.435, "step": 1672 }, { "epoch": 0.02, "learning_rate": 0.00019992373693150084, "loss": 2.451, "step": 1680 }, { "epoch": 0.02, "learning_rate": 0.00019992255930985058, "loss": 2.4393, "step": 1688 }, { "epoch": 0.02, "learning_rate": 0.00019992137266947716, "loss": 2.4474, "step": 1696 }, { "epoch": 0.02, "learning_rate": 0.00019992017701049957, "loss": 2.4181, "step": 1704 }, { "epoch": 0.02, "learning_rate": 0.00019991897233303773, "loss": 2.4535, "step": 1712 }, { "epoch": 0.02, "learning_rate": 0.0001999177586372125, "loss": 2.4633, "step": 1720 }, { "epoch": 0.02, "learning_rate": 0.00019991653592314556, "loss": 2.4442, "step": 1728 }, { "epoch": 0.02, "learning_rate": 0.00019991530419095956, "loss": 2.4517, "step": 1736 }, { "epoch": 0.02, "learning_rate": 0.0001999140634407781, "loss": 2.4664, "step": 1744 }, { "epoch": 0.02, "learning_rate": 0.00019991281367272548, "loss": 2.4554, "step": 1752 }, { "epoch": 0.02, "learning_rate": 0.00019991155488692714, "loss": 2.428, "step": 1760 }, { "epoch": 0.02, "learning_rate": 0.0001999102870835093, "loss": 2.4654, "step": 1768 }, { "epoch": 0.02, "learning_rate": 0.0001999090102625992, "loss": 2.451, "step": 1776 }, { "epoch": 0.02, "learning_rate": 0.00019990772442432474, "loss": 2.4292, "step": 1784 }, { "epoch": 0.02, "learning_rate": 0.000199906429568815, "loss": 2.4508, "step": 1792 }, { "epoch": 0.02, "learning_rate": 0.0001999051256961998, "loss": 2.4439, "step": 1800 }, { "epoch": 0.02, "learning_rate": 0.00019990381280660991, "loss": 2.4451, "step": 1808 }, { "epoch": 0.02, "learning_rate": 0.00019990249090017707, "loss": 2.4462, "step": 1816 }, { "epoch": 0.02, "learning_rate": 0.00019990115997703379, "loss": 2.4566, "step": 1824 }, { "epoch": 0.02, "learning_rate": 0.00019989982003731354, "loss": 2.4673, "step": 1832 }, { "epoch": 0.02, "learning_rate": 0.00019989847108115076, "loss": 2.4467, "step": 1840 }, { "epoch": 0.02, "learning_rate": 0.00019989711310868072, "loss": 2.4426, "step": 1848 }, { "epoch": 0.02, "learning_rate": 0.00019989574612003962, "loss": 2.4495, "step": 1856 }, { "epoch": 0.02, "learning_rate": 0.0001998943701153646, "loss": 2.434, "step": 1864 }, { "epoch": 0.02, "learning_rate": 0.00019989298509479357, "loss": 2.4699, "step": 1872 }, { "epoch": 0.02, "learning_rate": 0.00019989159105846555, "loss": 2.4647, "step": 1880 }, { "epoch": 0.02, "learning_rate": 0.00019989018800652025, "loss": 2.4523, "step": 1888 }, { "epoch": 0.02, "learning_rate": 0.00019988877593909844, "loss": 2.4627, "step": 1896 }, { "epoch": 0.02, "learning_rate": 0.00019988735485634179, "loss": 2.45, "step": 1904 }, { "epoch": 0.02, "learning_rate": 0.00019988592475839273, "loss": 2.4496, "step": 1912 }, { "epoch": 0.02, "learning_rate": 0.00019988448564539475, "loss": 2.4534, "step": 1920 }, { "epoch": 0.02, "learning_rate": 0.0001998830375174922, "loss": 2.4373, "step": 1928 }, { "epoch": 0.02, "learning_rate": 0.00019988158037483026, "loss": 2.4457, "step": 1936 }, { "epoch": 0.02, "learning_rate": 0.00019988011421755514, "loss": 2.4543, "step": 1944 }, { "epoch": 0.02, "learning_rate": 0.0001998786390458138, "loss": 2.447, "step": 1952 }, { "epoch": 0.02, "learning_rate": 0.0001998771548597543, "loss": 2.4593, "step": 1960 }, { "epoch": 0.02, "learning_rate": 0.0001998756616595254, "loss": 2.454, "step": 1968 }, { "epoch": 0.02, "learning_rate": 0.00019987415944527692, "loss": 2.4317, "step": 1976 }, { "epoch": 0.02, "learning_rate": 0.0001998726482171595, "loss": 2.4334, "step": 1984 }, { "epoch": 0.02, "learning_rate": 0.0001998711279753247, "loss": 2.4591, "step": 1992 }, { "epoch": 0.03, "learning_rate": 0.00019986959871992502, "loss": 2.449, "step": 2000 }, { "epoch": 0.03, "learning_rate": 0.0001998680604511138, "loss": 2.4296, "step": 2008 }, { "epoch": 0.03, "learning_rate": 0.00019986651316904536, "loss": 2.4508, "step": 2016 }, { "epoch": 0.03, "learning_rate": 0.0001998649568738748, "loss": 2.464, "step": 2024 }, { "epoch": 0.03, "learning_rate": 0.00019986339156575833, "loss": 2.4447, "step": 2032 }, { "epoch": 0.03, "learning_rate": 0.00019986181724485286, "loss": 2.4509, "step": 2040 }, { "epoch": 0.03, "learning_rate": 0.00019986023391131632, "loss": 2.4673, "step": 2048 }, { "epoch": 0.03, "learning_rate": 0.00019985864156530747, "loss": 2.4549, "step": 2056 }, { "epoch": 0.03, "learning_rate": 0.00019985704020698605, "loss": 2.4507, "step": 2064 }, { "epoch": 0.03, "learning_rate": 0.00019985542983651269, "loss": 2.4632, "step": 2072 }, { "epoch": 0.03, "learning_rate": 0.00019985381045404881, "loss": 2.4354, "step": 2080 }, { "epoch": 0.03, "learning_rate": 0.0001998521820597569, "loss": 2.4405, "step": 2088 }, { "epoch": 0.03, "learning_rate": 0.00019985054465380028, "loss": 2.44, "step": 2096 }, { "epoch": 0.03, "learning_rate": 0.0001998488982363431, "loss": 2.4376, "step": 2104 }, { "epoch": 0.03, "learning_rate": 0.0001998472428075506, "loss": 2.4441, "step": 2112 }, { "epoch": 0.03, "learning_rate": 0.00019984557836758872, "loss": 2.4635, "step": 2120 }, { "epoch": 0.03, "learning_rate": 0.00019984390491662447, "loss": 2.4606, "step": 2128 }, { "epoch": 0.03, "learning_rate": 0.00019984222245482557, "loss": 2.4428, "step": 2136 }, { "epoch": 0.03, "learning_rate": 0.00019984053098236087, "loss": 2.4565, "step": 2144 }, { "epoch": 0.03, "learning_rate": 0.00019983883049939994, "loss": 2.4409, "step": 2152 }, { "epoch": 0.03, "learning_rate": 0.0001998371210061134, "loss": 2.455, "step": 2160 }, { "epoch": 0.03, "learning_rate": 0.00019983540250267267, "loss": 2.4195, "step": 2168 }, { "epoch": 0.03, "learning_rate": 0.0001998336749892501, "loss": 2.4555, "step": 2176 }, { "epoch": 0.03, "learning_rate": 0.00019983193846601896, "loss": 2.4474, "step": 2184 }, { "epoch": 0.03, "learning_rate": 0.00019983019293315338, "loss": 2.4574, "step": 2192 }, { "epoch": 0.03, "learning_rate": 0.00019982843839082848, "loss": 2.4332, "step": 2200 }, { "epoch": 0.03, "learning_rate": 0.00019982667483922018, "loss": 2.4547, "step": 2208 }, { "epoch": 0.03, "learning_rate": 0.0001998249022785054, "loss": 2.4366, "step": 2216 }, { "epoch": 0.03, "learning_rate": 0.00019982312070886192, "loss": 2.4435, "step": 2224 }, { "epoch": 0.03, "learning_rate": 0.00019982133013046836, "loss": 2.4627, "step": 2232 }, { "epoch": 0.03, "learning_rate": 0.00019981953054350434, "loss": 2.4434, "step": 2240 }, { "epoch": 0.03, "learning_rate": 0.00019981772194815038, "loss": 2.4292, "step": 2248 }, { "epoch": 0.03, "learning_rate": 0.00019981590434458785, "loss": 2.452, "step": 2256 }, { "epoch": 0.03, "learning_rate": 0.000199814077732999, "loss": 2.4529, "step": 2264 }, { "epoch": 0.03, "learning_rate": 0.00019981224211356707, "loss": 2.4578, "step": 2272 }, { "epoch": 0.03, "learning_rate": 0.00019981039748647621, "loss": 2.4521, "step": 2280 }, { "epoch": 0.03, "learning_rate": 0.00019980854385191134, "loss": 2.4473, "step": 2288 }, { "epoch": 0.03, "learning_rate": 0.0001998066812100584, "loss": 2.4263, "step": 2296 }, { "epoch": 0.03, "learning_rate": 0.00019980480956110423, "loss": 2.446, "step": 2304 }, { "epoch": 0.03, "learning_rate": 0.00019980292890523654, "loss": 2.439, "step": 2312 }, { "epoch": 0.03, "learning_rate": 0.00019980103924264388, "loss": 2.4562, "step": 2320 }, { "epoch": 0.03, "learning_rate": 0.00019979914057351584, "loss": 2.4409, "step": 2328 }, { "epoch": 0.03, "learning_rate": 0.00019979723289804285, "loss": 2.4439, "step": 2336 }, { "epoch": 0.03, "learning_rate": 0.0001997953162164162, "loss": 2.4548, "step": 2344 }, { "epoch": 0.03, "learning_rate": 0.00019979339052882814, "loss": 2.4491, "step": 2352 }, { "epoch": 0.03, "learning_rate": 0.00019979145583547182, "loss": 2.4437, "step": 2360 }, { "epoch": 0.03, "learning_rate": 0.00019978951213654129, "loss": 2.4304, "step": 2368 }, { "epoch": 0.03, "learning_rate": 0.00019978755943223143, "loss": 2.4417, "step": 2376 }, { "epoch": 0.03, "learning_rate": 0.00019978559772273813, "loss": 2.4714, "step": 2384 }, { "epoch": 0.03, "learning_rate": 0.00019978362700825815, "loss": 2.4345, "step": 2392 }, { "epoch": 0.03, "learning_rate": 0.0001997816472889891, "loss": 2.4435, "step": 2400 }, { "epoch": 0.03, "learning_rate": 0.00019977965856512954, "loss": 2.4371, "step": 2408 }, { "epoch": 0.03, "learning_rate": 0.000199777660836879, "loss": 2.4583, "step": 2416 }, { "epoch": 0.03, "learning_rate": 0.00019977565410443776, "loss": 2.4617, "step": 2424 }, { "epoch": 0.03, "learning_rate": 0.0001997736383680071, "loss": 2.4378, "step": 2432 }, { "epoch": 0.03, "learning_rate": 0.0001997716136277892, "loss": 2.4415, "step": 2440 }, { "epoch": 0.03, "learning_rate": 0.00019976957988398713, "loss": 2.4411, "step": 2448 }, { "epoch": 0.03, "learning_rate": 0.00019976753713680487, "loss": 2.4488, "step": 2456 }, { "epoch": 0.03, "learning_rate": 0.00019976548538644729, "loss": 2.4531, "step": 2464 }, { "epoch": 0.03, "learning_rate": 0.00019976342463312016, "loss": 2.4361, "step": 2472 }, { "epoch": 0.03, "learning_rate": 0.00019976135487703015, "loss": 2.4234, "step": 2480 }, { "epoch": 0.03, "learning_rate": 0.00019975927611838487, "loss": 2.4434, "step": 2488 }, { "epoch": 0.03, "learning_rate": 0.0001997571883573928, "loss": 2.4423, "step": 2496 }, { "epoch": 0.03, "learning_rate": 0.00019975509159426334, "loss": 2.4479, "step": 2504 }, { "epoch": 0.03, "learning_rate": 0.00019975298582920677, "loss": 2.4344, "step": 2512 }, { "epoch": 0.03, "learning_rate": 0.00019975087106243426, "loss": 2.4431, "step": 2520 }, { "epoch": 0.03, "learning_rate": 0.000199748747294158, "loss": 2.4385, "step": 2528 }, { "epoch": 0.03, "learning_rate": 0.00019974661452459088, "loss": 2.4388, "step": 2536 }, { "epoch": 0.03, "learning_rate": 0.00019974447275394687, "loss": 2.4516, "step": 2544 }, { "epoch": 0.03, "learning_rate": 0.00019974232198244078, "loss": 2.4632, "step": 2552 }, { "epoch": 0.03, "learning_rate": 0.00019974016221028826, "loss": 2.4615, "step": 2560 }, { "epoch": 0.03, "learning_rate": 0.00019973799343770603, "loss": 2.4501, "step": 2568 }, { "epoch": 0.03, "learning_rate": 0.0001997358156649115, "loss": 2.4451, "step": 2576 }, { "epoch": 0.03, "learning_rate": 0.00019973362889212312, "loss": 2.4358, "step": 2584 }, { "epoch": 0.03, "learning_rate": 0.00019973143311956024, "loss": 2.4408, "step": 2592 }, { "epoch": 0.03, "learning_rate": 0.00019972922834744308, "loss": 2.4423, "step": 2600 }, { "epoch": 0.03, "learning_rate": 0.00019972701457599272, "loss": 2.4389, "step": 2608 }, { "epoch": 0.03, "learning_rate": 0.00019972479180543123, "loss": 2.4418, "step": 2616 }, { "epoch": 0.03, "learning_rate": 0.00019972256003598153, "loss": 2.4507, "step": 2624 }, { "epoch": 0.03, "learning_rate": 0.00019972031926786745, "loss": 2.4392, "step": 2632 }, { "epoch": 0.03, "learning_rate": 0.00019971806950131376, "loss": 2.4504, "step": 2640 }, { "epoch": 0.03, "learning_rate": 0.00019971581073654603, "loss": 2.4225, "step": 2648 }, { "epoch": 0.03, "learning_rate": 0.00019971354297379086, "loss": 2.462, "step": 2656 }, { "epoch": 0.03, "learning_rate": 0.00019971126621327564, "loss": 2.4421, "step": 2664 }, { "epoch": 0.03, "learning_rate": 0.0001997089804552288, "loss": 2.4392, "step": 2672 }, { "epoch": 0.03, "learning_rate": 0.00019970668569987951, "loss": 2.4402, "step": 2680 }, { "epoch": 0.03, "learning_rate": 0.00019970438194745797, "loss": 2.443, "step": 2688 }, { "epoch": 0.03, "learning_rate": 0.00019970206919819522, "loss": 2.4299, "step": 2696 }, { "epoch": 0.03, "learning_rate": 0.0001996997474523232, "loss": 2.4463, "step": 2704 }, { "epoch": 0.03, "learning_rate": 0.00019969741671007477, "loss": 2.4449, "step": 2712 }, { "epoch": 0.03, "learning_rate": 0.0001996950769716837, "loss": 2.4218, "step": 2720 }, { "epoch": 0.03, "learning_rate": 0.00019969272823738466, "loss": 2.4347, "step": 2728 }, { "epoch": 0.03, "learning_rate": 0.0001996903705074132, "loss": 2.4463, "step": 2736 }, { "epoch": 0.03, "learning_rate": 0.00019968800378200577, "loss": 2.4388, "step": 2744 }, { "epoch": 0.03, "learning_rate": 0.0001996856280613998, "loss": 2.4269, "step": 2752 }, { "epoch": 0.03, "learning_rate": 0.0001996832433458335, "loss": 2.4495, "step": 2760 }, { "epoch": 0.03, "learning_rate": 0.00019968084963554604, "loss": 2.4226, "step": 2768 }, { "epoch": 0.03, "learning_rate": 0.00019967844693077758, "loss": 2.4418, "step": 2776 }, { "epoch": 0.03, "learning_rate": 0.00019967603523176898, "loss": 2.4565, "step": 2784 }, { "epoch": 0.03, "learning_rate": 0.0001996736145387622, "loss": 2.4539, "step": 2792 }, { "epoch": 0.04, "learning_rate": 0.000199671184852, "loss": 2.4393, "step": 2800 }, { "epoch": 0.04, "learning_rate": 0.0001996687461717261, "loss": 2.4553, "step": 2808 }, { "epoch": 0.04, "learning_rate": 0.000199666298498185, "loss": 2.4382, "step": 2816 }, { "epoch": 0.04, "learning_rate": 0.00019966384183162225, "loss": 2.427, "step": 2824 }, { "epoch": 0.04, "learning_rate": 0.00019966137617228422, "loss": 2.4414, "step": 2832 }, { "epoch": 0.04, "learning_rate": 0.00019965890152041823, "loss": 2.4332, "step": 2840 }, { "epoch": 0.04, "learning_rate": 0.00019965641787627244, "loss": 2.4351, "step": 2848 }, { "epoch": 0.04, "learning_rate": 0.00019965392524009599, "loss": 2.4507, "step": 2856 }, { "epoch": 0.04, "learning_rate": 0.0001996514236121388, "loss": 2.4253, "step": 2864 }, { "epoch": 0.04, "learning_rate": 0.00019964891299265188, "loss": 2.45, "step": 2872 }, { "epoch": 0.04, "learning_rate": 0.0001996463933818869, "loss": 2.4332, "step": 2880 }, { "epoch": 0.04, "learning_rate": 0.00019964386478009665, "loss": 2.444, "step": 2888 }, { "epoch": 0.04, "learning_rate": 0.0001996413271875347, "loss": 2.44, "step": 2896 }, { "epoch": 0.04, "learning_rate": 0.0001996387806044556, "loss": 2.4632, "step": 2904 }, { "epoch": 0.04, "learning_rate": 0.00019963622503111467, "loss": 2.4233, "step": 2912 }, { "epoch": 0.04, "learning_rate": 0.00019963366046776834, "loss": 2.4413, "step": 2920 }, { "epoch": 0.04, "learning_rate": 0.00019963108691467373, "loss": 2.4417, "step": 2928 }, { "epoch": 0.04, "learning_rate": 0.00019962850437208897, "loss": 2.4445, "step": 2936 }, { "epoch": 0.04, "learning_rate": 0.0001996259128402731, "loss": 2.4397, "step": 2944 }, { "epoch": 0.04, "learning_rate": 0.00019962331231948604, "loss": 2.4274, "step": 2952 }, { "epoch": 0.04, "learning_rate": 0.00019962070280998858, "loss": 2.4464, "step": 2960 }, { "epoch": 0.04, "learning_rate": 0.0001996180843120424, "loss": 2.4552, "step": 2968 }, { "epoch": 0.04, "learning_rate": 0.0001996154568259102, "loss": 2.4477, "step": 2976 }, { "epoch": 0.04, "learning_rate": 0.00019961282035185546, "loss": 2.4465, "step": 2984 }, { "epoch": 0.04, "learning_rate": 0.00019961017489014265, "loss": 2.4439, "step": 2992 }, { "epoch": 0.04, "learning_rate": 0.000199607520441037, "loss": 2.4297, "step": 3000 }, { "epoch": 0.04, "learning_rate": 0.00019960485700480486, "loss": 2.4379, "step": 3008 }, { "epoch": 0.04, "learning_rate": 0.00019960218458171323, "loss": 2.4388, "step": 3016 }, { "epoch": 0.04, "learning_rate": 0.00019959950317203023, "loss": 2.4465, "step": 3024 }, { "epoch": 0.04, "learning_rate": 0.00019959681277602475, "loss": 2.4364, "step": 3032 }, { "epoch": 0.04, "learning_rate": 0.00019959411339396665, "loss": 2.4373, "step": 3040 }, { "epoch": 0.04, "learning_rate": 0.00019959140502612664, "loss": 2.4383, "step": 3048 }, { "epoch": 0.04, "learning_rate": 0.00019958868767277634, "loss": 2.4286, "step": 3056 }, { "epoch": 0.04, "learning_rate": 0.00019958596133418831, "loss": 2.4224, "step": 3064 }, { "epoch": 0.04, "learning_rate": 0.000199583226010636, "loss": 2.4136, "step": 3072 }, { "epoch": 0.04, "learning_rate": 0.00019958048170239372, "loss": 2.4579, "step": 3080 }, { "epoch": 0.04, "learning_rate": 0.00019957772840973668, "loss": 2.4361, "step": 3088 }, { "epoch": 0.04, "learning_rate": 0.00019957496613294112, "loss": 2.4405, "step": 3096 }, { "epoch": 0.04, "learning_rate": 0.00019957219487228397, "loss": 2.452, "step": 3104 }, { "epoch": 0.04, "learning_rate": 0.00019956941462804322, "loss": 2.4343, "step": 3112 }, { "epoch": 0.04, "learning_rate": 0.00019956662540049773, "loss": 2.4397, "step": 3120 }, { "epoch": 0.04, "learning_rate": 0.00019956382718992722, "loss": 2.446, "step": 3128 }, { "epoch": 0.04, "learning_rate": 0.00019956101999661234, "loss": 2.4348, "step": 3136 }, { "epoch": 0.04, "learning_rate": 0.0001995582038208346, "loss": 2.435, "step": 3144 }, { "epoch": 0.04, "learning_rate": 0.00019955537866287655, "loss": 2.4519, "step": 3152 }, { "epoch": 0.04, "learning_rate": 0.00019955254452302143, "loss": 2.4423, "step": 3160 }, { "epoch": 0.04, "learning_rate": 0.00019954970140155355, "loss": 2.4262, "step": 3168 }, { "epoch": 0.04, "learning_rate": 0.000199546849298758, "loss": 2.4474, "step": 3176 }, { "epoch": 0.04, "learning_rate": 0.00019954398821492086, "loss": 2.4424, "step": 3184 }, { "epoch": 0.04, "learning_rate": 0.0001995411181503291, "loss": 2.4477, "step": 3192 }, { "epoch": 0.04, "learning_rate": 0.00019953823910527058, "loss": 2.4423, "step": 3200 }, { "epoch": 0.04, "learning_rate": 0.000199535351080034, "loss": 2.4388, "step": 3208 }, { "epoch": 0.04, "learning_rate": 0.00019953245407490906, "loss": 2.433, "step": 3216 }, { "epoch": 0.04, "learning_rate": 0.00019952954809018627, "loss": 2.4421, "step": 3224 }, { "epoch": 0.04, "learning_rate": 0.00019952663312615716, "loss": 2.4444, "step": 3232 }, { "epoch": 0.04, "learning_rate": 0.00019952370918311402, "loss": 2.4207, "step": 3240 }, { "epoch": 0.04, "learning_rate": 0.00019952077626135005, "loss": 2.4408, "step": 3248 }, { "epoch": 0.04, "learning_rate": 0.00019951783436115953, "loss": 2.4483, "step": 3256 }, { "epoch": 0.04, "learning_rate": 0.00019951488348283745, "loss": 2.4304, "step": 3264 }, { "epoch": 0.04, "learning_rate": 0.0001995119236266798, "loss": 2.4315, "step": 3272 }, { "epoch": 0.04, "learning_rate": 0.0001995089547929834, "loss": 2.4186, "step": 3280 }, { "epoch": 0.04, "learning_rate": 0.000199505976982046, "loss": 2.4568, "step": 3288 }, { "epoch": 0.04, "learning_rate": 0.0001995029901941663, "loss": 2.4397, "step": 3296 }, { "epoch": 0.04, "learning_rate": 0.00019949999442964384, "loss": 2.413, "step": 3304 }, { "epoch": 0.04, "learning_rate": 0.00019949698968877902, "loss": 2.4338, "step": 3312 }, { "epoch": 0.04, "learning_rate": 0.00019949397597187333, "loss": 2.4338, "step": 3320 }, { "epoch": 0.04, "learning_rate": 0.0001994909532792289, "loss": 2.4406, "step": 3328 }, { "epoch": 0.04, "learning_rate": 0.00019948792161114895, "loss": 2.4424, "step": 3336 }, { "epoch": 0.04, "learning_rate": 0.00019948488096793753, "loss": 2.4435, "step": 3344 }, { "epoch": 0.04, "learning_rate": 0.00019948183134989962, "loss": 2.4157, "step": 3352 }, { "epoch": 0.04, "learning_rate": 0.000199478772757341, "loss": 2.4086, "step": 3360 }, { "epoch": 0.04, "learning_rate": 0.00019947570519056855, "loss": 2.4379, "step": 3368 }, { "epoch": 0.04, "learning_rate": 0.00019947262864988984, "loss": 2.4355, "step": 3376 }, { "epoch": 0.04, "learning_rate": 0.00019946954313561347, "loss": 2.4351, "step": 3384 }, { "epoch": 0.04, "learning_rate": 0.00019946644864804886, "loss": 2.4495, "step": 3392 }, { "epoch": 0.04, "learning_rate": 0.0001994633451875064, "loss": 2.4345, "step": 3400 }, { "epoch": 0.04, "learning_rate": 0.00019946023275429735, "loss": 2.4333, "step": 3408 }, { "epoch": 0.04, "learning_rate": 0.0001994571113487339, "loss": 2.4329, "step": 3416 }, { "epoch": 0.04, "learning_rate": 0.00019945398097112905, "loss": 2.4431, "step": 3424 }, { "epoch": 0.04, "learning_rate": 0.00019945084162179675, "loss": 2.4366, "step": 3432 }, { "epoch": 0.04, "learning_rate": 0.0001994476933010519, "loss": 2.4247, "step": 3440 }, { "epoch": 0.04, "learning_rate": 0.00019944453600921028, "loss": 2.4589, "step": 3448 }, { "epoch": 0.04, "learning_rate": 0.00019944136974658848, "loss": 2.4422, "step": 3456 }, { "epoch": 0.04, "learning_rate": 0.00019943819451350415, "loss": 2.4318, "step": 3464 }, { "epoch": 0.04, "learning_rate": 0.00019943501031027564, "loss": 2.4404, "step": 3472 }, { "epoch": 0.04, "learning_rate": 0.0001994318171372224, "loss": 2.4272, "step": 3480 }, { "epoch": 0.04, "learning_rate": 0.00019942861499466465, "loss": 2.4378, "step": 3488 }, { "epoch": 0.04, "learning_rate": 0.00019942540388292353, "loss": 2.445, "step": 3496 }, { "epoch": 0.04, "learning_rate": 0.00019942218380232112, "loss": 2.4262, "step": 3504 }, { "epoch": 0.04, "learning_rate": 0.00019941895475318039, "loss": 2.4483, "step": 3512 }, { "epoch": 0.04, "learning_rate": 0.00019941571673582516, "loss": 2.4484, "step": 3520 }, { "epoch": 0.04, "learning_rate": 0.00019941246975058017, "loss": 2.3924, "step": 3528 }, { "epoch": 0.04, "learning_rate": 0.0001994092137977711, "loss": 2.4438, "step": 3536 }, { "epoch": 0.04, "learning_rate": 0.00019940594887772454, "loss": 2.4381, "step": 3544 }, { "epoch": 0.04, "learning_rate": 0.0001994026749907679, "loss": 2.426, "step": 3552 }, { "epoch": 0.04, "learning_rate": 0.00019939939213722957, "loss": 2.4433, "step": 3560 }, { "epoch": 0.04, "learning_rate": 0.00019939610031743872, "loss": 2.4425, "step": 3568 }, { "epoch": 0.04, "learning_rate": 0.00019939279953172558, "loss": 2.4255, "step": 3576 }, { "epoch": 0.04, "learning_rate": 0.00019938948978042117, "loss": 2.4279, "step": 3584 }, { "epoch": 0.04, "learning_rate": 0.00019938617106385746, "loss": 2.4457, "step": 3592 }, { "epoch": 0.04, "learning_rate": 0.00019938284338236726, "loss": 2.4399, "step": 3600 }, { "epoch": 0.05, "learning_rate": 0.00019937950673628435, "loss": 2.4434, "step": 3608 }, { "epoch": 0.05, "learning_rate": 0.0001993761611259434, "loss": 2.4532, "step": 3616 }, { "epoch": 0.05, "learning_rate": 0.00019937280655167984, "loss": 2.4479, "step": 3624 }, { "epoch": 0.05, "learning_rate": 0.00019936944301383026, "loss": 2.4249, "step": 3632 }, { "epoch": 0.05, "learning_rate": 0.00019936607051273194, "loss": 2.4197, "step": 3640 }, { "epoch": 0.05, "learning_rate": 0.0001993626890487231, "loss": 2.4326, "step": 3648 }, { "epoch": 0.05, "learning_rate": 0.0001993592986221429, "loss": 2.421, "step": 3656 }, { "epoch": 0.05, "learning_rate": 0.00019935589923333142, "loss": 2.4447, "step": 3664 }, { "epoch": 0.05, "learning_rate": 0.00019935249088262955, "loss": 2.4518, "step": 3672 }, { "epoch": 0.05, "learning_rate": 0.00019934907357037912, "loss": 2.4214, "step": 3680 }, { "epoch": 0.05, "learning_rate": 0.00019934564729692293, "loss": 2.4416, "step": 3688 }, { "epoch": 0.05, "learning_rate": 0.00019934221206260457, "loss": 2.4305, "step": 3696 }, { "epoch": 0.05, "learning_rate": 0.00019933876786776855, "loss": 2.4332, "step": 3704 }, { "epoch": 0.05, "learning_rate": 0.00019933531471276036, "loss": 2.4378, "step": 3712 }, { "epoch": 0.05, "learning_rate": 0.0001993318525979263, "loss": 2.4375, "step": 3720 }, { "epoch": 0.05, "learning_rate": 0.00019932838152361362, "loss": 2.4358, "step": 3728 }, { "epoch": 0.05, "learning_rate": 0.0001993249014901704, "loss": 2.4444, "step": 3736 }, { "epoch": 0.05, "learning_rate": 0.00019932141249794574, "loss": 2.4217, "step": 3744 }, { "epoch": 0.05, "learning_rate": 0.00019931791454728953, "loss": 2.4397, "step": 3752 }, { "epoch": 0.05, "learning_rate": 0.00019931440763855255, "loss": 2.4435, "step": 3760 }, { "epoch": 0.05, "learning_rate": 0.00019931089177208658, "loss": 2.441, "step": 3768 }, { "epoch": 0.05, "learning_rate": 0.00019930736694824425, "loss": 2.4324, "step": 3776 }, { "epoch": 0.05, "learning_rate": 0.00019930383316737907, "loss": 2.439, "step": 3784 }, { "epoch": 0.05, "learning_rate": 0.00019930029042984545, "loss": 2.4413, "step": 3792 }, { "epoch": 0.05, "learning_rate": 0.00019929673873599865, "loss": 2.4272, "step": 3800 }, { "epoch": 0.05, "learning_rate": 0.00019929317808619498, "loss": 2.4445, "step": 3808 }, { "epoch": 0.05, "learning_rate": 0.0001992896084807915, "loss": 2.4309, "step": 3816 }, { "epoch": 0.05, "learning_rate": 0.00019928602992014624, "loss": 2.4553, "step": 3824 }, { "epoch": 0.05, "learning_rate": 0.00019928244240461807, "loss": 2.4391, "step": 3832 }, { "epoch": 0.05, "learning_rate": 0.00019927884593456686, "loss": 2.4331, "step": 3840 }, { "epoch": 0.05, "learning_rate": 0.00019927524051035328, "loss": 2.4184, "step": 3848 }, { "epoch": 0.05, "learning_rate": 0.00019927162613233895, "loss": 2.4233, "step": 3856 }, { "epoch": 0.05, "learning_rate": 0.00019926800280088634, "loss": 2.4348, "step": 3864 }, { "epoch": 0.05, "learning_rate": 0.00019926437051635888, "loss": 2.4239, "step": 3872 }, { "epoch": 0.05, "learning_rate": 0.00019926072927912086, "loss": 2.4297, "step": 3880 }, { "epoch": 0.05, "learning_rate": 0.00019925707908953746, "loss": 2.4333, "step": 3888 }, { "epoch": 0.05, "learning_rate": 0.0001992534199479748, "loss": 2.4244, "step": 3896 }, { "epoch": 0.05, "learning_rate": 0.00019924975185479986, "loss": 2.4289, "step": 3904 }, { "epoch": 0.05, "learning_rate": 0.0001992460748103805, "loss": 2.4404, "step": 3912 }, { "epoch": 0.05, "learning_rate": 0.00019924238881508554, "loss": 2.4309, "step": 3920 }, { "epoch": 0.05, "learning_rate": 0.0001992386938692847, "loss": 2.4258, "step": 3928 }, { "epoch": 0.05, "learning_rate": 0.00019923498997334845, "loss": 2.4052, "step": 3936 }, { "epoch": 0.05, "learning_rate": 0.0001992312771276484, "loss": 2.4343, "step": 3944 }, { "epoch": 0.05, "learning_rate": 0.0001992275553325568, "loss": 2.4511, "step": 3952 }, { "epoch": 0.05, "learning_rate": 0.00019922382458844703, "loss": 2.4371, "step": 3960 }, { "epoch": 0.05, "learning_rate": 0.00019922008489569327, "loss": 2.4251, "step": 3968 }, { "epoch": 0.05, "learning_rate": 0.00019921633625467045, "loss": 2.4434, "step": 3976 }, { "epoch": 0.05, "learning_rate": 0.0001992125786657547, "loss": 2.4362, "step": 3984 }, { "epoch": 0.05, "learning_rate": 0.0001992088121293228, "loss": 2.433, "step": 3992 }, { "epoch": 0.05, "learning_rate": 0.00019920503664575253, "loss": 2.446, "step": 4000 }, { "epoch": 0.05, "learning_rate": 0.00019920125221542254, "loss": 2.4311, "step": 4008 }, { "epoch": 0.05, "learning_rate": 0.00019919745883871238, "loss": 2.4436, "step": 4016 }, { "epoch": 0.05, "learning_rate": 0.00019919365651600257, "loss": 2.4289, "step": 4024 }, { "epoch": 0.05, "learning_rate": 0.00019918984524767435, "loss": 2.4192, "step": 4032 }, { "epoch": 0.05, "learning_rate": 0.00019918602503411005, "loss": 2.4188, "step": 4040 }, { "epoch": 0.05, "learning_rate": 0.0001991821958756928, "loss": 2.4274, "step": 4048 }, { "epoch": 0.05, "learning_rate": 0.00019917835777280666, "loss": 2.4346, "step": 4056 }, { "epoch": 0.05, "learning_rate": 0.0001991745107258365, "loss": 2.4132, "step": 4064 }, { "epoch": 0.05, "learning_rate": 0.00019917065473516824, "loss": 2.431, "step": 4072 }, { "epoch": 0.05, "learning_rate": 0.00019916678980118859, "loss": 2.4237, "step": 4080 }, { "epoch": 0.05, "learning_rate": 0.00019916291592428514, "loss": 2.4356, "step": 4088 }, { "epoch": 0.05, "learning_rate": 0.00019915903310484644, "loss": 2.4351, "step": 4096 }, { "epoch": 0.05, "learning_rate": 0.00019915514134326195, "loss": 2.4252, "step": 4104 }, { "epoch": 0.05, "learning_rate": 0.00019915124063992195, "loss": 2.4243, "step": 4112 }, { "epoch": 0.05, "learning_rate": 0.0001991473309952177, "loss": 2.4173, "step": 4120 }, { "epoch": 0.05, "learning_rate": 0.00019914341240954126, "loss": 2.438, "step": 4128 }, { "epoch": 0.05, "learning_rate": 0.00019913948488328566, "loss": 2.4144, "step": 4136 }, { "epoch": 0.05, "learning_rate": 0.00019913554841684484, "loss": 2.4277, "step": 4144 }, { "epoch": 0.05, "learning_rate": 0.00019913160301061357, "loss": 2.4127, "step": 4152 }, { "epoch": 0.05, "learning_rate": 0.00019912764866498756, "loss": 2.446, "step": 4160 }, { "epoch": 0.05, "learning_rate": 0.00019912368538036344, "loss": 2.4476, "step": 4168 }, { "epoch": 0.05, "learning_rate": 0.00019911971315713866, "loss": 2.4323, "step": 4176 }, { "epoch": 0.05, "learning_rate": 0.00019911573199571166, "loss": 2.4243, "step": 4184 }, { "epoch": 0.05, "learning_rate": 0.00019911174189648167, "loss": 2.4372, "step": 4192 }, { "epoch": 0.05, "learning_rate": 0.0001991077428598489, "loss": 2.4262, "step": 4200 }, { "epoch": 0.05, "learning_rate": 0.00019910373488621444, "loss": 2.4549, "step": 4208 }, { "epoch": 0.05, "learning_rate": 0.00019909971797598026, "loss": 2.4264, "step": 4216 }, { "epoch": 0.05, "learning_rate": 0.00019909569212954925, "loss": 2.4239, "step": 4224 }, { "epoch": 0.05, "learning_rate": 0.00019909165734732513, "loss": 2.4095, "step": 4232 }, { "epoch": 0.05, "learning_rate": 0.00019908761362971263, "loss": 2.4324, "step": 4240 }, { "epoch": 0.05, "learning_rate": 0.00019908356097711723, "loss": 2.4469, "step": 4248 }, { "epoch": 0.05, "learning_rate": 0.0001990794993899455, "loss": 2.4226, "step": 4256 }, { "epoch": 0.05, "learning_rate": 0.00019907542886860472, "loss": 2.4307, "step": 4264 }, { "epoch": 0.05, "learning_rate": 0.00019907134941350314, "loss": 2.4383, "step": 4272 }, { "epoch": 0.05, "learning_rate": 0.00019906726102504995, "loss": 2.4283, "step": 4280 }, { "epoch": 0.05, "learning_rate": 0.0001990631637036551, "loss": 2.4128, "step": 4288 }, { "epoch": 0.05, "learning_rate": 0.00019905905744972964, "loss": 2.4227, "step": 4296 }, { "epoch": 0.05, "learning_rate": 0.00019905494226368534, "loss": 2.41, "step": 4304 }, { "epoch": 0.05, "learning_rate": 0.00019905081814593494, "loss": 2.4338, "step": 4312 }, { "epoch": 0.05, "learning_rate": 0.0001990466850968921, "loss": 2.4254, "step": 4320 }, { "epoch": 0.05, "learning_rate": 0.00019904254311697126, "loss": 2.4201, "step": 4328 }, { "epoch": 0.05, "learning_rate": 0.00019903839220658791, "loss": 2.423, "step": 4336 }, { "epoch": 0.05, "learning_rate": 0.00019903423236615836, "loss": 2.4335, "step": 4344 }, { "epoch": 0.05, "learning_rate": 0.00019903006359609976, "loss": 2.4316, "step": 4352 }, { "epoch": 0.05, "learning_rate": 0.0001990258858968303, "loss": 2.4102, "step": 4360 }, { "epoch": 0.05, "learning_rate": 0.00019902169926876894, "loss": 2.4341, "step": 4368 }, { "epoch": 0.05, "learning_rate": 0.0001990175037123355, "loss": 2.4377, "step": 4376 }, { "epoch": 0.05, "learning_rate": 0.00019901329922795088, "loss": 2.4223, "step": 4384 }, { "epoch": 0.05, "learning_rate": 0.00019900908581603672, "loss": 2.4407, "step": 4392 }, { "epoch": 0.06, "learning_rate": 0.0001990048634770156, "loss": 2.4118, "step": 4400 }, { "epoch": 0.06, "learning_rate": 0.00019900063221131104, "loss": 2.4226, "step": 4408 }, { "epoch": 0.06, "learning_rate": 0.00019899639201934733, "loss": 2.4124, "step": 4416 }, { "epoch": 0.06, "learning_rate": 0.0001989921429015498, "loss": 2.4221, "step": 4424 }, { "epoch": 0.06, "learning_rate": 0.0001989878848583446, "loss": 2.4428, "step": 4432 }, { "epoch": 0.06, "learning_rate": 0.00019898361789015879, "loss": 2.433, "step": 4440 }, { "epoch": 0.06, "learning_rate": 0.00019897934199742027, "loss": 2.4261, "step": 4448 }, { "epoch": 0.06, "learning_rate": 0.00019897505718055798, "loss": 2.443, "step": 4456 }, { "epoch": 0.06, "learning_rate": 0.0001989707634400016, "loss": 2.4349, "step": 4464 }, { "epoch": 0.06, "learning_rate": 0.00019896646077618174, "loss": 2.4319, "step": 4472 }, { "epoch": 0.06, "learning_rate": 0.00019896214918953002, "loss": 2.4292, "step": 4480 }, { "epoch": 0.06, "learning_rate": 0.00019895782868047885, "loss": 2.4261, "step": 4488 }, { "epoch": 0.06, "learning_rate": 0.00019895349924946146, "loss": 2.4266, "step": 4496 }, { "epoch": 0.06, "learning_rate": 0.0001989491608969122, "loss": 2.4458, "step": 4504 }, { "epoch": 0.06, "learning_rate": 0.00019894481362326606, "loss": 2.4249, "step": 4512 }, { "epoch": 0.06, "learning_rate": 0.00019894045742895912, "loss": 2.4271, "step": 4520 }, { "epoch": 0.06, "learning_rate": 0.0001989360923144283, "loss": 2.44, "step": 4528 }, { "epoch": 0.06, "learning_rate": 0.0001989317182801113, "loss": 2.4125, "step": 4536 }, { "epoch": 0.06, "learning_rate": 0.00019892733532644692, "loss": 2.4101, "step": 4544 }, { "epoch": 0.06, "learning_rate": 0.00019892294345387468, "loss": 2.4481, "step": 4552 }, { "epoch": 0.06, "learning_rate": 0.00019891854266283507, "loss": 2.4439, "step": 4560 }, { "epoch": 0.06, "learning_rate": 0.00019891413295376948, "loss": 2.4261, "step": 4568 }, { "epoch": 0.06, "learning_rate": 0.00019890971432712018, "loss": 2.4237, "step": 4576 }, { "epoch": 0.06, "learning_rate": 0.00019890528678333033, "loss": 2.4333, "step": 4584 }, { "epoch": 0.06, "learning_rate": 0.00019890085032284394, "loss": 2.4333, "step": 4592 }, { "epoch": 0.06, "learning_rate": 0.00019889640494610603, "loss": 2.4332, "step": 4600 }, { "epoch": 0.06, "learning_rate": 0.0001988919506535624, "loss": 2.4348, "step": 4608 }, { "epoch": 0.06, "learning_rate": 0.00019888748744565984, "loss": 2.3965, "step": 4616 }, { "epoch": 0.06, "learning_rate": 0.00019888301532284592, "loss": 2.441, "step": 4624 }, { "epoch": 0.06, "learning_rate": 0.00019887853428556923, "loss": 2.4317, "step": 4632 }, { "epoch": 0.06, "learning_rate": 0.00019887404433427917, "loss": 2.4223, "step": 4640 }, { "epoch": 0.06, "learning_rate": 0.000198869545469426, "loss": 2.421, "step": 4648 }, { "epoch": 0.06, "learning_rate": 0.000198865037691461, "loss": 2.4406, "step": 4656 }, { "epoch": 0.06, "learning_rate": 0.0001988605210008363, "loss": 2.449, "step": 4664 }, { "epoch": 0.06, "learning_rate": 0.0001988559953980048, "loss": 2.4437, "step": 4672 }, { "epoch": 0.06, "learning_rate": 0.0001988514608834205, "loss": 2.4063, "step": 4680 }, { "epoch": 0.06, "learning_rate": 0.00019884691745753808, "loss": 2.4317, "step": 4688 }, { "epoch": 0.06, "learning_rate": 0.00019884236512081332, "loss": 2.4154, "step": 4696 }, { "epoch": 0.06, "learning_rate": 0.00019883780387370273, "loss": 2.4344, "step": 4704 }, { "epoch": 0.06, "learning_rate": 0.0001988332337166638, "loss": 2.4386, "step": 4712 }, { "epoch": 0.06, "learning_rate": 0.00019882865465015487, "loss": 2.4452, "step": 4720 }, { "epoch": 0.06, "learning_rate": 0.00019882406667463522, "loss": 2.4318, "step": 4728 }, { "epoch": 0.06, "learning_rate": 0.000198819469790565, "loss": 2.425, "step": 4736 }, { "epoch": 0.06, "learning_rate": 0.00019881486399840522, "loss": 2.4279, "step": 4744 }, { "epoch": 0.06, "learning_rate": 0.00019881024929861786, "loss": 2.4195, "step": 4752 }, { "epoch": 0.06, "learning_rate": 0.00019880562569166567, "loss": 2.4193, "step": 4760 }, { "epoch": 0.06, "learning_rate": 0.00019880099317801247, "loss": 2.4098, "step": 4768 }, { "epoch": 0.06, "learning_rate": 0.0001987963517581228, "loss": 2.4202, "step": 4776 }, { "epoch": 0.06, "learning_rate": 0.0001987917014324622, "loss": 2.4201, "step": 4784 }, { "epoch": 0.06, "learning_rate": 0.00019878704220149706, "loss": 2.4045, "step": 4792 }, { "epoch": 0.06, "learning_rate": 0.00019878237406569473, "loss": 2.4389, "step": 4800 }, { "epoch": 0.06, "learning_rate": 0.0001987776970255233, "loss": 2.4165, "step": 4808 }, { "epoch": 0.06, "learning_rate": 0.00019877301108145193, "loss": 2.4148, "step": 4816 }, { "epoch": 0.06, "learning_rate": 0.00019876831623395053, "loss": 2.4255, "step": 4824 }, { "epoch": 0.06, "learning_rate": 0.00019876361248349003, "loss": 2.422, "step": 4832 }, { "epoch": 0.06, "learning_rate": 0.00019875889983054213, "loss": 2.4315, "step": 4840 }, { "epoch": 0.06, "learning_rate": 0.00019875417827557956, "loss": 2.4249, "step": 4848 }, { "epoch": 0.06, "learning_rate": 0.00019874944781907578, "loss": 2.4238, "step": 4856 }, { "epoch": 0.06, "learning_rate": 0.0001987447084615053, "loss": 2.4289, "step": 4864 }, { "epoch": 0.06, "learning_rate": 0.00019873996020334337, "loss": 2.4268, "step": 4872 }, { "epoch": 0.06, "learning_rate": 0.00019873520304506632, "loss": 2.4279, "step": 4880 }, { "epoch": 0.06, "learning_rate": 0.00019873043698715115, "loss": 2.4372, "step": 4888 }, { "epoch": 0.06, "learning_rate": 0.00019872566203007596, "loss": 2.4103, "step": 4896 }, { "epoch": 0.06, "learning_rate": 0.00019872087817431958, "loss": 2.4103, "step": 4904 }, { "epoch": 0.06, "learning_rate": 0.00019871608542036188, "loss": 2.4324, "step": 4912 }, { "epoch": 0.06, "learning_rate": 0.00019871128376868348, "loss": 2.4135, "step": 4920 }, { "epoch": 0.06, "learning_rate": 0.000198706473219766, "loss": 2.4204, "step": 4928 }, { "epoch": 0.06, "learning_rate": 0.00019870165377409188, "loss": 2.4385, "step": 4936 }, { "epoch": 0.06, "learning_rate": 0.0001986968254321445, "loss": 2.4291, "step": 4944 }, { "epoch": 0.06, "learning_rate": 0.00019869198819440814, "loss": 2.4131, "step": 4952 }, { "epoch": 0.06, "learning_rate": 0.00019868714206136787, "loss": 2.4162, "step": 4960 }, { "epoch": 0.06, "learning_rate": 0.00019868228703350983, "loss": 2.4106, "step": 4968 }, { "epoch": 0.06, "learning_rate": 0.00019867742311132088, "loss": 2.4347, "step": 4976 }, { "epoch": 0.06, "learning_rate": 0.00019867255029528885, "loss": 2.4151, "step": 4984 }, { "epoch": 0.06, "learning_rate": 0.0001986676685859025, "loss": 2.437, "step": 4992 }, { "epoch": 0.06, "learning_rate": 0.00019866277798365138, "loss": 2.4154, "step": 5000 }, { "epoch": 0.06, "learning_rate": 0.00019865787848902605, "loss": 2.4272, "step": 5008 }, { "epoch": 0.06, "learning_rate": 0.00019865297010251786, "loss": 2.4273, "step": 5016 }, { "epoch": 0.06, "learning_rate": 0.0001986480528246191, "loss": 2.4389, "step": 5024 }, { "epoch": 0.06, "learning_rate": 0.00019864312665582293, "loss": 2.4238, "step": 5032 }, { "epoch": 0.06, "learning_rate": 0.00019863819159662347, "loss": 2.443, "step": 5040 }, { "epoch": 0.06, "learning_rate": 0.00019863324764751562, "loss": 2.4488, "step": 5048 }, { "epoch": 0.06, "learning_rate": 0.0001986282948089953, "loss": 2.4082, "step": 5056 }, { "epoch": 0.06, "learning_rate": 0.00019862333308155917, "loss": 2.4275, "step": 5064 }, { "epoch": 0.06, "learning_rate": 0.0001986183624657049, "loss": 2.4202, "step": 5072 }, { "epoch": 0.06, "learning_rate": 0.00019861338296193098, "loss": 2.4266, "step": 5080 }, { "epoch": 0.06, "learning_rate": 0.0001986083945707369, "loss": 2.4172, "step": 5088 }, { "epoch": 0.06, "learning_rate": 0.00019860339729262295, "loss": 2.417, "step": 5096 }, { "epoch": 0.06, "learning_rate": 0.00019859839112809025, "loss": 2.4428, "step": 5104 }, { "epoch": 0.06, "learning_rate": 0.00019859337607764098, "loss": 2.4217, "step": 5112 }, { "epoch": 0.06, "learning_rate": 0.0001985883521417781, "loss": 2.4276, "step": 5120 }, { "epoch": 0.06, "learning_rate": 0.00019858331932100543, "loss": 2.4209, "step": 5128 }, { "epoch": 0.06, "learning_rate": 0.00019857827761582782, "loss": 2.4141, "step": 5136 }, { "epoch": 0.06, "learning_rate": 0.00019857322702675082, "loss": 2.4232, "step": 5144 }, { "epoch": 0.06, "learning_rate": 0.00019856816755428106, "loss": 2.4265, "step": 5152 }, { "epoch": 0.06, "learning_rate": 0.00019856309919892597, "loss": 2.4222, "step": 5160 }, { "epoch": 0.06, "learning_rate": 0.00019855802196119384, "loss": 2.4155, "step": 5168 }, { "epoch": 0.06, "learning_rate": 0.0001985529358415939, "loss": 2.3992, "step": 5176 }, { "epoch": 0.06, "learning_rate": 0.0001985478408406363, "loss": 2.4052, "step": 5184 }, { "epoch": 0.06, "learning_rate": 0.00019854273695883192, "loss": 2.4209, "step": 5192 }, { "epoch": 0.07, "learning_rate": 0.00019853762419669283, "loss": 2.4297, "step": 5200 }, { "epoch": 0.07, "learning_rate": 0.00019853250255473165, "loss": 2.4004, "step": 5208 }, { "epoch": 0.07, "learning_rate": 0.00019852737203346213, "loss": 2.4514, "step": 5216 }, { "epoch": 0.07, "learning_rate": 0.0001985222326333988, "loss": 2.4228, "step": 5224 }, { "epoch": 0.07, "learning_rate": 0.00019851708435505717, "loss": 2.4332, "step": 5232 }, { "epoch": 0.07, "learning_rate": 0.00019851192719895356, "loss": 2.4207, "step": 5240 }, { "epoch": 0.07, "learning_rate": 0.00019850676116560517, "loss": 2.4237, "step": 5248 }, { "epoch": 0.07, "learning_rate": 0.0001985015862555301, "loss": 2.4269, "step": 5256 }, { "epoch": 0.07, "learning_rate": 0.00019849640246924743, "loss": 2.4073, "step": 5264 }, { "epoch": 0.07, "learning_rate": 0.00019849120980727707, "loss": 2.4031, "step": 5272 }, { "epoch": 0.07, "learning_rate": 0.00019848600827013975, "loss": 2.431, "step": 5280 }, { "epoch": 0.07, "learning_rate": 0.00019848079785835722, "loss": 2.4159, "step": 5288 }, { "epoch": 0.07, "learning_rate": 0.000198475578572452, "loss": 2.4308, "step": 5296 }, { "epoch": 0.07, "learning_rate": 0.0001984703504129476, "loss": 2.4225, "step": 5304 }, { "epoch": 0.07, "learning_rate": 0.00019846511338036832, "loss": 2.4148, "step": 5312 }, { "epoch": 0.07, "learning_rate": 0.00019845986747523946, "loss": 2.4143, "step": 5320 }, { "epoch": 0.07, "learning_rate": 0.00019845461269808715, "loss": 2.4298, "step": 5328 }, { "epoch": 0.07, "learning_rate": 0.0001984493490494384, "loss": 2.4081, "step": 5336 }, { "epoch": 0.07, "learning_rate": 0.0001984440765298211, "loss": 2.4295, "step": 5344 }, { "epoch": 0.07, "learning_rate": 0.0001984387951397641, "loss": 2.4363, "step": 5352 }, { "epoch": 0.07, "learning_rate": 0.00019843350487979702, "loss": 2.4087, "step": 5360 }, { "epoch": 0.07, "learning_rate": 0.0001984282057504505, "loss": 2.4297, "step": 5368 }, { "epoch": 0.07, "learning_rate": 0.00019842289775225604, "loss": 2.4083, "step": 5376 }, { "epoch": 0.07, "learning_rate": 0.00019841758088574597, "loss": 2.4181, "step": 5384 }, { "epoch": 0.07, "learning_rate": 0.0001984122551514535, "loss": 2.4235, "step": 5392 }, { "epoch": 0.07, "learning_rate": 0.00019840692054991287, "loss": 2.4441, "step": 5400 }, { "epoch": 0.07, "learning_rate": 0.00019840157708165898, "loss": 2.444, "step": 5408 }, { "epoch": 0.07, "learning_rate": 0.00019839622474722784, "loss": 2.41, "step": 5416 }, { "epoch": 0.07, "learning_rate": 0.00019839086354715628, "loss": 2.4071, "step": 5424 }, { "epoch": 0.07, "learning_rate": 0.00019838549348198193, "loss": 2.4191, "step": 5432 }, { "epoch": 0.07, "learning_rate": 0.00019838011455224338, "loss": 2.4208, "step": 5440 }, { "epoch": 0.07, "learning_rate": 0.00019837472675848013, "loss": 2.4122, "step": 5448 }, { "epoch": 0.07, "learning_rate": 0.0001983693301012326, "loss": 2.4252, "step": 5456 }, { "epoch": 0.07, "learning_rate": 0.00019836392458104195, "loss": 2.4186, "step": 5464 }, { "epoch": 0.07, "learning_rate": 0.00019835851019845037, "loss": 2.413, "step": 5472 }, { "epoch": 0.07, "learning_rate": 0.0001983530869540009, "loss": 2.4262, "step": 5480 }, { "epoch": 0.07, "learning_rate": 0.0001983476548482374, "loss": 2.4401, "step": 5488 }, { "epoch": 0.07, "learning_rate": 0.00019834221388170478, "loss": 2.417, "step": 5496 }, { "epoch": 0.07, "learning_rate": 0.00019833676405494862, "loss": 2.4109, "step": 5504 }, { "epoch": 0.07, "learning_rate": 0.0001983313053685156, "loss": 2.4255, "step": 5512 }, { "epoch": 0.07, "learning_rate": 0.00019832583782295314, "loss": 2.4205, "step": 5520 }, { "epoch": 0.07, "learning_rate": 0.0001983203614188097, "loss": 2.419, "step": 5528 }, { "epoch": 0.07, "learning_rate": 0.0001983148761566344, "loss": 2.4319, "step": 5536 }, { "epoch": 0.07, "learning_rate": 0.00019830938203697747, "loss": 2.4192, "step": 5544 }, { "epoch": 0.07, "learning_rate": 0.00019830387906038987, "loss": 2.4212, "step": 5552 }, { "epoch": 0.07, "learning_rate": 0.00019829836722742362, "loss": 2.4213, "step": 5560 }, { "epoch": 0.07, "learning_rate": 0.0001982928465386314, "loss": 2.4333, "step": 5568 }, { "epoch": 0.07, "learning_rate": 0.000198287316994567, "loss": 2.4257, "step": 5576 }, { "epoch": 0.07, "learning_rate": 0.00019828177859578495, "loss": 2.4195, "step": 5584 }, { "epoch": 0.07, "learning_rate": 0.00019827623134284074, "loss": 2.4254, "step": 5592 }, { "epoch": 0.07, "learning_rate": 0.00019827067523629075, "loss": 2.4437, "step": 5600 }, { "epoch": 0.07, "learning_rate": 0.0001982651102766922, "loss": 2.4077, "step": 5608 }, { "epoch": 0.07, "learning_rate": 0.00019825953646460324, "loss": 2.4221, "step": 5616 }, { "epoch": 0.07, "learning_rate": 0.00019825395380058283, "loss": 2.4183, "step": 5624 }, { "epoch": 0.07, "learning_rate": 0.00019824836228519096, "loss": 2.3967, "step": 5632 }, { "epoch": 0.07, "learning_rate": 0.00019824276191898838, "loss": 2.4104, "step": 5640 }, { "epoch": 0.07, "learning_rate": 0.0001982371527025368, "loss": 2.4196, "step": 5648 }, { "epoch": 0.07, "learning_rate": 0.00019823153463639878, "loss": 2.4218, "step": 5656 }, { "epoch": 0.07, "learning_rate": 0.0001982259077211378, "loss": 2.4108, "step": 5664 }, { "epoch": 0.07, "learning_rate": 0.00019822027195731817, "loss": 2.4433, "step": 5672 }, { "epoch": 0.07, "learning_rate": 0.00019821462734550516, "loss": 2.4173, "step": 5680 }, { "epoch": 0.07, "learning_rate": 0.00019820897388626488, "loss": 2.4108, "step": 5688 }, { "epoch": 0.07, "learning_rate": 0.00019820331158016435, "loss": 2.4267, "step": 5696 }, { "epoch": 0.07, "learning_rate": 0.00019819764042777142, "loss": 2.4162, "step": 5704 }, { "epoch": 0.07, "learning_rate": 0.0001981919604296549, "loss": 2.4167, "step": 5712 }, { "epoch": 0.07, "learning_rate": 0.00019818627158638453, "loss": 2.405, "step": 5720 }, { "epoch": 0.07, "learning_rate": 0.00019818057389853078, "loss": 2.4068, "step": 5728 }, { "epoch": 0.07, "learning_rate": 0.00019817486736666514, "loss": 2.4205, "step": 5736 }, { "epoch": 0.07, "learning_rate": 0.0001981691519913599, "loss": 2.4149, "step": 5744 }, { "epoch": 0.07, "learning_rate": 0.00019816342777318832, "loss": 2.4238, "step": 5752 }, { "epoch": 0.07, "learning_rate": 0.00019815769471272452, "loss": 2.4134, "step": 5760 }, { "epoch": 0.07, "learning_rate": 0.00019815195281054344, "loss": 2.4193, "step": 5768 }, { "epoch": 0.07, "learning_rate": 0.000198146202067221, "loss": 2.4233, "step": 5776 }, { "epoch": 0.07, "learning_rate": 0.00019814044248333396, "loss": 2.4386, "step": 5784 }, { "epoch": 0.07, "learning_rate": 0.00019813467405945998, "loss": 2.4293, "step": 5792 }, { "epoch": 0.07, "learning_rate": 0.00019812889679617757, "loss": 2.4222, "step": 5800 }, { "epoch": 0.07, "learning_rate": 0.0001981231106940662, "loss": 2.4344, "step": 5808 }, { "epoch": 0.07, "learning_rate": 0.00019811731575370613, "loss": 2.4337, "step": 5816 }, { "epoch": 0.07, "learning_rate": 0.00019811151197567862, "loss": 2.4287, "step": 5824 }, { "epoch": 0.07, "learning_rate": 0.00019810569936056573, "loss": 2.418, "step": 5832 }, { "epoch": 0.07, "learning_rate": 0.0001980998779089504, "loss": 2.4213, "step": 5840 }, { "epoch": 0.07, "learning_rate": 0.00019809404762141653, "loss": 2.4079, "step": 5848 }, { "epoch": 0.07, "learning_rate": 0.00019808820849854882, "loss": 2.4137, "step": 5856 }, { "epoch": 0.07, "learning_rate": 0.000198082360540933, "loss": 2.416, "step": 5864 }, { "epoch": 0.07, "learning_rate": 0.00019807650374915547, "loss": 2.4408, "step": 5872 }, { "epoch": 0.07, "learning_rate": 0.00019807063812380372, "loss": 2.4035, "step": 5880 }, { "epoch": 0.07, "learning_rate": 0.00019806476366546595, "loss": 2.4086, "step": 5888 }, { "epoch": 0.07, "learning_rate": 0.00019805888037473143, "loss": 2.4334, "step": 5896 }, { "epoch": 0.07, "learning_rate": 0.00019805298825219017, "loss": 2.434, "step": 5904 }, { "epoch": 0.07, "learning_rate": 0.0001980470872984331, "loss": 2.4105, "step": 5912 }, { "epoch": 0.07, "learning_rate": 0.0001980411775140521, "loss": 2.4249, "step": 5920 }, { "epoch": 0.07, "learning_rate": 0.00019803525889963984, "loss": 2.4301, "step": 5928 }, { "epoch": 0.07, "learning_rate": 0.00019802933145579, "loss": 2.4166, "step": 5936 }, { "epoch": 0.07, "learning_rate": 0.000198023395183097, "loss": 2.4214, "step": 5944 }, { "epoch": 0.07, "learning_rate": 0.00019801745008215618, "loss": 2.4225, "step": 5952 }, { "epoch": 0.07, "learning_rate": 0.0001980114961535639, "loss": 2.4261, "step": 5960 }, { "epoch": 0.07, "learning_rate": 0.00019800553339791724, "loss": 2.4148, "step": 5968 }, { "epoch": 0.07, "learning_rate": 0.00019799956181581425, "loss": 2.4137, "step": 5976 }, { "epoch": 0.07, "learning_rate": 0.00019799358140785381, "loss": 2.4184, "step": 5984 }, { "epoch": 0.07, "learning_rate": 0.0001979875921746358, "loss": 2.4309, "step": 5992 }, { "epoch": 0.07, "learning_rate": 0.00019798159411676085, "loss": 2.4377, "step": 6000 }, { "epoch": 0.08, "learning_rate": 0.00019797558723483053, "loss": 2.4096, "step": 6008 }, { "epoch": 0.08, "learning_rate": 0.00019796957152944732, "loss": 2.4495, "step": 6016 }, { "epoch": 0.08, "learning_rate": 0.00019796354700121453, "loss": 2.4204, "step": 6024 }, { "epoch": 0.08, "learning_rate": 0.00019795751365073644, "loss": 2.431, "step": 6032 }, { "epoch": 0.08, "learning_rate": 0.00019795147147861809, "loss": 2.4253, "step": 6040 }, { "epoch": 0.08, "learning_rate": 0.0001979454204854655, "loss": 2.4138, "step": 6048 }, { "epoch": 0.08, "learning_rate": 0.0001979393606718856, "loss": 2.4097, "step": 6056 }, { "epoch": 0.08, "learning_rate": 0.0001979332920384861, "loss": 2.4326, "step": 6064 }, { "epoch": 0.08, "learning_rate": 0.00019792721458587566, "loss": 2.4241, "step": 6072 }, { "epoch": 0.08, "learning_rate": 0.00019792112831466382, "loss": 2.4096, "step": 6080 }, { "epoch": 0.08, "learning_rate": 0.00019791503322546102, "loss": 2.4228, "step": 6088 }, { "epoch": 0.08, "learning_rate": 0.00019790892931887853, "loss": 2.4267, "step": 6096 }, { "epoch": 0.08, "learning_rate": 0.00019790281659552855, "loss": 2.4323, "step": 6104 }, { "epoch": 0.08, "learning_rate": 0.00019789669505602416, "loss": 2.4442, "step": 6112 }, { "epoch": 0.08, "learning_rate": 0.00019789056470097927, "loss": 2.4554, "step": 6120 }, { "epoch": 0.08, "learning_rate": 0.0001978844255310088, "loss": 2.4064, "step": 6128 }, { "epoch": 0.08, "learning_rate": 0.00019787827754672838, "loss": 2.4185, "step": 6136 }, { "epoch": 0.08, "learning_rate": 0.00019787212074875472, "loss": 2.4449, "step": 6144 }, { "epoch": 0.08, "learning_rate": 0.00019786595513770523, "loss": 2.4167, "step": 6152 }, { "epoch": 0.08, "learning_rate": 0.00019785978071419833, "loss": 2.3857, "step": 6160 }, { "epoch": 0.08, "learning_rate": 0.00019785359747885324, "loss": 2.4374, "step": 6168 }, { "epoch": 0.08, "learning_rate": 0.00019784740543229014, "loss": 2.4185, "step": 6176 }, { "epoch": 0.08, "learning_rate": 0.00019784120457513003, "loss": 2.3988, "step": 6184 }, { "epoch": 0.08, "learning_rate": 0.0001978349949079949, "loss": 2.4153, "step": 6192 }, { "epoch": 0.08, "learning_rate": 0.0001978287764315074, "loss": 2.4346, "step": 6200 }, { "epoch": 0.08, "learning_rate": 0.00019782254914629138, "loss": 2.4229, "step": 6208 }, { "epoch": 0.08, "learning_rate": 0.00019781631305297123, "loss": 2.429, "step": 6216 }, { "epoch": 0.08, "learning_rate": 0.00019781006815217252, "loss": 2.4171, "step": 6224 }, { "epoch": 0.08, "learning_rate": 0.0001978038144445215, "loss": 2.4402, "step": 6232 }, { "epoch": 0.08, "learning_rate": 0.00019779755193064544, "loss": 2.4371, "step": 6240 }, { "epoch": 0.08, "learning_rate": 0.00019779128061117243, "loss": 2.4127, "step": 6248 }, { "epoch": 0.08, "learning_rate": 0.0001977850004867314, "loss": 2.4162, "step": 6256 }, { "epoch": 0.08, "learning_rate": 0.00019777871155795222, "loss": 2.4168, "step": 6264 }, { "epoch": 0.08, "learning_rate": 0.00019777241382546568, "loss": 2.4037, "step": 6272 }, { "epoch": 0.08, "learning_rate": 0.00019776610728990338, "loss": 2.4039, "step": 6280 }, { "epoch": 0.08, "learning_rate": 0.00019775979195189782, "loss": 2.4355, "step": 6288 }, { "epoch": 0.08, "learning_rate": 0.0001977534678120824, "loss": 2.42, "step": 6296 }, { "epoch": 0.08, "learning_rate": 0.0001977471348710914, "loss": 2.4269, "step": 6304 }, { "epoch": 0.08, "learning_rate": 0.00019774079312955995, "loss": 2.4303, "step": 6312 }, { "epoch": 0.08, "learning_rate": 0.00019773444258812414, "loss": 2.4375, "step": 6320 }, { "epoch": 0.08, "learning_rate": 0.00019772808324742088, "loss": 2.42, "step": 6328 }, { "epoch": 0.08, "learning_rate": 0.00019772171510808794, "loss": 2.415, "step": 6336 }, { "epoch": 0.08, "learning_rate": 0.00019771533817076407, "loss": 2.4304, "step": 6344 }, { "epoch": 0.08, "learning_rate": 0.0001977089524360888, "loss": 2.4173, "step": 6352 }, { "epoch": 0.08, "learning_rate": 0.00019770255790470254, "loss": 2.4176, "step": 6360 }, { "epoch": 0.08, "learning_rate": 0.0001976961545772467, "loss": 2.4532, "step": 6368 }, { "epoch": 0.08, "learning_rate": 0.00019768974245436348, "loss": 2.3959, "step": 6376 }, { "epoch": 0.08, "learning_rate": 0.00019768332153669596, "loss": 2.4328, "step": 6384 }, { "epoch": 0.08, "learning_rate": 0.00019767689182488812, "loss": 2.4021, "step": 6392 }, { "epoch": 0.08, "learning_rate": 0.00019767045331958486, "loss": 2.3979, "step": 6400 }, { "epoch": 0.08, "learning_rate": 0.00019766400602143187, "loss": 2.4045, "step": 6408 }, { "epoch": 0.08, "learning_rate": 0.0001976575499310758, "loss": 2.422, "step": 6416 }, { "epoch": 0.08, "learning_rate": 0.0001976510850491642, "loss": 2.4299, "step": 6424 }, { "epoch": 0.08, "learning_rate": 0.00019764461137634543, "loss": 2.4217, "step": 6432 }, { "epoch": 0.08, "learning_rate": 0.00019763812891326874, "loss": 2.4129, "step": 6440 }, { "epoch": 0.08, "learning_rate": 0.00019763163766058433, "loss": 2.4204, "step": 6448 }, { "epoch": 0.08, "learning_rate": 0.0001976251376189432, "loss": 2.4248, "step": 6456 }, { "epoch": 0.08, "learning_rate": 0.00019761862878899726, "loss": 2.4222, "step": 6464 }, { "epoch": 0.08, "learning_rate": 0.00019761211117139932, "loss": 2.4271, "step": 6472 }, { "epoch": 0.08, "learning_rate": 0.0001976055847668031, "loss": 2.4303, "step": 6480 }, { "epoch": 0.08, "learning_rate": 0.00019759904957586313, "loss": 2.4209, "step": 6488 }, { "epoch": 0.08, "learning_rate": 0.0001975925055992348, "loss": 2.406, "step": 6496 }, { "epoch": 0.08, "learning_rate": 0.00019758595283757453, "loss": 2.4003, "step": 6504 }, { "epoch": 0.08, "learning_rate": 0.00019757939129153948, "loss": 2.4214, "step": 6512 }, { "epoch": 0.08, "learning_rate": 0.00019757282096178773, "loss": 2.4195, "step": 6520 }, { "epoch": 0.08, "learning_rate": 0.00019756624184897825, "loss": 2.4205, "step": 6528 }, { "epoch": 0.08, "learning_rate": 0.0001975596539537709, "loss": 2.4012, "step": 6536 }, { "epoch": 0.08, "learning_rate": 0.00019755305727682637, "loss": 2.4396, "step": 6544 }, { "epoch": 0.08, "learning_rate": 0.00019754645181880632, "loss": 2.4492, "step": 6552 }, { "epoch": 0.08, "learning_rate": 0.00019753983758037322, "loss": 2.425, "step": 6560 }, { "epoch": 0.08, "learning_rate": 0.00019753321456219045, "loss": 2.4277, "step": 6568 }, { "epoch": 0.08, "learning_rate": 0.0001975265827649222, "loss": 2.4428, "step": 6576 }, { "epoch": 0.08, "learning_rate": 0.00019751994218923367, "loss": 2.4237, "step": 6584 }, { "epoch": 0.08, "learning_rate": 0.0001975132928357909, "loss": 2.4228, "step": 6592 }, { "epoch": 0.08, "learning_rate": 0.0001975066347052607, "loss": 2.4164, "step": 6600 }, { "epoch": 0.08, "learning_rate": 0.0001974999677983109, "loss": 2.4236, "step": 6608 }, { "epoch": 0.08, "learning_rate": 0.00019749329211561013, "loss": 2.4256, "step": 6616 }, { "epoch": 0.08, "learning_rate": 0.0001974866076578279, "loss": 2.4231, "step": 6624 }, { "epoch": 0.08, "learning_rate": 0.00019747991442563466, "loss": 2.4295, "step": 6632 }, { "epoch": 0.08, "learning_rate": 0.00019747321241970166, "loss": 2.4168, "step": 6640 }, { "epoch": 0.08, "learning_rate": 0.00019746650164070116, "loss": 2.4107, "step": 6648 }, { "epoch": 0.08, "learning_rate": 0.00019745978208930614, "loss": 2.4104, "step": 6656 }, { "epoch": 0.08, "learning_rate": 0.00019745305376619052, "loss": 2.421, "step": 6664 }, { "epoch": 0.08, "learning_rate": 0.00019744631667202917, "loss": 2.4239, "step": 6672 }, { "epoch": 0.08, "learning_rate": 0.00019743957080749778, "loss": 2.4177, "step": 6680 }, { "epoch": 0.08, "learning_rate": 0.00019743281617327286, "loss": 2.4119, "step": 6688 }, { "epoch": 0.08, "learning_rate": 0.00019742605277003192, "loss": 2.4283, "step": 6696 }, { "epoch": 0.08, "learning_rate": 0.00019741928059845325, "loss": 2.4355, "step": 6704 }, { "epoch": 0.08, "learning_rate": 0.00019741249965921607, "loss": 2.4084, "step": 6712 }, { "epoch": 0.08, "learning_rate": 0.00019740570995300052, "loss": 2.4132, "step": 6720 }, { "epoch": 0.08, "learning_rate": 0.00019739891148048752, "loss": 2.4178, "step": 6728 }, { "epoch": 0.08, "learning_rate": 0.00019739210424235892, "loss": 2.4083, "step": 6736 }, { "epoch": 0.08, "learning_rate": 0.00019738528823929746, "loss": 2.4052, "step": 6744 }, { "epoch": 0.08, "learning_rate": 0.0001973784634719867, "loss": 2.4327, "step": 6752 }, { "epoch": 0.08, "learning_rate": 0.00019737162994111124, "loss": 2.4188, "step": 6760 }, { "epoch": 0.08, "learning_rate": 0.00019736478764735636, "loss": 2.4104, "step": 6768 }, { "epoch": 0.08, "learning_rate": 0.00019735793659140827, "loss": 2.4135, "step": 6776 }, { "epoch": 0.08, "learning_rate": 0.00019735107677395415, "loss": 2.4231, "step": 6784 }, { "epoch": 0.08, "learning_rate": 0.000197344208195682, "loss": 2.4132, "step": 6792 }, { "epoch": 0.09, "learning_rate": 0.00019733733085728068, "loss": 2.436, "step": 6800 }, { "epoch": 0.09, "learning_rate": 0.00019733044475943998, "loss": 2.4167, "step": 6808 }, { "epoch": 0.09, "learning_rate": 0.0001973235499028505, "loss": 2.4176, "step": 6816 }, { "epoch": 0.09, "learning_rate": 0.00019731664628820376, "loss": 2.4045, "step": 6824 }, { "epoch": 0.09, "learning_rate": 0.00019730973391619215, "loss": 2.4262, "step": 6832 }, { "epoch": 0.09, "learning_rate": 0.00019730281278750898, "loss": 2.4304, "step": 6840 }, { "epoch": 0.09, "learning_rate": 0.00019729588290284835, "loss": 2.4195, "step": 6848 }, { "epoch": 0.09, "learning_rate": 0.0001972889442629053, "loss": 2.4183, "step": 6856 }, { "epoch": 0.09, "learning_rate": 0.0001972819968683758, "loss": 2.4232, "step": 6864 }, { "epoch": 0.09, "learning_rate": 0.0001972750407199565, "loss": 2.4193, "step": 6872 }, { "epoch": 0.09, "learning_rate": 0.0001972680758183452, "loss": 2.4227, "step": 6880 }, { "epoch": 0.09, "learning_rate": 0.00019726110216424037, "loss": 2.401, "step": 6888 }, { "epoch": 0.09, "learning_rate": 0.00019725411975834146, "loss": 2.4279, "step": 6896 }, { "epoch": 0.09, "learning_rate": 0.00019724712860134873, "loss": 2.4032, "step": 6904 }, { "epoch": 0.09, "learning_rate": 0.00019724012869396337, "loss": 2.4079, "step": 6912 }, { "epoch": 0.09, "learning_rate": 0.0001972331200368874, "loss": 2.4222, "step": 6920 }, { "epoch": 0.09, "learning_rate": 0.00019722610263082387, "loss": 2.4291, "step": 6928 }, { "epoch": 0.09, "learning_rate": 0.0001972190764764764, "loss": 2.403, "step": 6936 }, { "epoch": 0.09, "learning_rate": 0.00019721204157454981, "loss": 2.4193, "step": 6944 }, { "epoch": 0.09, "learning_rate": 0.00019720499792574964, "loss": 2.428, "step": 6952 }, { "epoch": 0.09, "learning_rate": 0.0001971979455307823, "loss": 2.4367, "step": 6960 }, { "epoch": 0.09, "learning_rate": 0.00019719088439035509, "loss": 2.3963, "step": 6968 }, { "epoch": 0.09, "learning_rate": 0.00019718381450517625, "loss": 2.4068, "step": 6976 }, { "epoch": 0.09, "learning_rate": 0.0001971767358759548, "loss": 2.4293, "step": 6984 }, { "epoch": 0.09, "learning_rate": 0.00019716964850340074, "loss": 2.4212, "step": 6992 }, { "epoch": 0.09, "learning_rate": 0.00019716255238822486, "loss": 2.4169, "step": 7000 }, { "epoch": 0.09, "learning_rate": 0.00019715544753113885, "loss": 2.4429, "step": 7008 }, { "epoch": 0.09, "learning_rate": 0.00019714833393285532, "loss": 2.4328, "step": 7016 }, { "epoch": 0.09, "learning_rate": 0.0001971412115940877, "loss": 2.4077, "step": 7024 }, { "epoch": 0.09, "learning_rate": 0.00019713408051555032, "loss": 2.4, "step": 7032 }, { "epoch": 0.09, "learning_rate": 0.00019712694069795838, "loss": 2.4126, "step": 7040 }, { "epoch": 0.09, "learning_rate": 0.000197119792142028, "loss": 2.4092, "step": 7048 }, { "epoch": 0.09, "learning_rate": 0.00019711263484847614, "loss": 2.4034, "step": 7056 }, { "epoch": 0.09, "learning_rate": 0.00019710546881802056, "loss": 2.4072, "step": 7064 }, { "epoch": 0.09, "learning_rate": 0.00019709829405138005, "loss": 2.4212, "step": 7072 }, { "epoch": 0.09, "learning_rate": 0.00019709111054927415, "loss": 2.4267, "step": 7080 }, { "epoch": 0.09, "learning_rate": 0.0001970839183124234, "loss": 2.3955, "step": 7088 }, { "epoch": 0.09, "learning_rate": 0.00019707671734154906, "loss": 2.4315, "step": 7096 }, { "epoch": 0.09, "learning_rate": 0.00019706950763737337, "loss": 2.4216, "step": 7104 }, { "epoch": 0.09, "learning_rate": 0.0001970622892006194, "loss": 2.4091, "step": 7112 }, { "epoch": 0.09, "learning_rate": 0.0001970550620320112, "loss": 2.4044, "step": 7120 }, { "epoch": 0.09, "learning_rate": 0.00019704782613227354, "loss": 2.4281, "step": 7128 }, { "epoch": 0.09, "learning_rate": 0.00019704058150213214, "loss": 2.426, "step": 7136 }, { "epoch": 0.09, "learning_rate": 0.0001970333281423136, "loss": 2.4268, "step": 7144 }, { "epoch": 0.09, "learning_rate": 0.00019702606605354544, "loss": 2.4068, "step": 7152 }, { "epoch": 0.09, "learning_rate": 0.00019701879523655594, "loss": 2.392, "step": 7160 }, { "epoch": 0.09, "learning_rate": 0.0001970115156920744, "loss": 2.4122, "step": 7168 }, { "epoch": 0.09, "learning_rate": 0.00019700422742083084, "loss": 2.4233, "step": 7176 }, { "epoch": 0.09, "learning_rate": 0.00019699693042355627, "loss": 2.411, "step": 7184 }, { "epoch": 0.09, "learning_rate": 0.00019698962470098252, "loss": 2.4073, "step": 7192 }, { "epoch": 0.09, "learning_rate": 0.00019698231025384234, "loss": 2.415, "step": 7200 }, { "epoch": 0.09, "learning_rate": 0.0001969749870828693, "loss": 2.4199, "step": 7208 }, { "epoch": 0.09, "learning_rate": 0.0001969676551887979, "loss": 2.417, "step": 7216 }, { "epoch": 0.09, "learning_rate": 0.00019696031457236345, "loss": 2.4365, "step": 7224 }, { "epoch": 0.09, "learning_rate": 0.0001969529652343022, "loss": 2.4072, "step": 7232 }, { "epoch": 0.09, "learning_rate": 0.00019694560717535125, "loss": 2.4145, "step": 7240 }, { "epoch": 0.09, "learning_rate": 0.00019693824039624853, "loss": 2.392, "step": 7248 }, { "epoch": 0.09, "learning_rate": 0.00019693086489773297, "loss": 2.4205, "step": 7256 }, { "epoch": 0.09, "learning_rate": 0.0001969234806805442, "loss": 2.4091, "step": 7264 }, { "epoch": 0.09, "learning_rate": 0.00019691608774542282, "loss": 2.4027, "step": 7272 }, { "epoch": 0.09, "learning_rate": 0.00019690868609311036, "loss": 2.4007, "step": 7280 }, { "epoch": 0.09, "learning_rate": 0.00019690127572434917, "loss": 2.4057, "step": 7288 }, { "epoch": 0.09, "learning_rate": 0.00019689385663988242, "loss": 2.4352, "step": 7296 }, { "epoch": 0.09, "learning_rate": 0.00019688642884045423, "loss": 2.4196, "step": 7304 }, { "epoch": 0.09, "learning_rate": 0.0001968789923268095, "loss": 2.4064, "step": 7312 }, { "epoch": 0.09, "learning_rate": 0.00019687154709969415, "loss": 2.4117, "step": 7320 }, { "epoch": 0.09, "learning_rate": 0.0001968640931598549, "loss": 2.4342, "step": 7328 }, { "epoch": 0.09, "learning_rate": 0.00019685663050803925, "loss": 2.4191, "step": 7336 }, { "epoch": 0.09, "learning_rate": 0.00019684915914499576, "loss": 2.4205, "step": 7344 }, { "epoch": 0.09, "learning_rate": 0.0001968416790714737, "loss": 2.4048, "step": 7352 }, { "epoch": 0.09, "learning_rate": 0.0001968341902882233, "loss": 2.4143, "step": 7360 }, { "epoch": 0.09, "learning_rate": 0.00019682669279599566, "loss": 2.3994, "step": 7368 }, { "epoch": 0.09, "learning_rate": 0.00019681918659554272, "loss": 2.3929, "step": 7376 }, { "epoch": 0.09, "learning_rate": 0.0001968116716876173, "loss": 2.4121, "step": 7384 }, { "epoch": 0.09, "learning_rate": 0.00019680414807297312, "loss": 2.4415, "step": 7392 }, { "epoch": 0.09, "learning_rate": 0.00019679661575236474, "loss": 2.4189, "step": 7400 }, { "epoch": 0.09, "learning_rate": 0.00019678907472654762, "loss": 2.4103, "step": 7408 }, { "epoch": 0.09, "learning_rate": 0.00019678152499627807, "loss": 2.4095, "step": 7416 }, { "epoch": 0.09, "learning_rate": 0.0001967739665623133, "loss": 2.4099, "step": 7424 }, { "epoch": 0.09, "learning_rate": 0.00019676639942541139, "loss": 2.4088, "step": 7432 }, { "epoch": 0.09, "learning_rate": 0.00019675882358633124, "loss": 2.3963, "step": 7440 }, { "epoch": 0.09, "learning_rate": 0.0001967512390458327, "loss": 2.433, "step": 7448 }, { "epoch": 0.09, "learning_rate": 0.00019674364580467643, "loss": 2.4292, "step": 7456 }, { "epoch": 0.09, "learning_rate": 0.000196736043863624, "loss": 2.4088, "step": 7464 }, { "epoch": 0.09, "learning_rate": 0.00019672843322343783, "loss": 2.4036, "step": 7472 }, { "epoch": 0.09, "learning_rate": 0.00019672081388488128, "loss": 2.4336, "step": 7480 }, { "epoch": 0.09, "learning_rate": 0.00019671318584871847, "loss": 2.4031, "step": 7488 }, { "epoch": 0.09, "learning_rate": 0.00019670554911571447, "loss": 2.403, "step": 7496 }, { "epoch": 0.09, "learning_rate": 0.00019669790368663517, "loss": 2.4226, "step": 7504 }, { "epoch": 0.09, "learning_rate": 0.0001966902495622474, "loss": 2.4025, "step": 7512 }, { "epoch": 0.09, "learning_rate": 0.0001966825867433188, "loss": 2.4083, "step": 7520 }, { "epoch": 0.09, "learning_rate": 0.00019667491523061794, "loss": 2.4034, "step": 7528 }, { "epoch": 0.09, "learning_rate": 0.0001966672350249142, "loss": 2.397, "step": 7536 }, { "epoch": 0.09, "learning_rate": 0.00019665954612697786, "loss": 2.4118, "step": 7544 }, { "epoch": 0.09, "learning_rate": 0.00019665184853758012, "loss": 2.4071, "step": 7552 }, { "epoch": 0.09, "learning_rate": 0.00019664414225749295, "loss": 2.4014, "step": 7560 }, { "epoch": 0.09, "learning_rate": 0.00019663642728748925, "loss": 2.4183, "step": 7568 }, { "epoch": 0.09, "learning_rate": 0.0001966287036283428, "loss": 2.4104, "step": 7576 }, { "epoch": 0.09, "learning_rate": 0.00019662097128082825, "loss": 2.4273, "step": 7584 }, { "epoch": 0.09, "learning_rate": 0.00019661323024572114, "loss": 2.4006, "step": 7592 }, { "epoch": 0.1, "learning_rate": 0.00019660548052379776, "loss": 2.4077, "step": 7600 }, { "epoch": 0.1, "learning_rate": 0.00019659772211583543, "loss": 2.4195, "step": 7608 }, { "epoch": 0.1, "learning_rate": 0.0001965899550226123, "loss": 2.4095, "step": 7616 }, { "epoch": 0.1, "learning_rate": 0.00019658217924490727, "loss": 2.4084, "step": 7624 }, { "epoch": 0.1, "learning_rate": 0.00019657439478350028, "loss": 2.4152, "step": 7632 }, { "epoch": 0.1, "learning_rate": 0.00019656660163917206, "loss": 2.4218, "step": 7640 }, { "epoch": 0.1, "learning_rate": 0.0001965587998127042, "loss": 2.4112, "step": 7648 }, { "epoch": 0.1, "learning_rate": 0.0001965509893048792, "loss": 2.4048, "step": 7656 }, { "epoch": 0.1, "learning_rate": 0.0001965431701164804, "loss": 2.4148, "step": 7664 }, { "epoch": 0.1, "learning_rate": 0.00019653534224829203, "loss": 2.4049, "step": 7672 }, { "epoch": 0.1, "learning_rate": 0.00019652750570109913, "loss": 2.4004, "step": 7680 }, { "epoch": 0.1, "learning_rate": 0.00019651966047568774, "loss": 2.4197, "step": 7688 }, { "epoch": 0.1, "learning_rate": 0.0001965118065728446, "loss": 2.4023, "step": 7696 }, { "epoch": 0.1, "learning_rate": 0.00019650394399335752, "loss": 2.4011, "step": 7704 }, { "epoch": 0.1, "learning_rate": 0.000196496072738015, "loss": 2.4232, "step": 7712 }, { "epoch": 0.1, "learning_rate": 0.00019648819280760648, "loss": 2.4206, "step": 7720 }, { "epoch": 0.1, "learning_rate": 0.00019648030420292228, "loss": 2.4185, "step": 7728 }, { "epoch": 0.1, "learning_rate": 0.0001964724069247536, "loss": 2.4076, "step": 7736 }, { "epoch": 0.1, "learning_rate": 0.0001964645009738925, "loss": 2.4251, "step": 7744 }, { "epoch": 0.1, "learning_rate": 0.00019645658635113192, "loss": 2.3953, "step": 7752 }, { "epoch": 0.1, "learning_rate": 0.00019644866305726556, "loss": 2.3957, "step": 7760 }, { "epoch": 0.1, "learning_rate": 0.00019644073109308818, "loss": 2.4033, "step": 7768 }, { "epoch": 0.1, "learning_rate": 0.00019643279045939525, "loss": 2.3995, "step": 7776 }, { "epoch": 0.1, "learning_rate": 0.00019642484115698318, "loss": 2.41, "step": 7784 }, { "epoch": 0.1, "learning_rate": 0.0001964168831866493, "loss": 2.4021, "step": 7792 }, { "epoch": 0.1, "learning_rate": 0.00019640891654919168, "loss": 2.4041, "step": 7800 }, { "epoch": 0.1, "learning_rate": 0.00019640094124540934, "loss": 2.4291, "step": 7808 }, { "epoch": 0.1, "learning_rate": 0.00019639295727610215, "loss": 2.4106, "step": 7816 }, { "epoch": 0.1, "learning_rate": 0.0001963849646420709, "loss": 2.3936, "step": 7824 }, { "epoch": 0.1, "learning_rate": 0.00019637696334411718, "loss": 2.4082, "step": 7832 }, { "epoch": 0.1, "learning_rate": 0.00019636895338304345, "loss": 2.4291, "step": 7840 }, { "epoch": 0.1, "learning_rate": 0.00019636093475965312, "loss": 2.4239, "step": 7848 }, { "epoch": 0.1, "learning_rate": 0.00019635290747475038, "loss": 2.3975, "step": 7856 }, { "epoch": 0.1, "learning_rate": 0.00019634487152914032, "loss": 2.4098, "step": 7864 }, { "epoch": 0.1, "learning_rate": 0.00019633682692362888, "loss": 2.4143, "step": 7872 }, { "epoch": 0.1, "learning_rate": 0.00019632877365902295, "loss": 2.4115, "step": 7880 }, { "epoch": 0.1, "learning_rate": 0.00019632071173613015, "loss": 2.4082, "step": 7888 }, { "epoch": 0.1, "learning_rate": 0.00019631264115575913, "loss": 2.4044, "step": 7896 }, { "epoch": 0.1, "learning_rate": 0.00019630456191871922, "loss": 2.4067, "step": 7904 }, { "epoch": 0.1, "learning_rate": 0.0001962964740258208, "loss": 2.4153, "step": 7912 }, { "epoch": 0.1, "learning_rate": 0.00019628837747787502, "loss": 2.4341, "step": 7920 }, { "epoch": 0.1, "learning_rate": 0.0001962802722756939, "loss": 2.4136, "step": 7928 }, { "epoch": 0.1, "learning_rate": 0.00019627215842009038, "loss": 2.4327, "step": 7936 }, { "epoch": 0.1, "learning_rate": 0.00019626403591187824, "loss": 2.4059, "step": 7944 }, { "epoch": 0.1, "learning_rate": 0.00019625590475187205, "loss": 2.4112, "step": 7952 }, { "epoch": 0.1, "learning_rate": 0.00019624776494088739, "loss": 2.4184, "step": 7960 }, { "epoch": 0.1, "learning_rate": 0.00019623961647974062, "loss": 2.4053, "step": 7968 }, { "epoch": 0.1, "learning_rate": 0.000196231459369249, "loss": 2.4093, "step": 7976 }, { "epoch": 0.1, "learning_rate": 0.00019622329361023056, "loss": 2.4293, "step": 7984 }, { "epoch": 0.1, "learning_rate": 0.00019621511920350434, "loss": 2.3955, "step": 7992 }, { "epoch": 0.1, "learning_rate": 0.00019620693614989023, "loss": 2.4111, "step": 8000 }, { "epoch": 0.1, "learning_rate": 0.00019619874445020888, "loss": 2.395, "step": 8008 }, { "epoch": 0.1, "learning_rate": 0.0001961905441052819, "loss": 2.4094, "step": 8016 }, { "epoch": 0.1, "learning_rate": 0.0001961823351159317, "loss": 2.4233, "step": 8024 }, { "epoch": 0.1, "learning_rate": 0.00019617411748298167, "loss": 2.4006, "step": 8032 }, { "epoch": 0.1, "learning_rate": 0.00019616589120725593, "loss": 2.4228, "step": 8040 }, { "epoch": 0.1, "learning_rate": 0.00019615765628957954, "loss": 2.4056, "step": 8048 }, { "epoch": 0.1, "learning_rate": 0.0001961494127307784, "loss": 2.4062, "step": 8056 }, { "epoch": 0.1, "learning_rate": 0.00019614116053167936, "loss": 2.4097, "step": 8064 }, { "epoch": 0.1, "learning_rate": 0.00019613289969310996, "loss": 2.4107, "step": 8072 }, { "epoch": 0.1, "learning_rate": 0.0001961246302158988, "loss": 2.4202, "step": 8080 }, { "epoch": 0.1, "learning_rate": 0.00019611635210087523, "loss": 2.417, "step": 8088 }, { "epoch": 0.1, "learning_rate": 0.00019610806534886953, "loss": 2.3945, "step": 8096 }, { "epoch": 0.1, "learning_rate": 0.0001960997699607128, "loss": 2.4208, "step": 8104 }, { "epoch": 0.1, "learning_rate": 0.000196091465937237, "loss": 2.3983, "step": 8112 }, { "epoch": 0.1, "learning_rate": 0.00019608315327927496, "loss": 2.401, "step": 8120 }, { "epoch": 0.1, "learning_rate": 0.00019607483198766045, "loss": 2.4182, "step": 8128 }, { "epoch": 0.1, "learning_rate": 0.00019606650206322802, "loss": 2.412, "step": 8136 }, { "epoch": 0.1, "learning_rate": 0.0001960581635068131, "loss": 2.3973, "step": 8144 }, { "epoch": 0.1, "learning_rate": 0.000196049816319252, "loss": 2.4032, "step": 8152 }, { "epoch": 0.1, "learning_rate": 0.00019604146050138194, "loss": 2.3854, "step": 8160 }, { "epoch": 0.1, "learning_rate": 0.0001960330960540409, "loss": 2.4162, "step": 8168 }, { "epoch": 0.1, "learning_rate": 0.00019602472297806784, "loss": 2.4235, "step": 8176 }, { "epoch": 0.1, "learning_rate": 0.0001960163412743025, "loss": 2.4081, "step": 8184 }, { "epoch": 0.1, "learning_rate": 0.00019600795094358554, "loss": 2.3797, "step": 8192 }, { "epoch": 0.1, "learning_rate": 0.00019599955198675842, "loss": 2.4345, "step": 8200 }, { "epoch": 0.1, "learning_rate": 0.00019599114440466356, "loss": 2.4186, "step": 8208 }, { "epoch": 0.1, "learning_rate": 0.00019598272819814413, "loss": 2.3856, "step": 8216 }, { "epoch": 0.1, "learning_rate": 0.0001959743033680443, "loss": 2.4097, "step": 8224 }, { "epoch": 0.1, "learning_rate": 0.00019596586991520897, "loss": 2.42, "step": 8232 }, { "epoch": 0.1, "learning_rate": 0.00019595742784048404, "loss": 2.4136, "step": 8240 }, { "epoch": 0.1, "learning_rate": 0.00019594897714471615, "loss": 2.4032, "step": 8248 }, { "epoch": 0.1, "learning_rate": 0.00019594051782875286, "loss": 2.4065, "step": 8256 }, { "epoch": 0.1, "learning_rate": 0.0001959320498934426, "loss": 2.4106, "step": 8264 }, { "epoch": 0.1, "learning_rate": 0.0001959235733396346, "loss": 2.4144, "step": 8272 }, { "epoch": 0.1, "learning_rate": 0.00019591508816817915, "loss": 2.3956, "step": 8280 }, { "epoch": 0.1, "learning_rate": 0.00019590659437992714, "loss": 2.395, "step": 8288 }, { "epoch": 0.1, "learning_rate": 0.00019589809197573046, "loss": 2.3663, "step": 8296 }, { "epoch": 0.1, "learning_rate": 0.00019588958095644192, "loss": 2.419, "step": 8304 }, { "epoch": 0.1, "learning_rate": 0.00019588106132291505, "loss": 2.3952, "step": 8312 }, { "epoch": 0.1, "learning_rate": 0.00019587253307600438, "loss": 2.4023, "step": 8320 }, { "epoch": 0.1, "learning_rate": 0.00019586399621656525, "loss": 2.3927, "step": 8328 }, { "epoch": 0.1, "learning_rate": 0.0001958554507454538, "loss": 2.4151, "step": 8336 }, { "epoch": 0.1, "learning_rate": 0.00019584689666352713, "loss": 2.4198, "step": 8344 }, { "epoch": 0.1, "learning_rate": 0.00019583833397164316, "loss": 2.4017, "step": 8352 }, { "epoch": 0.1, "learning_rate": 0.0001958297626706607, "loss": 2.3867, "step": 8360 }, { "epoch": 0.1, "learning_rate": 0.00019582118276143936, "loss": 2.4177, "step": 8368 }, { "epoch": 0.1, "learning_rate": 0.00019581259424483968, "loss": 2.4213, "step": 8376 }, { "epoch": 0.1, "learning_rate": 0.00019580399712172304, "loss": 2.4288, "step": 8384 }, { "epoch": 0.1, "learning_rate": 0.00019579539139295168, "loss": 2.4018, "step": 8392 }, { "epoch": 0.1, "learning_rate": 0.00019578677705938872, "loss": 2.3918, "step": 8400 }, { "epoch": 0.11, "learning_rate": 0.00019577815412189807, "loss": 2.4063, "step": 8408 }, { "epoch": 0.11, "learning_rate": 0.00019576952258134464, "loss": 2.3996, "step": 8416 }, { "epoch": 0.11, "learning_rate": 0.0001957608824385941, "loss": 2.4193, "step": 8424 }, { "epoch": 0.11, "learning_rate": 0.00019575223369451298, "loss": 2.3985, "step": 8432 }, { "epoch": 0.11, "learning_rate": 0.00019574357634996874, "loss": 2.4147, "step": 8440 }, { "epoch": 0.11, "learning_rate": 0.00019573491040582964, "loss": 2.3948, "step": 8448 }, { "epoch": 0.11, "learning_rate": 0.00019572623586296484, "loss": 2.3941, "step": 8456 }, { "epoch": 0.11, "learning_rate": 0.0001957175527222443, "loss": 2.4034, "step": 8464 }, { "epoch": 0.11, "learning_rate": 0.00019570886098453893, "loss": 2.4085, "step": 8472 }, { "epoch": 0.11, "learning_rate": 0.00019570016065072044, "loss": 2.4159, "step": 8480 }, { "epoch": 0.11, "learning_rate": 0.0001956914517216615, "loss": 2.4078, "step": 8488 }, { "epoch": 0.11, "learning_rate": 0.00019568273419823547, "loss": 2.4148, "step": 8496 }, { "epoch": 0.11, "learning_rate": 0.00019567400808131671, "loss": 2.414, "step": 8504 }, { "epoch": 0.11, "learning_rate": 0.00019566527337178038, "loss": 2.3968, "step": 8512 }, { "epoch": 0.11, "learning_rate": 0.00019565653007050254, "loss": 2.4054, "step": 8520 }, { "epoch": 0.11, "learning_rate": 0.00019564777817836012, "loss": 2.4014, "step": 8528 }, { "epoch": 0.11, "learning_rate": 0.00019563901769623082, "loss": 2.4193, "step": 8536 }, { "epoch": 0.11, "learning_rate": 0.00019563024862499334, "loss": 2.412, "step": 8544 }, { "epoch": 0.11, "learning_rate": 0.0001956214709655271, "loss": 2.4057, "step": 8552 }, { "epoch": 0.11, "learning_rate": 0.00019561268471871248, "loss": 2.4084, "step": 8560 }, { "epoch": 0.11, "learning_rate": 0.0001956038898854307, "loss": 2.4129, "step": 8568 }, { "epoch": 0.11, "learning_rate": 0.00019559508646656385, "loss": 2.4073, "step": 8576 }, { "epoch": 0.11, "learning_rate": 0.0001955862744629948, "loss": 2.4017, "step": 8584 }, { "epoch": 0.11, "learning_rate": 0.0001955774538756074, "loss": 2.4086, "step": 8592 }, { "epoch": 0.11, "learning_rate": 0.00019556862470528625, "loss": 2.4054, "step": 8600 }, { "epoch": 0.11, "learning_rate": 0.00019555978695291694, "loss": 2.413, "step": 8608 }, { "epoch": 0.11, "learning_rate": 0.00019555094061938578, "loss": 2.3965, "step": 8616 }, { "epoch": 0.11, "learning_rate": 0.00019554208570558005, "loss": 2.4004, "step": 8624 }, { "epoch": 0.11, "learning_rate": 0.0001955332222123878, "loss": 2.3984, "step": 8632 }, { "epoch": 0.11, "learning_rate": 0.00019552435014069805, "loss": 2.4077, "step": 8640 }, { "epoch": 0.11, "learning_rate": 0.0001955154694914006, "loss": 2.4086, "step": 8648 }, { "epoch": 0.11, "learning_rate": 0.00019550658026538614, "loss": 2.403, "step": 8656 }, { "epoch": 0.11, "learning_rate": 0.0001954976824635461, "loss": 2.4241, "step": 8664 }, { "epoch": 0.11, "learning_rate": 0.00019548877608677304, "loss": 2.4181, "step": 8672 }, { "epoch": 0.11, "learning_rate": 0.0001954798611359601, "loss": 2.4077, "step": 8680 }, { "epoch": 0.11, "learning_rate": 0.00019547093761200146, "loss": 2.3978, "step": 8688 }, { "epoch": 0.11, "learning_rate": 0.00019546200551579212, "loss": 2.406, "step": 8696 }, { "epoch": 0.11, "learning_rate": 0.00019545306484822784, "loss": 2.4211, "step": 8704 }, { "epoch": 0.11, "learning_rate": 0.00019544411561020535, "loss": 2.398, "step": 8712 }, { "epoch": 0.11, "learning_rate": 0.00019543515780262225, "loss": 2.3854, "step": 8720 }, { "epoch": 0.11, "learning_rate": 0.0001954261914263769, "loss": 2.3961, "step": 8728 }, { "epoch": 0.11, "learning_rate": 0.00019541721648236863, "loss": 2.4074, "step": 8736 }, { "epoch": 0.11, "learning_rate": 0.0001954082329714975, "loss": 2.4012, "step": 8744 }, { "epoch": 0.11, "learning_rate": 0.00019539924089466459, "loss": 2.396, "step": 8752 }, { "epoch": 0.11, "learning_rate": 0.0001953902402527717, "loss": 2.4133, "step": 8760 }, { "epoch": 0.11, "learning_rate": 0.00019538123104672158, "loss": 2.4083, "step": 8768 }, { "epoch": 0.11, "learning_rate": 0.00019537221327741778, "loss": 2.3939, "step": 8776 }, { "epoch": 0.11, "learning_rate": 0.00019536318694576472, "loss": 2.3961, "step": 8784 }, { "epoch": 0.11, "learning_rate": 0.0001953541520526677, "loss": 2.4101, "step": 8792 }, { "epoch": 0.11, "learning_rate": 0.0001953451085990329, "loss": 2.4035, "step": 8800 }, { "epoch": 0.11, "learning_rate": 0.00019533605658576727, "loss": 2.3905, "step": 8808 }, { "epoch": 0.11, "learning_rate": 0.0001953269960137787, "loss": 2.4051, "step": 8816 }, { "epoch": 0.11, "learning_rate": 0.00019531792688397596, "loss": 2.4191, "step": 8824 }, { "epoch": 0.11, "learning_rate": 0.00019530884919726854, "loss": 2.4101, "step": 8832 }, { "epoch": 0.11, "learning_rate": 0.00019529976295456697, "loss": 2.3873, "step": 8840 }, { "epoch": 0.11, "learning_rate": 0.00019529066815678251, "loss": 2.408, "step": 8848 }, { "epoch": 0.11, "learning_rate": 0.0001952815648048273, "loss": 2.4048, "step": 8856 }, { "epoch": 0.11, "learning_rate": 0.00019527245289961437, "loss": 2.3951, "step": 8864 }, { "epoch": 0.11, "learning_rate": 0.00019526333244205762, "loss": 2.416, "step": 8872 }, { "epoch": 0.11, "learning_rate": 0.00019525420343307172, "loss": 2.3938, "step": 8880 }, { "epoch": 0.11, "learning_rate": 0.0001952450658735723, "loss": 2.4105, "step": 8888 }, { "epoch": 0.11, "learning_rate": 0.00019523591976447583, "loss": 2.4079, "step": 8896 }, { "epoch": 0.11, "learning_rate": 0.00019522676510669954, "loss": 2.4108, "step": 8904 }, { "epoch": 0.11, "learning_rate": 0.00019521760190116167, "loss": 2.4022, "step": 8912 }, { "epoch": 0.11, "learning_rate": 0.0001952084301487812, "loss": 2.3883, "step": 8920 }, { "epoch": 0.11, "learning_rate": 0.00019519924985047794, "loss": 2.4126, "step": 8928 }, { "epoch": 0.11, "learning_rate": 0.00019519006100717274, "loss": 2.423, "step": 8936 }, { "epoch": 0.11, "learning_rate": 0.00019518086361978713, "loss": 2.4109, "step": 8944 }, { "epoch": 0.11, "learning_rate": 0.00019517165768924354, "loss": 2.4021, "step": 8952 }, { "epoch": 0.11, "learning_rate": 0.00019516244321646532, "loss": 2.4075, "step": 8960 }, { "epoch": 0.11, "learning_rate": 0.00019515322020237662, "loss": 2.385, "step": 8968 }, { "epoch": 0.11, "learning_rate": 0.0001951439886479024, "loss": 2.4168, "step": 8976 }, { "epoch": 0.11, "learning_rate": 0.00019513474855396856, "loss": 2.4148, "step": 8984 }, { "epoch": 0.11, "learning_rate": 0.00019512549992150186, "loss": 2.4234, "step": 8992 }, { "epoch": 0.11, "learning_rate": 0.00019511624275142986, "loss": 2.411, "step": 9000 }, { "epoch": 0.11, "learning_rate": 0.00019510697704468099, "loss": 2.4034, "step": 9008 }, { "epoch": 0.11, "learning_rate": 0.0001950977028021846, "loss": 2.4339, "step": 9016 }, { "epoch": 0.11, "learning_rate": 0.0001950884200248708, "loss": 2.4157, "step": 9024 }, { "epoch": 0.11, "learning_rate": 0.00019507912871367063, "loss": 2.4059, "step": 9032 }, { "epoch": 0.11, "learning_rate": 0.0001950698288695159, "loss": 2.406, "step": 9040 }, { "epoch": 0.11, "learning_rate": 0.00019506052049333937, "loss": 2.4054, "step": 9048 }, { "epoch": 0.11, "learning_rate": 0.00019505120358607463, "loss": 2.3838, "step": 9056 }, { "epoch": 0.11, "learning_rate": 0.00019504187814865608, "loss": 2.4067, "step": 9064 }, { "epoch": 0.11, "learning_rate": 0.00019503254418201904, "loss": 2.3902, "step": 9072 }, { "epoch": 0.11, "learning_rate": 0.00019502320168709962, "loss": 2.4173, "step": 9080 }, { "epoch": 0.11, "learning_rate": 0.00019501385066483484, "loss": 2.4129, "step": 9088 }, { "epoch": 0.11, "learning_rate": 0.00019500449111616258, "loss": 2.4028, "step": 9096 }, { "epoch": 0.11, "learning_rate": 0.0001949951230420215, "loss": 2.4211, "step": 9104 }, { "epoch": 0.11, "learning_rate": 0.00019498574644335123, "loss": 2.4257, "step": 9112 }, { "epoch": 0.11, "learning_rate": 0.00019497636132109208, "loss": 2.4118, "step": 9120 }, { "epoch": 0.11, "learning_rate": 0.00019496696767618544, "loss": 2.4061, "step": 9128 }, { "epoch": 0.11, "learning_rate": 0.00019495756550957338, "loss": 2.4011, "step": 9136 }, { "epoch": 0.11, "learning_rate": 0.00019494815482219886, "loss": 2.4206, "step": 9144 }, { "epoch": 0.11, "learning_rate": 0.0001949387356150058, "loss": 2.4149, "step": 9152 }, { "epoch": 0.11, "learning_rate": 0.0001949293078889388, "loss": 2.4166, "step": 9160 }, { "epoch": 0.11, "learning_rate": 0.00019491987164494353, "loss": 2.4275, "step": 9168 }, { "epoch": 0.11, "learning_rate": 0.0001949104268839663, "loss": 2.3892, "step": 9176 }, { "epoch": 0.11, "learning_rate": 0.00019490097360695433, "loss": 2.4166, "step": 9184 }, { "epoch": 0.11, "learning_rate": 0.0001948915118148558, "loss": 2.408, "step": 9192 }, { "epoch": 0.12, "learning_rate": 0.00019488204150861968, "loss": 2.4122, "step": 9200 }, { "epoch": 0.12, "learning_rate": 0.00019487256268919573, "loss": 2.4185, "step": 9208 }, { "epoch": 0.12, "learning_rate": 0.0001948630753575347, "loss": 2.3912, "step": 9216 }, { "epoch": 0.12, "learning_rate": 0.00019485357951458808, "loss": 2.4062, "step": 9224 }, { "epoch": 0.12, "learning_rate": 0.00019484407516130817, "loss": 2.3918, "step": 9232 }, { "epoch": 0.12, "learning_rate": 0.0001948345622986483, "loss": 2.3841, "step": 9240 }, { "epoch": 0.12, "learning_rate": 0.0001948250409275626, "loss": 2.4323, "step": 9248 }, { "epoch": 0.12, "learning_rate": 0.00019481551104900583, "loss": 2.3951, "step": 9256 }, { "epoch": 0.12, "learning_rate": 0.00019480597266393398, "loss": 2.3887, "step": 9264 }, { "epoch": 0.12, "learning_rate": 0.0001947964257733036, "loss": 2.4072, "step": 9272 }, { "epoch": 0.12, "learning_rate": 0.00019478687037807215, "loss": 2.4259, "step": 9280 }, { "epoch": 0.12, "learning_rate": 0.00019477730647919807, "loss": 2.4183, "step": 9288 }, { "epoch": 0.12, "learning_rate": 0.00019476773407764049, "loss": 2.4153, "step": 9296 }, { "epoch": 0.12, "learning_rate": 0.00019475815317435952, "loss": 2.4182, "step": 9304 }, { "epoch": 0.12, "learning_rate": 0.0001947485637703161, "loss": 2.4176, "step": 9312 }, { "epoch": 0.12, "learning_rate": 0.00019473896586647186, "loss": 2.4123, "step": 9320 }, { "epoch": 0.12, "learning_rate": 0.00019472935946378956, "loss": 2.3762, "step": 9328 }, { "epoch": 0.12, "learning_rate": 0.0001947197445632326, "loss": 2.4025, "step": 9336 }, { "epoch": 0.12, "learning_rate": 0.0001947101211657653, "loss": 2.4291, "step": 9344 }, { "epoch": 0.12, "learning_rate": 0.00019470048927235285, "loss": 2.3911, "step": 9352 }, { "epoch": 0.12, "learning_rate": 0.00019469084888396122, "loss": 2.4181, "step": 9360 }, { "epoch": 0.12, "learning_rate": 0.0001946812000015574, "loss": 2.4105, "step": 9368 }, { "epoch": 0.12, "learning_rate": 0.000194671542626109, "loss": 2.4023, "step": 9376 }, { "epoch": 0.12, "learning_rate": 0.0001946618767585847, "loss": 2.4063, "step": 9384 }, { "epoch": 0.12, "learning_rate": 0.00019465220239995383, "loss": 2.4072, "step": 9392 }, { "epoch": 0.12, "learning_rate": 0.00019464251955118677, "loss": 2.4167, "step": 9400 }, { "epoch": 0.12, "learning_rate": 0.00019463282821325457, "loss": 2.4303, "step": 9408 }, { "epoch": 0.12, "learning_rate": 0.0001946231283871293, "loss": 2.3933, "step": 9416 }, { "epoch": 0.12, "learning_rate": 0.0001946134200737837, "loss": 2.4019, "step": 9424 }, { "epoch": 0.12, "learning_rate": 0.00019460370327419155, "loss": 2.4053, "step": 9432 }, { "epoch": 0.12, "learning_rate": 0.00019459397798932734, "loss": 2.4121, "step": 9440 }, { "epoch": 0.12, "learning_rate": 0.00019458424422016648, "loss": 2.4365, "step": 9448 }, { "epoch": 0.12, "learning_rate": 0.00019457450196768518, "loss": 2.4131, "step": 9456 }, { "epoch": 0.12, "learning_rate": 0.00019456475123286058, "loss": 2.386, "step": 9464 }, { "epoch": 0.12, "learning_rate": 0.0001945549920166706, "loss": 2.3913, "step": 9472 }, { "epoch": 0.12, "learning_rate": 0.00019454522432009404, "loss": 2.4037, "step": 9480 }, { "epoch": 0.12, "learning_rate": 0.00019453544814411055, "loss": 2.3996, "step": 9488 }, { "epoch": 0.12, "learning_rate": 0.00019452566348970057, "loss": 2.411, "step": 9496 }, { "epoch": 0.12, "learning_rate": 0.00019451587035784556, "loss": 2.4048, "step": 9504 }, { "epoch": 0.12, "learning_rate": 0.00019450606874952758, "loss": 2.4188, "step": 9512 }, { "epoch": 0.12, "learning_rate": 0.00019449625866572982, "loss": 2.3966, "step": 9520 }, { "epoch": 0.12, "learning_rate": 0.00019448644010743604, "loss": 2.4092, "step": 9528 }, { "epoch": 0.12, "learning_rate": 0.00019447661307563102, "loss": 2.4065, "step": 9536 }, { "epoch": 0.12, "learning_rate": 0.00019446677757130042, "loss": 2.3949, "step": 9544 }, { "epoch": 0.12, "learning_rate": 0.00019445693359543064, "loss": 2.3914, "step": 9552 }, { "epoch": 0.12, "learning_rate": 0.000194447081149009, "loss": 2.4077, "step": 9560 }, { "epoch": 0.12, "learning_rate": 0.0001944372202330236, "loss": 2.4113, "step": 9568 }, { "epoch": 0.12, "learning_rate": 0.00019442735084846343, "loss": 2.4031, "step": 9576 }, { "epoch": 0.12, "learning_rate": 0.00019441747299631841, "loss": 2.4068, "step": 9584 }, { "epoch": 0.12, "learning_rate": 0.00019440758667757914, "loss": 2.4021, "step": 9592 }, { "epoch": 0.12, "learning_rate": 0.00019439769189323727, "loss": 2.3959, "step": 9600 }, { "epoch": 0.12, "learning_rate": 0.00019438778864428507, "loss": 2.3896, "step": 9608 }, { "epoch": 0.12, "learning_rate": 0.00019437787693171588, "loss": 2.4095, "step": 9616 }, { "epoch": 0.12, "learning_rate": 0.00019436795675652367, "loss": 2.4162, "step": 9624 }, { "epoch": 0.12, "learning_rate": 0.0001943580281197035, "loss": 2.3949, "step": 9632 }, { "epoch": 0.12, "learning_rate": 0.00019434809102225113, "loss": 2.3892, "step": 9640 }, { "epoch": 0.12, "learning_rate": 0.00019433814546516314, "loss": 2.4045, "step": 9648 }, { "epoch": 0.12, "learning_rate": 0.00019432819144943707, "loss": 2.3994, "step": 9656 }, { "epoch": 0.12, "learning_rate": 0.00019431822897607122, "loss": 2.3975, "step": 9664 }, { "epoch": 0.12, "learning_rate": 0.0001943082580460648, "loss": 2.4102, "step": 9672 }, { "epoch": 0.12, "learning_rate": 0.00019429827866041777, "loss": 2.387, "step": 9680 }, { "epoch": 0.12, "learning_rate": 0.00019428829082013106, "loss": 2.3991, "step": 9688 }, { "epoch": 0.12, "learning_rate": 0.00019427829452620641, "loss": 2.4186, "step": 9696 }, { "epoch": 0.12, "learning_rate": 0.00019426828977964634, "loss": 2.4008, "step": 9704 }, { "epoch": 0.12, "learning_rate": 0.00019425827658145432, "loss": 2.4016, "step": 9712 }, { "epoch": 0.12, "learning_rate": 0.0001942482549326346, "loss": 2.3905, "step": 9720 }, { "epoch": 0.12, "learning_rate": 0.00019423822483419226, "loss": 2.423, "step": 9728 }, { "epoch": 0.12, "learning_rate": 0.00019422818628713327, "loss": 2.3927, "step": 9736 }, { "epoch": 0.12, "learning_rate": 0.00019421813929246451, "loss": 2.403, "step": 9744 }, { "epoch": 0.12, "learning_rate": 0.00019420808385119353, "loss": 2.4096, "step": 9752 }, { "epoch": 0.12, "learning_rate": 0.00019419801996432894, "loss": 2.4053, "step": 9760 }, { "epoch": 0.12, "learning_rate": 0.00019418794763288, "loss": 2.4083, "step": 9768 }, { "epoch": 0.12, "learning_rate": 0.000194177866857857, "loss": 2.4248, "step": 9776 }, { "epoch": 0.12, "learning_rate": 0.0001941677776402709, "loss": 2.3963, "step": 9784 }, { "epoch": 0.12, "learning_rate": 0.0001941576799811336, "loss": 2.4204, "step": 9792 }, { "epoch": 0.12, "learning_rate": 0.00019414757388145788, "loss": 2.3917, "step": 9800 }, { "epoch": 0.12, "learning_rate": 0.0001941374593422573, "loss": 2.4247, "step": 9808 }, { "epoch": 0.12, "learning_rate": 0.00019412733636454632, "loss": 2.4044, "step": 9816 }, { "epoch": 0.12, "learning_rate": 0.00019411720494934019, "loss": 2.4155, "step": 9824 }, { "epoch": 0.12, "learning_rate": 0.00019410706509765503, "loss": 2.413, "step": 9832 }, { "epoch": 0.12, "learning_rate": 0.00019409691681050782, "loss": 2.4246, "step": 9840 }, { "epoch": 0.12, "learning_rate": 0.00019408676008891637, "loss": 2.4097, "step": 9848 }, { "epoch": 0.12, "learning_rate": 0.00019407659493389935, "loss": 2.418, "step": 9856 }, { "epoch": 0.12, "learning_rate": 0.00019406642134647625, "loss": 2.4174, "step": 9864 }, { "epoch": 0.12, "learning_rate": 0.00019405623932766743, "loss": 2.3935, "step": 9872 }, { "epoch": 0.12, "learning_rate": 0.00019404604887849413, "loss": 2.4197, "step": 9880 }, { "epoch": 0.12, "learning_rate": 0.00019403584999997832, "loss": 2.4144, "step": 9888 }, { "epoch": 0.12, "learning_rate": 0.00019402564269314294, "loss": 2.4046, "step": 9896 }, { "epoch": 0.12, "learning_rate": 0.0001940154269590117, "loss": 2.4087, "step": 9904 }, { "epoch": 0.12, "learning_rate": 0.00019400520279860926, "loss": 2.3906, "step": 9912 }, { "epoch": 0.12, "learning_rate": 0.0001939949702129609, "loss": 2.4114, "step": 9920 }, { "epoch": 0.12, "learning_rate": 0.000193984729203093, "loss": 2.4047, "step": 9928 }, { "epoch": 0.12, "learning_rate": 0.00019397447977003264, "loss": 2.4079, "step": 9936 }, { "epoch": 0.12, "learning_rate": 0.00019396422191480782, "loss": 2.4078, "step": 9944 }, { "epoch": 0.12, "learning_rate": 0.00019395395563844725, "loss": 2.4187, "step": 9952 }, { "epoch": 0.12, "learning_rate": 0.00019394368094198067, "loss": 2.4035, "step": 9960 }, { "epoch": 0.12, "learning_rate": 0.00019393339782643854, "loss": 2.3984, "step": 9968 }, { "epoch": 0.12, "learning_rate": 0.00019392310629285219, "loss": 2.394, "step": 9976 }, { "epoch": 0.12, "learning_rate": 0.00019391280634225387, "loss": 2.3946, "step": 9984 }, { "epoch": 0.12, "learning_rate": 0.00019390249797567648, "loss": 2.404, "step": 9992 }, { "epoch": 0.12, "learning_rate": 0.00019389218119415398, "loss": 2.3919, "step": 10000 }, { "epoch": 0.13, "learning_rate": 0.0001938818559987211, "loss": 2.3999, "step": 10008 }, { "epoch": 0.13, "learning_rate": 0.00019387152239041332, "loss": 2.4205, "step": 10016 }, { "epoch": 0.13, "learning_rate": 0.00019386118037026707, "loss": 2.3882, "step": 10024 }, { "epoch": 0.13, "learning_rate": 0.00019385082993931966, "loss": 2.3965, "step": 10032 }, { "epoch": 0.13, "learning_rate": 0.00019384047109860913, "loss": 2.4062, "step": 10040 }, { "epoch": 0.13, "learning_rate": 0.00019383010384917438, "loss": 2.4062, "step": 10048 }, { "epoch": 0.13, "learning_rate": 0.00019381972819205526, "loss": 2.418, "step": 10056 }, { "epoch": 0.13, "learning_rate": 0.00019380934412829232, "loss": 2.4023, "step": 10064 }, { "epoch": 0.13, "learning_rate": 0.0001937989516589271, "loss": 2.4137, "step": 10072 }, { "epoch": 0.13, "learning_rate": 0.0001937885507850018, "loss": 2.4112, "step": 10080 }, { "epoch": 0.13, "learning_rate": 0.00019377814150755963, "loss": 2.3932, "step": 10088 }, { "epoch": 0.13, "learning_rate": 0.00019376772382764465, "loss": 2.387, "step": 10096 }, { "epoch": 0.13, "learning_rate": 0.00019375729774630157, "loss": 2.379, "step": 10104 }, { "epoch": 0.13, "learning_rate": 0.00019374686326457613, "loss": 2.4042, "step": 10112 }, { "epoch": 0.13, "learning_rate": 0.00019373642038351483, "loss": 2.4076, "step": 10120 }, { "epoch": 0.13, "learning_rate": 0.00019372596910416506, "loss": 2.4092, "step": 10128 }, { "epoch": 0.13, "learning_rate": 0.000193715509427575, "loss": 2.4144, "step": 10136 }, { "epoch": 0.13, "learning_rate": 0.0001937050413547937, "loss": 2.3994, "step": 10144 }, { "epoch": 0.13, "learning_rate": 0.00019369456488687106, "loss": 2.4128, "step": 10152 }, { "epoch": 0.13, "learning_rate": 0.0001936840800248578, "loss": 2.3965, "step": 10160 }, { "epoch": 0.13, "learning_rate": 0.00019367358676980546, "loss": 2.3984, "step": 10168 }, { "epoch": 0.13, "learning_rate": 0.00019366308512276653, "loss": 2.4089, "step": 10176 }, { "epoch": 0.13, "learning_rate": 0.0001936525750847942, "loss": 2.4114, "step": 10184 }, { "epoch": 0.13, "learning_rate": 0.00019364205665694262, "loss": 2.4011, "step": 10192 }, { "epoch": 0.13, "learning_rate": 0.00019363152984026668, "loss": 2.3928, "step": 10200 }, { "epoch": 0.13, "learning_rate": 0.00019362099463582217, "loss": 2.3791, "step": 10208 }, { "epoch": 0.13, "learning_rate": 0.00019361045104466574, "loss": 2.3928, "step": 10216 }, { "epoch": 0.13, "learning_rate": 0.0001935998990678548, "loss": 2.4021, "step": 10224 }, { "epoch": 0.13, "learning_rate": 0.00019358933870644774, "loss": 2.3935, "step": 10232 }, { "epoch": 0.13, "learning_rate": 0.00019357876996150362, "loss": 2.4221, "step": 10240 }, { "epoch": 0.13, "learning_rate": 0.00019356819283408242, "loss": 2.4058, "step": 10248 }, { "epoch": 0.13, "learning_rate": 0.00019355760732524507, "loss": 2.3928, "step": 10256 }, { "epoch": 0.13, "learning_rate": 0.00019354701343605313, "loss": 2.3875, "step": 10264 }, { "epoch": 0.13, "learning_rate": 0.00019353641116756913, "loss": 2.4003, "step": 10272 }, { "epoch": 0.13, "learning_rate": 0.00019352580052085647, "loss": 2.3862, "step": 10280 }, { "epoch": 0.13, "learning_rate": 0.0001935151814969793, "loss": 2.4032, "step": 10288 }, { "epoch": 0.13, "learning_rate": 0.0001935045540970026, "loss": 2.4051, "step": 10296 }, { "epoch": 0.13, "learning_rate": 0.00019349391832199235, "loss": 2.4073, "step": 10304 }, { "epoch": 0.13, "learning_rate": 0.00019348327417301517, "loss": 2.4072, "step": 10312 }, { "epoch": 0.13, "learning_rate": 0.00019347262165113864, "loss": 2.3915, "step": 10320 }, { "epoch": 0.13, "learning_rate": 0.00019346196075743113, "loss": 2.3974, "step": 10328 }, { "epoch": 0.13, "learning_rate": 0.00019345129149296188, "loss": 2.4104, "step": 10336 }, { "epoch": 0.13, "learning_rate": 0.00019344061385880094, "loss": 2.391, "step": 10344 }, { "epoch": 0.13, "learning_rate": 0.00019342992785601927, "loss": 2.3983, "step": 10352 }, { "epoch": 0.13, "learning_rate": 0.00019341923348568853, "loss": 2.3955, "step": 10360 }, { "epoch": 0.13, "learning_rate": 0.0001934085307488814, "loss": 2.3923, "step": 10368 }, { "epoch": 0.13, "learning_rate": 0.00019339781964667122, "loss": 2.3957, "step": 10376 }, { "epoch": 0.13, "learning_rate": 0.00019338710018013228, "loss": 2.4006, "step": 10384 }, { "epoch": 0.13, "learning_rate": 0.0001933763723503397, "loss": 2.398, "step": 10392 }, { "epoch": 0.13, "learning_rate": 0.0001933656361583694, "loss": 2.4, "step": 10400 }, { "epoch": 0.13, "learning_rate": 0.00019335489160529818, "loss": 2.405, "step": 10408 }, { "epoch": 0.13, "learning_rate": 0.00019334413869220363, "loss": 2.4081, "step": 10416 }, { "epoch": 0.13, "learning_rate": 0.00019333337742016425, "loss": 2.4103, "step": 10424 }, { "epoch": 0.13, "learning_rate": 0.00019332260779025931, "loss": 2.4046, "step": 10432 }, { "epoch": 0.13, "learning_rate": 0.00019331182980356892, "loss": 2.3788, "step": 10440 }, { "epoch": 0.13, "learning_rate": 0.0001933010434611741, "loss": 2.3966, "step": 10448 }, { "epoch": 0.13, "learning_rate": 0.00019329024876415661, "loss": 2.3871, "step": 10456 }, { "epoch": 0.13, "learning_rate": 0.00019327944571359912, "loss": 2.3946, "step": 10464 }, { "epoch": 0.13, "learning_rate": 0.00019326863431058512, "loss": 2.4228, "step": 10472 }, { "epoch": 0.13, "learning_rate": 0.00019325781455619892, "loss": 2.3953, "step": 10480 }, { "epoch": 0.13, "learning_rate": 0.0001932469864515257, "loss": 2.3816, "step": 10488 }, { "epoch": 0.13, "learning_rate": 0.0001932361499976514, "loss": 2.396, "step": 10496 }, { "epoch": 0.13, "learning_rate": 0.00019322530519566293, "loss": 2.3901, "step": 10504 }, { "epoch": 0.13, "learning_rate": 0.00019321445204664793, "loss": 2.3853, "step": 10512 }, { "epoch": 0.13, "learning_rate": 0.00019320359055169487, "loss": 2.4011, "step": 10520 }, { "epoch": 0.13, "learning_rate": 0.00019319272071189318, "loss": 2.4012, "step": 10528 }, { "epoch": 0.13, "learning_rate": 0.00019318184252833297, "loss": 2.3994, "step": 10536 }, { "epoch": 0.13, "learning_rate": 0.0001931709560021053, "loss": 2.3926, "step": 10544 }, { "epoch": 0.13, "learning_rate": 0.00019316006113430202, "loss": 2.395, "step": 10552 }, { "epoch": 0.13, "learning_rate": 0.00019314915792601581, "loss": 2.4044, "step": 10560 }, { "epoch": 0.13, "learning_rate": 0.00019313824637834023, "loss": 2.3973, "step": 10568 }, { "epoch": 0.13, "learning_rate": 0.0001931273264923696, "loss": 2.3845, "step": 10576 }, { "epoch": 0.13, "learning_rate": 0.00019311639826919918, "loss": 2.396, "step": 10584 }, { "epoch": 0.13, "learning_rate": 0.00019310546170992493, "loss": 2.4032, "step": 10592 }, { "epoch": 0.13, "learning_rate": 0.00019309451681564382, "loss": 2.4047, "step": 10600 }, { "epoch": 0.13, "learning_rate": 0.0001930835635874535, "loss": 2.3954, "step": 10608 }, { "epoch": 0.13, "learning_rate": 0.0001930726020264525, "loss": 2.3902, "step": 10616 }, { "epoch": 0.13, "learning_rate": 0.00019306163213374025, "loss": 2.3962, "step": 10624 }, { "epoch": 0.13, "learning_rate": 0.00019305065391041695, "loss": 2.3868, "step": 10632 }, { "epoch": 0.13, "learning_rate": 0.00019303966735758366, "loss": 2.3881, "step": 10640 }, { "epoch": 0.13, "learning_rate": 0.00019302867247634225, "loss": 2.4076, "step": 10648 }, { "epoch": 0.13, "learning_rate": 0.0001930176692677955, "loss": 2.3905, "step": 10656 }, { "epoch": 0.13, "learning_rate": 0.00019300665773304686, "loss": 2.3978, "step": 10664 }, { "epoch": 0.13, "learning_rate": 0.00019299563787320082, "loss": 2.392, "step": 10672 }, { "epoch": 0.13, "learning_rate": 0.0001929846096893626, "loss": 2.3802, "step": 10680 }, { "epoch": 0.13, "learning_rate": 0.00019297357318263822, "loss": 2.3949, "step": 10688 }, { "epoch": 0.13, "learning_rate": 0.0001929625283541346, "loss": 2.4079, "step": 10696 }, { "epoch": 0.13, "learning_rate": 0.0001929514752049595, "loss": 2.4035, "step": 10704 }, { "epoch": 0.13, "learning_rate": 0.00019294041373622148, "loss": 2.4049, "step": 10712 }, { "epoch": 0.13, "learning_rate": 0.00019292934394902987, "loss": 2.3937, "step": 10720 }, { "epoch": 0.13, "learning_rate": 0.00019291826584449503, "loss": 2.3969, "step": 10728 }, { "epoch": 0.13, "learning_rate": 0.00019290717942372794, "loss": 2.3707, "step": 10736 }, { "epoch": 0.13, "learning_rate": 0.00019289608468784053, "loss": 2.3787, "step": 10744 }, { "epoch": 0.13, "learning_rate": 0.00019288498163794554, "loss": 2.4003, "step": 10752 }, { "epoch": 0.13, "learning_rate": 0.00019287387027515653, "loss": 2.3972, "step": 10760 }, { "epoch": 0.13, "learning_rate": 0.00019286275060058795, "loss": 2.4054, "step": 10768 }, { "epoch": 0.13, "learning_rate": 0.00019285162261535496, "loss": 2.3946, "step": 10776 }, { "epoch": 0.13, "learning_rate": 0.00019284048632057374, "loss": 2.3795, "step": 10784 }, { "epoch": 0.13, "learning_rate": 0.0001928293417173611, "loss": 2.4216, "step": 10792 }, { "epoch": 0.14, "learning_rate": 0.00019281818880683487, "loss": 2.3951, "step": 10800 }, { "epoch": 0.14, "learning_rate": 0.00019280702759011354, "loss": 2.3861, "step": 10808 }, { "epoch": 0.14, "learning_rate": 0.00019279585806831657, "loss": 2.3896, "step": 10816 }, { "epoch": 0.14, "learning_rate": 0.00019278468024256417, "loss": 2.4081, "step": 10824 }, { "epoch": 0.14, "learning_rate": 0.00019277349411397744, "loss": 2.3815, "step": 10832 }, { "epoch": 0.14, "learning_rate": 0.00019276229968367826, "loss": 2.4099, "step": 10840 }, { "epoch": 0.14, "learning_rate": 0.0001927510969527894, "loss": 2.403, "step": 10848 }, { "epoch": 0.14, "learning_rate": 0.00019273988592243438, "loss": 2.4118, "step": 10856 }, { "epoch": 0.14, "learning_rate": 0.00019272866659373765, "loss": 2.4056, "step": 10864 }, { "epoch": 0.14, "learning_rate": 0.00019271743896782443, "loss": 2.4091, "step": 10872 }, { "epoch": 0.14, "learning_rate": 0.00019270620304582078, "loss": 2.3838, "step": 10880 }, { "epoch": 0.14, "learning_rate": 0.0001926949588288536, "loss": 2.4042, "step": 10888 }, { "epoch": 0.14, "learning_rate": 0.0001926837063180506, "loss": 2.3995, "step": 10896 }, { "epoch": 0.14, "learning_rate": 0.0001926724455145404, "loss": 2.4141, "step": 10904 }, { "epoch": 0.14, "learning_rate": 0.00019266117641945235, "loss": 2.3887, "step": 10912 }, { "epoch": 0.14, "learning_rate": 0.0001926498990339167, "loss": 2.4013, "step": 10920 }, { "epoch": 0.14, "learning_rate": 0.0001926386133590645, "loss": 2.4007, "step": 10928 }, { "epoch": 0.14, "learning_rate": 0.0001926273193960276, "loss": 2.3902, "step": 10936 }, { "epoch": 0.14, "learning_rate": 0.0001926160171459388, "loss": 2.4156, "step": 10944 }, { "epoch": 0.14, "learning_rate": 0.0001926047066099316, "loss": 2.4051, "step": 10952 }, { "epoch": 0.14, "learning_rate": 0.00019259338778914036, "loss": 2.3947, "step": 10960 }, { "epoch": 0.14, "learning_rate": 0.00019258206068470035, "loss": 2.3846, "step": 10968 }, { "epoch": 0.14, "learning_rate": 0.0001925707252977476, "loss": 2.3745, "step": 10976 }, { "epoch": 0.14, "learning_rate": 0.00019255938162941898, "loss": 2.3938, "step": 10984 }, { "epoch": 0.14, "learning_rate": 0.00019254802968085216, "loss": 2.3954, "step": 10992 }, { "epoch": 0.14, "learning_rate": 0.00019253666945318572, "loss": 2.3911, "step": 11000 }, { "epoch": 0.14, "learning_rate": 0.00019252530094755898, "loss": 2.4118, "step": 11008 }, { "epoch": 0.14, "learning_rate": 0.00019251392416511225, "loss": 2.3904, "step": 11016 }, { "epoch": 0.14, "learning_rate": 0.0001925025391069864, "loss": 2.3712, "step": 11024 }, { "epoch": 0.14, "learning_rate": 0.0001924911457743234, "loss": 2.4212, "step": 11032 }, { "epoch": 0.14, "learning_rate": 0.00019247974416826587, "loss": 2.3729, "step": 11040 }, { "epoch": 0.14, "learning_rate": 0.0001924683342899574, "loss": 2.3915, "step": 11048 }, { "epoch": 0.14, "learning_rate": 0.00019245691614054226, "loss": 2.3949, "step": 11056 }, { "epoch": 0.14, "learning_rate": 0.00019244548972116566, "loss": 2.3909, "step": 11064 }, { "epoch": 0.14, "learning_rate": 0.00019243405503297357, "loss": 2.4039, "step": 11072 }, { "epoch": 0.14, "learning_rate": 0.0001924226120771129, "loss": 2.378, "step": 11080 }, { "epoch": 0.14, "learning_rate": 0.00019241116085473128, "loss": 2.3805, "step": 11088 }, { "epoch": 0.14, "learning_rate": 0.00019239970136697716, "loss": 2.3944, "step": 11096 }, { "epoch": 0.14, "learning_rate": 0.00019238823361499995, "loss": 2.4051, "step": 11104 }, { "epoch": 0.14, "learning_rate": 0.0001923767575999497, "loss": 2.4014, "step": 11112 }, { "epoch": 0.14, "learning_rate": 0.00019236527332297746, "loss": 2.4039, "step": 11120 }, { "epoch": 0.14, "learning_rate": 0.00019235378078523498, "loss": 2.3894, "step": 11128 }, { "epoch": 0.14, "learning_rate": 0.00019234227998787492, "loss": 2.3844, "step": 11136 }, { "epoch": 0.14, "learning_rate": 0.0001923307709320508, "loss": 2.4063, "step": 11144 }, { "epoch": 0.14, "learning_rate": 0.00019231925361891682, "loss": 2.4008, "step": 11152 }, { "epoch": 0.14, "learning_rate": 0.0001923077280496282, "loss": 2.394, "step": 11160 }, { "epoch": 0.14, "learning_rate": 0.0001922961942253408, "loss": 2.4016, "step": 11168 }, { "epoch": 0.14, "learning_rate": 0.00019228465214721145, "loss": 2.4011, "step": 11176 }, { "epoch": 0.14, "learning_rate": 0.00019227310181639775, "loss": 2.4036, "step": 11184 }, { "epoch": 0.14, "learning_rate": 0.00019226154323405813, "loss": 2.4048, "step": 11192 }, { "epoch": 0.14, "learning_rate": 0.0001922499764013518, "loss": 2.3917, "step": 11200 }, { "epoch": 0.14, "learning_rate": 0.0001922384013194389, "loss": 2.4117, "step": 11208 }, { "epoch": 0.14, "learning_rate": 0.0001922268179894804, "loss": 2.3976, "step": 11216 }, { "epoch": 0.14, "learning_rate": 0.0001922152264126379, "loss": 2.3852, "step": 11224 }, { "epoch": 0.14, "learning_rate": 0.0001922036265900741, "loss": 2.3877, "step": 11232 }, { "epoch": 0.14, "learning_rate": 0.0001921920185229523, "loss": 2.4108, "step": 11240 }, { "epoch": 0.14, "learning_rate": 0.0001921804022124368, "loss": 2.4057, "step": 11248 }, { "epoch": 0.14, "learning_rate": 0.0001921687776596926, "loss": 2.4048, "step": 11256 }, { "epoch": 0.14, "learning_rate": 0.0001921571448658856, "loss": 2.402, "step": 11264 }, { "epoch": 0.14, "learning_rate": 0.00019214550383218253, "loss": 2.3869, "step": 11272 }, { "epoch": 0.14, "learning_rate": 0.00019213385455975086, "loss": 2.3903, "step": 11280 }, { "epoch": 0.14, "learning_rate": 0.00019212219704975894, "loss": 2.405, "step": 11288 }, { "epoch": 0.14, "learning_rate": 0.00019211053130337605, "loss": 2.4182, "step": 11296 }, { "epoch": 0.14, "learning_rate": 0.0001920988573217721, "loss": 2.3914, "step": 11304 }, { "epoch": 0.14, "learning_rate": 0.00019208717510611797, "loss": 2.3852, "step": 11312 }, { "epoch": 0.14, "learning_rate": 0.0001920754846575853, "loss": 2.3982, "step": 11320 }, { "epoch": 0.14, "learning_rate": 0.00019206378597734657, "loss": 2.3879, "step": 11328 }, { "epoch": 0.14, "learning_rate": 0.00019205207906657513, "loss": 2.3958, "step": 11336 }, { "epoch": 0.14, "learning_rate": 0.0001920403639264451, "loss": 2.4021, "step": 11344 }, { "epoch": 0.14, "learning_rate": 0.0001920286405581314, "loss": 2.4259, "step": 11352 }, { "epoch": 0.14, "learning_rate": 0.00019201690896280987, "loss": 2.3875, "step": 11360 }, { "epoch": 0.14, "learning_rate": 0.00019200516914165712, "loss": 2.4076, "step": 11368 }, { "epoch": 0.14, "learning_rate": 0.00019199342109585055, "loss": 2.3825, "step": 11376 }, { "epoch": 0.14, "learning_rate": 0.00019198166482656842, "loss": 2.3666, "step": 11384 }, { "epoch": 0.14, "learning_rate": 0.00019196990033498986, "loss": 2.3811, "step": 11392 }, { "epoch": 0.14, "learning_rate": 0.0001919581276222948, "loss": 2.3987, "step": 11400 }, { "epoch": 0.14, "learning_rate": 0.00019194634668966392, "loss": 2.3926, "step": 11408 }, { "epoch": 0.14, "learning_rate": 0.00019193455753827878, "loss": 2.3905, "step": 11416 }, { "epoch": 0.14, "learning_rate": 0.00019192276016932183, "loss": 2.3905, "step": 11424 }, { "epoch": 0.14, "learning_rate": 0.00019191095458397618, "loss": 2.3871, "step": 11432 }, { "epoch": 0.14, "learning_rate": 0.00019189914078342595, "loss": 2.4105, "step": 11440 }, { "epoch": 0.14, "learning_rate": 0.00019188731876885597, "loss": 2.4054, "step": 11448 }, { "epoch": 0.14, "learning_rate": 0.0001918754885414519, "loss": 2.411, "step": 11456 }, { "epoch": 0.14, "learning_rate": 0.00019186365010240026, "loss": 2.3928, "step": 11464 }, { "epoch": 0.14, "learning_rate": 0.0001918518034528884, "loss": 2.3947, "step": 11472 }, { "epoch": 0.14, "learning_rate": 0.00019183994859410446, "loss": 2.3808, "step": 11480 }, { "epoch": 0.14, "learning_rate": 0.00019182808552723737, "loss": 2.4019, "step": 11488 }, { "epoch": 0.14, "learning_rate": 0.000191816214253477, "loss": 2.3943, "step": 11496 }, { "epoch": 0.14, "learning_rate": 0.00019180433477401388, "loss": 2.3967, "step": 11504 }, { "epoch": 0.14, "learning_rate": 0.00019179244709003956, "loss": 2.3844, "step": 11512 }, { "epoch": 0.14, "learning_rate": 0.00019178055120274624, "loss": 2.407, "step": 11520 }, { "epoch": 0.14, "learning_rate": 0.00019176864711332705, "loss": 2.394, "step": 11528 }, { "epoch": 0.14, "learning_rate": 0.00019175673482297586, "loss": 2.3861, "step": 11536 }, { "epoch": 0.14, "learning_rate": 0.00019174481433288746, "loss": 2.4107, "step": 11544 }, { "epoch": 0.14, "learning_rate": 0.00019173288564425733, "loss": 2.3898, "step": 11552 }, { "epoch": 0.14, "learning_rate": 0.0001917209487582819, "loss": 2.3807, "step": 11560 }, { "epoch": 0.14, "learning_rate": 0.0001917090036761584, "loss": 2.4037, "step": 11568 }, { "epoch": 0.14, "learning_rate": 0.00019169705039908479, "loss": 2.3935, "step": 11576 }, { "epoch": 0.14, "learning_rate": 0.00019168508892825994, "loss": 2.4099, "step": 11584 }, { "epoch": 0.14, "learning_rate": 0.00019167311926488354, "loss": 2.3978, "step": 11592 }, { "epoch": 0.14, "learning_rate": 0.00019166114141015608, "loss": 2.4021, "step": 11600 }, { "epoch": 0.15, "learning_rate": 0.0001916491553652788, "loss": 2.3752, "step": 11608 }, { "epoch": 0.15, "learning_rate": 0.00019163716113145395, "loss": 2.4018, "step": 11616 }, { "epoch": 0.15, "learning_rate": 0.00019162515870988438, "loss": 2.3985, "step": 11624 }, { "epoch": 0.15, "learning_rate": 0.0001916131481017739, "loss": 2.3943, "step": 11632 }, { "epoch": 0.15, "learning_rate": 0.00019160112930832713, "loss": 2.3845, "step": 11640 }, { "epoch": 0.15, "learning_rate": 0.00019158910233074946, "loss": 2.4047, "step": 11648 }, { "epoch": 0.15, "learning_rate": 0.00019157706717024716, "loss": 2.3881, "step": 11656 }, { "epoch": 0.15, "learning_rate": 0.00019156502382802727, "loss": 2.3916, "step": 11664 }, { "epoch": 0.15, "learning_rate": 0.0001915529723052976, "loss": 2.3867, "step": 11672 }, { "epoch": 0.15, "learning_rate": 0.00019154091260326696, "loss": 2.3928, "step": 11680 }, { "epoch": 0.15, "learning_rate": 0.0001915288447231448, "loss": 2.3753, "step": 11688 }, { "epoch": 0.15, "learning_rate": 0.00019151676866614153, "loss": 2.3932, "step": 11696 }, { "epoch": 0.15, "learning_rate": 0.0001915046844334682, "loss": 2.3908, "step": 11704 }, { "epoch": 0.15, "learning_rate": 0.00019149259202633686, "loss": 2.4105, "step": 11712 }, { "epoch": 0.15, "learning_rate": 0.00019148049144596037, "loss": 2.3955, "step": 11720 }, { "epoch": 0.15, "learning_rate": 0.0001914683826935522, "loss": 2.395, "step": 11728 }, { "epoch": 0.15, "learning_rate": 0.0001914562657703269, "loss": 2.3903, "step": 11736 }, { "epoch": 0.15, "learning_rate": 0.0001914441406774997, "loss": 2.3949, "step": 11744 }, { "epoch": 0.15, "learning_rate": 0.00019143200741628672, "loss": 2.3807, "step": 11752 }, { "epoch": 0.15, "learning_rate": 0.00019141986598790475, "loss": 2.3761, "step": 11760 }, { "epoch": 0.15, "learning_rate": 0.00019140771639357163, "loss": 2.3888, "step": 11768 }, { "epoch": 0.15, "learning_rate": 0.00019139555863450578, "loss": 2.394, "step": 11776 }, { "epoch": 0.15, "learning_rate": 0.00019138339271192664, "loss": 2.3867, "step": 11784 }, { "epoch": 0.15, "learning_rate": 0.00019137121862705436, "loss": 2.3905, "step": 11792 }, { "epoch": 0.15, "learning_rate": 0.00019135903638110993, "loss": 2.3857, "step": 11800 }, { "epoch": 0.15, "learning_rate": 0.00019134684597531514, "loss": 2.3907, "step": 11808 }, { "epoch": 0.15, "learning_rate": 0.00019133464741089262, "loss": 2.3862, "step": 11816 }, { "epoch": 0.15, "learning_rate": 0.00019132244068906587, "loss": 2.3944, "step": 11824 }, { "epoch": 0.15, "learning_rate": 0.0001913102258110591, "loss": 2.4102, "step": 11832 }, { "epoch": 0.15, "learning_rate": 0.0001912980027780974, "loss": 2.3836, "step": 11840 }, { "epoch": 0.15, "learning_rate": 0.0001912857715914067, "loss": 2.3724, "step": 11848 }, { "epoch": 0.15, "learning_rate": 0.00019127353225221368, "loss": 2.403, "step": 11856 }, { "epoch": 0.15, "learning_rate": 0.00019126128476174592, "loss": 2.3876, "step": 11864 }, { "epoch": 0.15, "learning_rate": 0.00019124902912123174, "loss": 2.3896, "step": 11872 }, { "epoch": 0.15, "learning_rate": 0.00019123676533190032, "loss": 2.3701, "step": 11880 }, { "epoch": 0.15, "learning_rate": 0.00019122449339498162, "loss": 2.3926, "step": 11888 }, { "epoch": 0.15, "learning_rate": 0.00019121221331170653, "loss": 2.363, "step": 11896 }, { "epoch": 0.15, "learning_rate": 0.00019119992508330659, "loss": 2.3798, "step": 11904 }, { "epoch": 0.15, "learning_rate": 0.00019118762871101426, "loss": 2.4065, "step": 11912 }, { "epoch": 0.15, "learning_rate": 0.00019117532419606284, "loss": 2.4163, "step": 11920 }, { "epoch": 0.15, "learning_rate": 0.00019116301153968633, "loss": 2.3922, "step": 11928 }, { "epoch": 0.15, "learning_rate": 0.0001911506907431197, "loss": 2.4043, "step": 11936 }, { "epoch": 0.15, "learning_rate": 0.00019113836180759857, "loss": 2.4003, "step": 11944 }, { "epoch": 0.15, "learning_rate": 0.0001911260247343595, "loss": 2.3917, "step": 11952 }, { "epoch": 0.15, "learning_rate": 0.00019111367952463987, "loss": 2.395, "step": 11960 }, { "epoch": 0.15, "learning_rate": 0.0001911013261796778, "loss": 2.4013, "step": 11968 }, { "epoch": 0.15, "learning_rate": 0.00019108896470071226, "loss": 2.3944, "step": 11976 }, { "epoch": 0.15, "learning_rate": 0.00019107659508898299, "loss": 2.4123, "step": 11984 }, { "epoch": 0.15, "learning_rate": 0.00019106421734573067, "loss": 2.412, "step": 11992 }, { "epoch": 0.15, "learning_rate": 0.00019105183147219673, "loss": 2.4034, "step": 12000 }, { "epoch": 0.15, "learning_rate": 0.00019103943746962327, "loss": 2.3749, "step": 12008 }, { "epoch": 0.15, "learning_rate": 0.00019102703533925347, "loss": 2.3911, "step": 12016 }, { "epoch": 0.15, "learning_rate": 0.00019101462508233115, "loss": 2.3802, "step": 12024 }, { "epoch": 0.15, "learning_rate": 0.000191002206700101, "loss": 2.386, "step": 12032 }, { "epoch": 0.15, "learning_rate": 0.00019098978019380848, "loss": 2.3939, "step": 12040 }, { "epoch": 0.15, "learning_rate": 0.00019097734556469995, "loss": 2.3811, "step": 12048 }, { "epoch": 0.15, "learning_rate": 0.00019096490281402247, "loss": 2.3995, "step": 12056 }, { "epoch": 0.15, "learning_rate": 0.00019095245194302403, "loss": 2.4037, "step": 12064 }, { "epoch": 0.15, "learning_rate": 0.00019093999295295336, "loss": 2.3969, "step": 12072 }, { "epoch": 0.15, "learning_rate": 0.00019092752584506, "loss": 2.391, "step": 12080 }, { "epoch": 0.15, "learning_rate": 0.0001909150506205944, "loss": 2.3966, "step": 12088 }, { "epoch": 0.15, "learning_rate": 0.00019090256728080768, "loss": 2.4, "step": 12096 }, { "epoch": 0.15, "learning_rate": 0.0001908900758269519, "loss": 2.3954, "step": 12104 }, { "epoch": 0.15, "learning_rate": 0.00019087757626027986, "loss": 2.3941, "step": 12112 }, { "epoch": 0.15, "learning_rate": 0.0001908650685820452, "loss": 2.38, "step": 12120 }, { "epoch": 0.15, "learning_rate": 0.00019085255279350236, "loss": 2.3901, "step": 12128 }, { "epoch": 0.15, "learning_rate": 0.00019084002889590662, "loss": 2.3823, "step": 12136 }, { "epoch": 0.15, "learning_rate": 0.00019082749689051405, "loss": 2.3969, "step": 12144 }, { "epoch": 0.15, "learning_rate": 0.00019081495677858153, "loss": 2.3891, "step": 12152 }, { "epoch": 0.15, "learning_rate": 0.00019080240856136677, "loss": 2.3703, "step": 12160 }, { "epoch": 0.15, "learning_rate": 0.00019078985224012826, "loss": 2.3761, "step": 12168 }, { "epoch": 0.15, "learning_rate": 0.0001907772878161254, "loss": 2.3934, "step": 12176 }, { "epoch": 0.15, "learning_rate": 0.00019076471529061825, "loss": 2.3807, "step": 12184 }, { "epoch": 0.15, "learning_rate": 0.00019075213466486778, "loss": 2.3938, "step": 12192 }, { "epoch": 0.15, "learning_rate": 0.00019073954594013578, "loss": 2.3723, "step": 12200 }, { "epoch": 0.15, "learning_rate": 0.0001907269491176848, "loss": 2.4025, "step": 12208 }, { "epoch": 0.15, "learning_rate": 0.0001907143441987783, "loss": 2.3859, "step": 12216 }, { "epoch": 0.15, "learning_rate": 0.0001907017311846804, "loss": 2.3931, "step": 12224 }, { "epoch": 0.15, "learning_rate": 0.00019068911007665614, "loss": 2.4062, "step": 12232 }, { "epoch": 0.15, "learning_rate": 0.00019067648087597137, "loss": 2.3993, "step": 12240 }, { "epoch": 0.15, "learning_rate": 0.00019066384358389267, "loss": 2.369, "step": 12248 }, { "epoch": 0.15, "learning_rate": 0.00019065119820168753, "loss": 2.3985, "step": 12256 }, { "epoch": 0.15, "learning_rate": 0.00019063854473062424, "loss": 2.3921, "step": 12264 }, { "epoch": 0.15, "learning_rate": 0.00019062588317197182, "loss": 2.4, "step": 12272 }, { "epoch": 0.15, "learning_rate": 0.00019061321352700016, "loss": 2.3945, "step": 12280 }, { "epoch": 0.15, "learning_rate": 0.00019060053579697997, "loss": 2.4166, "step": 12288 }, { "epoch": 0.15, "learning_rate": 0.00019058784998318273, "loss": 2.3814, "step": 12296 }, { "epoch": 0.15, "learning_rate": 0.0001905751560868808, "loss": 2.3883, "step": 12304 }, { "epoch": 0.15, "learning_rate": 0.00019056245410934726, "loss": 2.3767, "step": 12312 }, { "epoch": 0.15, "learning_rate": 0.00019054974405185605, "loss": 2.3678, "step": 12320 }, { "epoch": 0.15, "learning_rate": 0.00019053702591568196, "loss": 2.4128, "step": 12328 }, { "epoch": 0.15, "learning_rate": 0.00019052429970210053, "loss": 2.3963, "step": 12336 }, { "epoch": 0.15, "learning_rate": 0.0001905115654123881, "loss": 2.3806, "step": 12344 }, { "epoch": 0.15, "learning_rate": 0.00019049882304782186, "loss": 2.3816, "step": 12352 }, { "epoch": 0.15, "learning_rate": 0.0001904860726096798, "loss": 2.3895, "step": 12360 }, { "epoch": 0.15, "learning_rate": 0.0001904733140992407, "loss": 2.4059, "step": 12368 }, { "epoch": 0.15, "learning_rate": 0.00019046054751778422, "loss": 2.3718, "step": 12376 }, { "epoch": 0.15, "learning_rate": 0.00019044777286659071, "loss": 2.3923, "step": 12384 }, { "epoch": 0.15, "learning_rate": 0.00019043499014694142, "loss": 2.3875, "step": 12392 }, { "epoch": 0.15, "learning_rate": 0.0001904221993601184, "loss": 2.3916, "step": 12400 }, { "epoch": 0.16, "learning_rate": 0.00019040940050740448, "loss": 2.3685, "step": 12408 }, { "epoch": 0.16, "learning_rate": 0.00019039659359008332, "loss": 2.3798, "step": 12416 }, { "epoch": 0.16, "learning_rate": 0.00019038377860943937, "loss": 2.3655, "step": 12424 }, { "epoch": 0.16, "learning_rate": 0.0001903709555667579, "loss": 2.3882, "step": 12432 }, { "epoch": 0.16, "learning_rate": 0.000190358124463325, "loss": 2.3843, "step": 12440 }, { "epoch": 0.16, "learning_rate": 0.00019034528530042754, "loss": 2.3885, "step": 12448 }, { "epoch": 0.16, "learning_rate": 0.00019033243807935326, "loss": 2.3696, "step": 12456 }, { "epoch": 0.16, "learning_rate": 0.0001903195828013906, "loss": 2.4002, "step": 12464 }, { "epoch": 0.16, "learning_rate": 0.0001903067194678289, "loss": 2.3927, "step": 12472 }, { "epoch": 0.16, "learning_rate": 0.0001902938480799583, "loss": 2.3861, "step": 12480 }, { "epoch": 0.16, "learning_rate": 0.00019028096863906967, "loss": 2.3856, "step": 12488 }, { "epoch": 0.16, "learning_rate": 0.00019026808114645482, "loss": 2.4021, "step": 12496 }, { "epoch": 0.16, "learning_rate": 0.00019025518560340625, "loss": 2.3694, "step": 12504 }, { "epoch": 0.16, "learning_rate": 0.0001902422820112173, "loss": 2.3779, "step": 12512 }, { "epoch": 0.16, "learning_rate": 0.00019022937037118217, "loss": 2.399, "step": 12520 }, { "epoch": 0.16, "learning_rate": 0.00019021645068459576, "loss": 2.3916, "step": 12528 }, { "epoch": 0.16, "learning_rate": 0.00019020352295275386, "loss": 2.3976, "step": 12536 }, { "epoch": 0.16, "learning_rate": 0.0001901905871769531, "loss": 2.3913, "step": 12544 }, { "epoch": 0.16, "learning_rate": 0.00019017764335849084, "loss": 2.38, "step": 12552 }, { "epoch": 0.16, "learning_rate": 0.00019016469149866526, "loss": 2.3972, "step": 12560 }, { "epoch": 0.16, "learning_rate": 0.00019015173159877535, "loss": 2.3888, "step": 12568 }, { "epoch": 0.16, "learning_rate": 0.00019013876366012094, "loss": 2.3768, "step": 12576 }, { "epoch": 0.16, "learning_rate": 0.0001901257876840026, "loss": 2.4004, "step": 12584 }, { "epoch": 0.16, "learning_rate": 0.0001901128036717218, "loss": 2.3968, "step": 12592 }, { "epoch": 0.16, "learning_rate": 0.00019009981162458072, "loss": 2.3689, "step": 12600 }, { "epoch": 0.16, "learning_rate": 0.0001900868115438824, "loss": 2.3897, "step": 12608 }, { "epoch": 0.16, "learning_rate": 0.0001900738034309307, "loss": 2.3933, "step": 12616 }, { "epoch": 0.16, "learning_rate": 0.0001900607872870302, "loss": 2.3817, "step": 12624 }, { "epoch": 0.16, "learning_rate": 0.00019004776311348646, "loss": 2.367, "step": 12632 }, { "epoch": 0.16, "learning_rate": 0.00019003473091160558, "loss": 2.3762, "step": 12640 }, { "epoch": 0.16, "learning_rate": 0.0001900216906826947, "loss": 2.3858, "step": 12648 }, { "epoch": 0.16, "learning_rate": 0.00019000864242806168, "loss": 2.3918, "step": 12656 }, { "epoch": 0.16, "learning_rate": 0.00018999558614901522, "loss": 2.3958, "step": 12664 }, { "epoch": 0.16, "learning_rate": 0.0001899825218468647, "loss": 2.3904, "step": 12672 }, { "epoch": 0.16, "learning_rate": 0.00018996944952292047, "loss": 2.3878, "step": 12680 }, { "epoch": 0.16, "learning_rate": 0.00018995636917849357, "loss": 2.3922, "step": 12688 }, { "epoch": 0.16, "learning_rate": 0.0001899432808148959, "loss": 2.4021, "step": 12696 }, { "epoch": 0.16, "learning_rate": 0.00018993018443344017, "loss": 2.3734, "step": 12704 }, { "epoch": 0.16, "learning_rate": 0.00018991708003543981, "loss": 2.3859, "step": 12712 }, { "epoch": 0.16, "learning_rate": 0.00018990396762220922, "loss": 2.3797, "step": 12720 }, { "epoch": 0.16, "learning_rate": 0.00018989084719506338, "loss": 2.3693, "step": 12728 }, { "epoch": 0.16, "learning_rate": 0.00018987771875531826, "loss": 2.3839, "step": 12736 }, { "epoch": 0.16, "learning_rate": 0.00018986458230429057, "loss": 2.3936, "step": 12744 }, { "epoch": 0.16, "learning_rate": 0.00018985143784329785, "loss": 2.3934, "step": 12752 }, { "epoch": 0.16, "learning_rate": 0.00018983828537365833, "loss": 2.3911, "step": 12760 }, { "epoch": 0.16, "learning_rate": 0.00018982512489669118, "loss": 2.4017, "step": 12768 }, { "epoch": 0.16, "learning_rate": 0.0001898119564137163, "loss": 2.3777, "step": 12776 }, { "epoch": 0.16, "learning_rate": 0.0001897987799260545, "loss": 2.3865, "step": 12784 }, { "epoch": 0.16, "learning_rate": 0.0001897855954350272, "loss": 2.3924, "step": 12792 }, { "epoch": 0.16, "learning_rate": 0.00018977240294195676, "loss": 2.3995, "step": 12800 }, { "epoch": 0.16, "learning_rate": 0.00018975920244816631, "loss": 2.382, "step": 12808 }, { "epoch": 0.16, "learning_rate": 0.0001897459939549798, "loss": 2.3879, "step": 12816 }, { "epoch": 0.16, "learning_rate": 0.00018973277746372197, "loss": 2.3702, "step": 12824 }, { "epoch": 0.16, "learning_rate": 0.00018971955297571836, "loss": 2.3681, "step": 12832 }, { "epoch": 0.16, "learning_rate": 0.00018970632049229532, "loss": 2.3798, "step": 12840 }, { "epoch": 0.16, "learning_rate": 0.00018969308001477993, "loss": 2.3962, "step": 12848 }, { "epoch": 0.16, "learning_rate": 0.0001896798315445002, "loss": 2.3764, "step": 12856 }, { "epoch": 0.16, "learning_rate": 0.00018966657508278487, "loss": 2.3801, "step": 12864 }, { "epoch": 0.16, "learning_rate": 0.00018965331063096346, "loss": 2.3941, "step": 12872 }, { "epoch": 0.16, "learning_rate": 0.00018964003819036632, "loss": 2.3866, "step": 12880 }, { "epoch": 0.16, "learning_rate": 0.00018962675776232463, "loss": 2.3785, "step": 12888 }, { "epoch": 0.16, "learning_rate": 0.00018961346934817034, "loss": 2.3872, "step": 12896 }, { "epoch": 0.16, "learning_rate": 0.0001896001729492362, "loss": 2.3892, "step": 12904 }, { "epoch": 0.16, "learning_rate": 0.0001895868685668557, "loss": 2.3971, "step": 12912 }, { "epoch": 0.16, "learning_rate": 0.0001895735562023633, "loss": 2.3821, "step": 12920 }, { "epoch": 0.16, "learning_rate": 0.00018956023585709405, "loss": 2.4062, "step": 12928 }, { "epoch": 0.16, "learning_rate": 0.000189546907532384, "loss": 2.3856, "step": 12936 }, { "epoch": 0.16, "learning_rate": 0.00018953357122956986, "loss": 2.3817, "step": 12944 }, { "epoch": 0.16, "learning_rate": 0.0001895202269499892, "loss": 2.3994, "step": 12952 }, { "epoch": 0.16, "learning_rate": 0.0001895068746949803, "loss": 2.3995, "step": 12960 }, { "epoch": 0.16, "learning_rate": 0.0001894935144658824, "loss": 2.3993, "step": 12968 }, { "epoch": 0.16, "learning_rate": 0.00018948014626403548, "loss": 2.3906, "step": 12976 }, { "epoch": 0.16, "learning_rate": 0.0001894667700907802, "loss": 2.3824, "step": 12984 }, { "epoch": 0.16, "learning_rate": 0.0001894533859474582, "loss": 2.3823, "step": 12992 }, { "epoch": 0.16, "learning_rate": 0.00018943999383541177, "loss": 2.4173, "step": 13000 }, { "epoch": 0.16, "learning_rate": 0.0001894265937559841, "loss": 2.3766, "step": 13008 }, { "epoch": 0.16, "learning_rate": 0.00018941318571051916, "loss": 2.4138, "step": 13016 }, { "epoch": 0.16, "learning_rate": 0.00018939976970036164, "loss": 2.378, "step": 13024 }, { "epoch": 0.16, "learning_rate": 0.00018938634572685713, "loss": 2.4069, "step": 13032 }, { "epoch": 0.16, "learning_rate": 0.00018937291379135196, "loss": 2.3895, "step": 13040 }, { "epoch": 0.16, "learning_rate": 0.0001893594738951933, "loss": 2.3897, "step": 13048 }, { "epoch": 0.16, "learning_rate": 0.0001893460260397291, "loss": 2.3892, "step": 13056 }, { "epoch": 0.16, "learning_rate": 0.00018933257022630805, "loss": 2.3839, "step": 13064 }, { "epoch": 0.16, "learning_rate": 0.00018931910645627977, "loss": 2.3975, "step": 13072 }, { "epoch": 0.16, "learning_rate": 0.00018930563473099453, "loss": 2.3792, "step": 13080 }, { "epoch": 0.16, "learning_rate": 0.00018929215505180349, "loss": 2.4199, "step": 13088 }, { "epoch": 0.16, "learning_rate": 0.00018927866742005862, "loss": 2.3644, "step": 13096 }, { "epoch": 0.16, "learning_rate": 0.0001892651718371126, "loss": 2.385, "step": 13104 }, { "epoch": 0.16, "learning_rate": 0.000189251668304319, "loss": 2.4003, "step": 13112 }, { "epoch": 0.16, "learning_rate": 0.00018923815682303215, "loss": 2.388, "step": 13120 }, { "epoch": 0.16, "learning_rate": 0.00018922463739460714, "loss": 2.3739, "step": 13128 }, { "epoch": 0.16, "learning_rate": 0.00018921111002039994, "loss": 2.3848, "step": 13136 }, { "epoch": 0.16, "learning_rate": 0.0001891975747017672, "loss": 2.3927, "step": 13144 }, { "epoch": 0.16, "learning_rate": 0.0001891840314400665, "loss": 2.3622, "step": 13152 }, { "epoch": 0.16, "learning_rate": 0.00018917048023665609, "loss": 2.3949, "step": 13160 }, { "epoch": 0.16, "learning_rate": 0.00018915692109289516, "loss": 2.4043, "step": 13168 }, { "epoch": 0.16, "learning_rate": 0.00018914335401014353, "loss": 2.3888, "step": 13176 }, { "epoch": 0.16, "learning_rate": 0.00018912977898976198, "loss": 2.3936, "step": 13184 }, { "epoch": 0.16, "learning_rate": 0.00018911619603311197, "loss": 2.3957, "step": 13192 }, { "epoch": 0.17, "learning_rate": 0.00018910260514155578, "loss": 2.39, "step": 13200 }, { "epoch": 0.17, "learning_rate": 0.00018908900631645653, "loss": 2.3914, "step": 13208 }, { "epoch": 0.17, "learning_rate": 0.0001890753995591781, "loss": 2.3779, "step": 13216 }, { "epoch": 0.17, "learning_rate": 0.00018906178487108511, "loss": 2.3808, "step": 13224 }, { "epoch": 0.17, "learning_rate": 0.0001890481622535431, "loss": 2.3676, "step": 13232 }, { "epoch": 0.17, "learning_rate": 0.00018903453170791837, "loss": 2.3929, "step": 13240 }, { "epoch": 0.17, "learning_rate": 0.00018902089323557793, "loss": 2.4018, "step": 13248 }, { "epoch": 0.17, "learning_rate": 0.0001890072468378896, "loss": 2.3905, "step": 13256 }, { "epoch": 0.17, "learning_rate": 0.00018899359251622216, "loss": 2.3968, "step": 13264 }, { "epoch": 0.17, "learning_rate": 0.000188979930271945, "loss": 2.4097, "step": 13272 }, { "epoch": 0.17, "learning_rate": 0.0001889662601064283, "loss": 2.371, "step": 13280 }, { "epoch": 0.17, "learning_rate": 0.00018895258202104317, "loss": 2.406, "step": 13288 }, { "epoch": 0.17, "learning_rate": 0.00018893889601716147, "loss": 2.3976, "step": 13296 }, { "epoch": 0.17, "learning_rate": 0.00018892520209615575, "loss": 2.3921, "step": 13304 }, { "epoch": 0.17, "learning_rate": 0.00018891150025939952, "loss": 2.3893, "step": 13312 }, { "epoch": 0.17, "learning_rate": 0.00018889779050826694, "loss": 2.3908, "step": 13320 }, { "epoch": 0.17, "learning_rate": 0.00018888407284413302, "loss": 2.3696, "step": 13328 }, { "epoch": 0.17, "learning_rate": 0.0001888703472683736, "loss": 2.3959, "step": 13336 }, { "epoch": 0.17, "learning_rate": 0.00018885661378236518, "loss": 2.3824, "step": 13344 }, { "epoch": 0.17, "learning_rate": 0.00018884287238748527, "loss": 2.4161, "step": 13352 }, { "epoch": 0.17, "learning_rate": 0.000188829123085112, "loss": 2.4001, "step": 13360 }, { "epoch": 0.17, "learning_rate": 0.00018881536587662438, "loss": 2.3359, "step": 13368 }, { "epoch": 0.17, "learning_rate": 0.00018880160076340213, "loss": 2.3931, "step": 13376 }, { "epoch": 0.17, "learning_rate": 0.00018878782774682586, "loss": 2.3966, "step": 13384 }, { "epoch": 0.17, "learning_rate": 0.00018877404682827688, "loss": 2.4013, "step": 13392 }, { "epoch": 0.17, "learning_rate": 0.00018876025800913736, "loss": 2.3765, "step": 13400 }, { "epoch": 0.17, "learning_rate": 0.00018874646129079029, "loss": 2.3761, "step": 13408 }, { "epoch": 0.17, "learning_rate": 0.0001887326566746193, "loss": 2.4023, "step": 13416 }, { "epoch": 0.17, "learning_rate": 0.000188718844162009, "loss": 2.3807, "step": 13424 }, { "epoch": 0.17, "learning_rate": 0.00018870502375434463, "loss": 2.3871, "step": 13432 }, { "epoch": 0.17, "learning_rate": 0.0001886911954530124, "loss": 2.396, "step": 13440 }, { "epoch": 0.17, "learning_rate": 0.00018867735925939914, "loss": 2.3976, "step": 13448 }, { "epoch": 0.17, "learning_rate": 0.00018866351517489254, "loss": 2.3788, "step": 13456 }, { "epoch": 0.17, "learning_rate": 0.0001886496632008811, "loss": 2.3786, "step": 13464 }, { "epoch": 0.17, "learning_rate": 0.00018863580333875412, "loss": 2.3943, "step": 13472 }, { "epoch": 0.17, "learning_rate": 0.00018862193558990165, "loss": 2.3964, "step": 13480 }, { "epoch": 0.17, "learning_rate": 0.00018860805995571446, "loss": 2.4179, "step": 13488 }, { "epoch": 0.17, "learning_rate": 0.00018859417643758437, "loss": 2.37, "step": 13496 }, { "epoch": 0.17, "learning_rate": 0.00018858028503690365, "loss": 2.3721, "step": 13504 }, { "epoch": 0.17, "learning_rate": 0.00018856638575506565, "loss": 2.3841, "step": 13512 }, { "epoch": 0.17, "learning_rate": 0.0001885524785934643, "loss": 2.4048, "step": 13520 }, { "epoch": 0.17, "learning_rate": 0.00018853856355349448, "loss": 2.3759, "step": 13528 }, { "epoch": 0.17, "learning_rate": 0.00018852464063655176, "loss": 2.3836, "step": 13536 }, { "epoch": 0.17, "learning_rate": 0.0001885107098440325, "loss": 2.3986, "step": 13544 }, { "epoch": 0.17, "learning_rate": 0.00018849677117733392, "loss": 2.3937, "step": 13552 }, { "epoch": 0.17, "learning_rate": 0.000188482824637854, "loss": 2.3821, "step": 13560 }, { "epoch": 0.17, "learning_rate": 0.00018846887022699147, "loss": 2.3863, "step": 13568 }, { "epoch": 0.17, "learning_rate": 0.00018845490794614587, "loss": 2.3616, "step": 13576 }, { "epoch": 0.17, "learning_rate": 0.0001884409377967176, "loss": 2.378, "step": 13584 }, { "epoch": 0.17, "learning_rate": 0.00018842695978010766, "loss": 2.4052, "step": 13592 }, { "epoch": 0.17, "learning_rate": 0.0001884129738977181, "loss": 2.4167, "step": 13600 }, { "epoch": 0.17, "learning_rate": 0.00018839898015095155, "loss": 2.3874, "step": 13608 }, { "epoch": 0.17, "learning_rate": 0.00018838497854121154, "loss": 2.3905, "step": 13616 }, { "epoch": 0.17, "learning_rate": 0.00018837096906990233, "loss": 2.4128, "step": 13624 }, { "epoch": 0.17, "learning_rate": 0.000188356951738429, "loss": 2.4001, "step": 13632 }, { "epoch": 0.17, "learning_rate": 0.00018834292654819739, "loss": 2.4033, "step": 13640 }, { "epoch": 0.17, "learning_rate": 0.00018832889350061418, "loss": 2.4065, "step": 13648 }, { "epoch": 0.17, "learning_rate": 0.00018831485259708676, "loss": 2.3896, "step": 13656 }, { "epoch": 0.17, "learning_rate": 0.0001883008038390234, "loss": 2.38, "step": 13664 }, { "epoch": 0.17, "learning_rate": 0.0001882867472278331, "loss": 2.3854, "step": 13672 }, { "epoch": 0.17, "learning_rate": 0.0001882726827649256, "loss": 2.4, "step": 13680 }, { "epoch": 0.17, "learning_rate": 0.00018825861045171163, "loss": 2.4093, "step": 13688 }, { "epoch": 0.17, "learning_rate": 0.0001882445302896024, "loss": 2.3892, "step": 13696 }, { "epoch": 0.17, "learning_rate": 0.00018823044228001017, "loss": 2.4066, "step": 13704 }, { "epoch": 0.17, "learning_rate": 0.00018821634642434784, "loss": 2.3769, "step": 13712 }, { "epoch": 0.17, "learning_rate": 0.0001882022427240292, "loss": 2.387, "step": 13720 }, { "epoch": 0.17, "learning_rate": 0.00018818813118046866, "loss": 2.4067, "step": 13728 }, { "epoch": 0.17, "learning_rate": 0.00018817401179508167, "loss": 2.3972, "step": 13736 }, { "epoch": 0.17, "learning_rate": 0.00018815988456928422, "loss": 2.3924, "step": 13744 }, { "epoch": 0.17, "learning_rate": 0.00018814574950449324, "loss": 2.3757, "step": 13752 }, { "epoch": 0.17, "learning_rate": 0.00018813160660212638, "loss": 2.397, "step": 13760 }, { "epoch": 0.17, "learning_rate": 0.0001881174558636021, "loss": 2.3774, "step": 13768 }, { "epoch": 0.17, "learning_rate": 0.0001881032972903396, "loss": 2.4052, "step": 13776 }, { "epoch": 0.17, "learning_rate": 0.000188089130883759, "loss": 2.3775, "step": 13784 }, { "epoch": 0.17, "learning_rate": 0.000188074956645281, "loss": 2.3826, "step": 13792 }, { "epoch": 0.17, "learning_rate": 0.00018806077457632724, "loss": 2.4138, "step": 13800 }, { "epoch": 0.17, "learning_rate": 0.00018804658467832012, "loss": 2.4132, "step": 13808 }, { "epoch": 0.17, "learning_rate": 0.00018803238695268282, "loss": 2.3717, "step": 13816 }, { "epoch": 0.17, "learning_rate": 0.00018801818140083926, "loss": 2.3741, "step": 13824 }, { "epoch": 0.17, "learning_rate": 0.00018800396802421413, "loss": 2.3942, "step": 13832 }, { "epoch": 0.17, "learning_rate": 0.00018798974682423305, "loss": 2.4012, "step": 13840 }, { "epoch": 0.17, "learning_rate": 0.0001879755178023223, "loss": 2.4156, "step": 13848 }, { "epoch": 0.17, "learning_rate": 0.0001879612809599089, "loss": 2.4123, "step": 13856 }, { "epoch": 0.17, "learning_rate": 0.00018794703629842075, "loss": 2.3687, "step": 13864 }, { "epoch": 0.17, "learning_rate": 0.0001879327838192866, "loss": 2.3836, "step": 13872 }, { "epoch": 0.17, "learning_rate": 0.0001879185235239358, "loss": 2.3718, "step": 13880 }, { "epoch": 0.17, "learning_rate": 0.00018790425541379859, "loss": 2.3938, "step": 13888 }, { "epoch": 0.17, "learning_rate": 0.00018788997949030598, "loss": 2.4019, "step": 13896 }, { "epoch": 0.17, "learning_rate": 0.00018787569575488982, "loss": 2.3951, "step": 13904 }, { "epoch": 0.17, "learning_rate": 0.0001878614042089826, "loss": 2.3883, "step": 13912 }, { "epoch": 0.17, "learning_rate": 0.00018784710485401774, "loss": 2.3959, "step": 13920 }, { "epoch": 0.17, "learning_rate": 0.00018783279769142938, "loss": 2.3872, "step": 13928 }, { "epoch": 0.17, "learning_rate": 0.00018781848272265243, "loss": 2.4153, "step": 13936 }, { "epoch": 0.17, "learning_rate": 0.0001878041599491226, "loss": 2.3818, "step": 13944 }, { "epoch": 0.17, "learning_rate": 0.0001877898293722764, "loss": 2.3965, "step": 13952 }, { "epoch": 0.17, "learning_rate": 0.00018777549099355107, "loss": 2.3899, "step": 13960 }, { "epoch": 0.17, "learning_rate": 0.00018776114481438473, "loss": 2.3974, "step": 13968 }, { "epoch": 0.17, "learning_rate": 0.00018774679083621615, "loss": 2.3958, "step": 13976 }, { "epoch": 0.17, "learning_rate": 0.000187732429060485, "loss": 2.3926, "step": 13984 }, { "epoch": 0.17, "learning_rate": 0.00018771805948863168, "loss": 2.3912, "step": 13992 }, { "epoch": 0.17, "learning_rate": 0.00018770368212209736, "loss": 2.3841, "step": 14000 }, { "epoch": 0.18, "learning_rate": 0.00018768929696232403, "loss": 2.3808, "step": 14008 }, { "epoch": 0.18, "learning_rate": 0.00018767490401075442, "loss": 2.3908, "step": 14016 }, { "epoch": 0.18, "learning_rate": 0.00018766050326883207, "loss": 2.4197, "step": 14024 }, { "epoch": 0.18, "learning_rate": 0.00018764609473800127, "loss": 2.3863, "step": 14032 }, { "epoch": 0.18, "learning_rate": 0.00018763167841970714, "loss": 2.3756, "step": 14040 }, { "epoch": 0.18, "learning_rate": 0.00018761725431539557, "loss": 2.4033, "step": 14048 }, { "epoch": 0.18, "learning_rate": 0.00018760282242651316, "loss": 2.3984, "step": 14056 }, { "epoch": 0.18, "learning_rate": 0.00018758838275450743, "loss": 2.4083, "step": 14064 }, { "epoch": 0.18, "learning_rate": 0.00018757393530082652, "loss": 2.4045, "step": 14072 }, { "epoch": 0.18, "learning_rate": 0.00018755948006691947, "loss": 2.3828, "step": 14080 }, { "epoch": 0.18, "learning_rate": 0.00018754501705423607, "loss": 2.3839, "step": 14088 }, { "epoch": 0.18, "learning_rate": 0.0001875305462642268, "loss": 2.3793, "step": 14096 }, { "epoch": 0.18, "learning_rate": 0.0001875160676983431, "loss": 2.3988, "step": 14104 }, { "epoch": 0.18, "learning_rate": 0.00018750158135803698, "loss": 2.3787, "step": 14112 }, { "epoch": 0.18, "learning_rate": 0.00018748708724476148, "loss": 2.3917, "step": 14120 }, { "epoch": 0.18, "learning_rate": 0.00018747258535997013, "loss": 2.3884, "step": 14128 }, { "epoch": 0.18, "learning_rate": 0.00018745807570511746, "loss": 2.3827, "step": 14136 }, { "epoch": 0.18, "learning_rate": 0.0001874435582816587, "loss": 2.3758, "step": 14144 }, { "epoch": 0.18, "learning_rate": 0.0001874290330910499, "loss": 2.3704, "step": 14152 }, { "epoch": 0.18, "learning_rate": 0.0001874145001347478, "loss": 2.3942, "step": 14160 }, { "epoch": 0.18, "learning_rate": 0.00018739995941420996, "loss": 2.3794, "step": 14168 }, { "epoch": 0.18, "learning_rate": 0.00018738541093089476, "loss": 2.403, "step": 14176 }, { "epoch": 0.18, "learning_rate": 0.0001873708546862614, "loss": 2.3708, "step": 14184 }, { "epoch": 0.18, "learning_rate": 0.00018735629068176966, "loss": 2.4114, "step": 14192 }, { "epoch": 0.18, "learning_rate": 0.00018734171891888034, "loss": 2.4045, "step": 14200 }, { "epoch": 0.18, "learning_rate": 0.0001873271393990548, "loss": 2.3996, "step": 14208 }, { "epoch": 0.18, "learning_rate": 0.00018731255212375538, "loss": 2.3881, "step": 14216 }, { "epoch": 0.18, "learning_rate": 0.00018729795709444502, "loss": 2.3621, "step": 14224 }, { "epoch": 0.18, "learning_rate": 0.0001872833543125876, "loss": 2.3904, "step": 14232 }, { "epoch": 0.18, "learning_rate": 0.00018726874377964764, "loss": 2.3896, "step": 14240 }, { "epoch": 0.18, "learning_rate": 0.00018725412549709048, "loss": 2.4033, "step": 14248 }, { "epoch": 0.18, "learning_rate": 0.0001872394994663823, "loss": 2.375, "step": 14256 }, { "epoch": 0.18, "learning_rate": 0.00018722486568899002, "loss": 2.3939, "step": 14264 }, { "epoch": 0.18, "learning_rate": 0.00018721022416638125, "loss": 2.3886, "step": 14272 }, { "epoch": 0.18, "learning_rate": 0.00018719557490002448, "loss": 2.3943, "step": 14280 }, { "epoch": 0.18, "learning_rate": 0.00018718091789138902, "loss": 2.3837, "step": 14288 }, { "epoch": 0.18, "learning_rate": 0.00018716625314194475, "loss": 2.3855, "step": 14296 }, { "epoch": 0.18, "learning_rate": 0.0001871515806531626, "loss": 2.3876, "step": 14304 }, { "epoch": 0.18, "learning_rate": 0.00018713690042651405, "loss": 2.385, "step": 14312 }, { "epoch": 0.18, "learning_rate": 0.00018712221246347147, "loss": 2.3824, "step": 14320 }, { "epoch": 0.18, "learning_rate": 0.00018710751676550799, "loss": 2.3919, "step": 14328 }, { "epoch": 0.18, "learning_rate": 0.0001870928133340975, "loss": 2.4023, "step": 14336 }, { "epoch": 0.18, "learning_rate": 0.00018707810217071465, "loss": 2.4068, "step": 14344 }, { "epoch": 0.18, "learning_rate": 0.0001870633832768349, "loss": 2.3966, "step": 14352 }, { "epoch": 0.18, "learning_rate": 0.00018704865665393448, "loss": 2.3727, "step": 14360 }, { "epoch": 0.18, "learning_rate": 0.00018703392230349036, "loss": 2.3779, "step": 14368 }, { "epoch": 0.18, "learning_rate": 0.00018701918022698036, "loss": 2.3807, "step": 14376 }, { "epoch": 0.18, "learning_rate": 0.00018700443042588298, "loss": 2.3991, "step": 14384 }, { "epoch": 0.18, "learning_rate": 0.00018698967290167758, "loss": 2.3679, "step": 14392 }, { "epoch": 0.18, "learning_rate": 0.0001869749076558442, "loss": 2.3803, "step": 14400 }, { "epoch": 0.18, "learning_rate": 0.00018696013468986374, "loss": 2.3814, "step": 14408 }, { "epoch": 0.18, "learning_rate": 0.0001869453540052179, "loss": 2.394, "step": 14416 }, { "epoch": 0.18, "learning_rate": 0.00018693056560338902, "loss": 2.3942, "step": 14424 }, { "epoch": 0.18, "learning_rate": 0.00018691576948586035, "loss": 2.3973, "step": 14432 }, { "epoch": 0.18, "learning_rate": 0.0001869009656541158, "loss": 2.3868, "step": 14440 }, { "epoch": 0.18, "learning_rate": 0.00018688615410964013, "loss": 2.3882, "step": 14448 }, { "epoch": 0.18, "learning_rate": 0.00018687133485391886, "loss": 2.3745, "step": 14456 }, { "epoch": 0.18, "learning_rate": 0.0001868565078884383, "loss": 2.406, "step": 14464 }, { "epoch": 0.18, "learning_rate": 0.0001868416732146855, "loss": 2.3812, "step": 14472 }, { "epoch": 0.18, "learning_rate": 0.00018682683083414827, "loss": 2.3764, "step": 14480 }, { "epoch": 0.18, "learning_rate": 0.00018681198074831524, "loss": 2.3861, "step": 14488 }, { "epoch": 0.18, "learning_rate": 0.0001867971229586758, "loss": 2.3799, "step": 14496 }, { "epoch": 0.18, "learning_rate": 0.00018678225746672006, "loss": 2.3895, "step": 14504 }, { "epoch": 0.18, "learning_rate": 0.00018676738427393899, "loss": 2.3791, "step": 14512 }, { "epoch": 0.18, "learning_rate": 0.00018675250338182425, "loss": 2.3839, "step": 14520 }, { "epoch": 0.18, "learning_rate": 0.00018673761479186832, "loss": 2.3915, "step": 14528 }, { "epoch": 0.18, "learning_rate": 0.00018672271850556443, "loss": 2.4077, "step": 14536 }, { "epoch": 0.18, "learning_rate": 0.00018670781452440665, "loss": 2.3912, "step": 14544 }, { "epoch": 0.18, "learning_rate": 0.0001866929028498897, "loss": 2.3687, "step": 14552 }, { "epoch": 0.18, "learning_rate": 0.00018667798348350915, "loss": 2.3852, "step": 14560 }, { "epoch": 0.18, "learning_rate": 0.00018666305642676135, "loss": 2.407, "step": 14568 }, { "epoch": 0.18, "learning_rate": 0.00018664812168114338, "loss": 2.3976, "step": 14576 }, { "epoch": 0.18, "learning_rate": 0.00018663317924815315, "loss": 2.3687, "step": 14584 }, { "epoch": 0.18, "learning_rate": 0.0001866182291292892, "loss": 2.383, "step": 14592 }, { "epoch": 0.18, "learning_rate": 0.0001866032713260511, "loss": 2.3783, "step": 14600 }, { "epoch": 0.18, "learning_rate": 0.0001865883058399389, "loss": 2.3977, "step": 14608 }, { "epoch": 0.18, "learning_rate": 0.0001865733326724536, "loss": 2.3764, "step": 14616 }, { "epoch": 0.18, "learning_rate": 0.00018655835182509689, "loss": 2.382, "step": 14624 }, { "epoch": 0.18, "learning_rate": 0.00018654336329937133, "loss": 2.3731, "step": 14632 }, { "epoch": 0.18, "learning_rate": 0.00018652836709678015, "loss": 2.3948, "step": 14640 }, { "epoch": 0.18, "learning_rate": 0.00018651336321882735, "loss": 2.3867, "step": 14648 }, { "epoch": 0.18, "learning_rate": 0.0001864983516670178, "loss": 2.3776, "step": 14656 }, { "epoch": 0.18, "learning_rate": 0.00018648333244285705, "loss": 2.3812, "step": 14664 }, { "epoch": 0.18, "learning_rate": 0.00018646830554785142, "loss": 2.3921, "step": 14672 }, { "epoch": 0.18, "learning_rate": 0.00018645327098350804, "loss": 2.3925, "step": 14680 }, { "epoch": 0.18, "learning_rate": 0.00018643822875133478, "loss": 2.3856, "step": 14688 }, { "epoch": 0.18, "learning_rate": 0.0001864231788528403, "loss": 2.3744, "step": 14696 }, { "epoch": 0.18, "learning_rate": 0.00018640812128953402, "loss": 2.3906, "step": 14704 }, { "epoch": 0.18, "learning_rate": 0.00018639305606292614, "loss": 2.3844, "step": 14712 }, { "epoch": 0.18, "learning_rate": 0.0001863779831745276, "loss": 2.3816, "step": 14720 }, { "epoch": 0.18, "learning_rate": 0.00018636290262585012, "loss": 2.3888, "step": 14728 }, { "epoch": 0.18, "learning_rate": 0.0001863478144184062, "loss": 2.3826, "step": 14736 }, { "epoch": 0.18, "learning_rate": 0.00018633271855370912, "loss": 2.3709, "step": 14744 }, { "epoch": 0.18, "learning_rate": 0.0001863176150332729, "loss": 2.3821, "step": 14752 }, { "epoch": 0.18, "learning_rate": 0.0001863025038586123, "loss": 2.3784, "step": 14760 }, { "epoch": 0.18, "learning_rate": 0.00018628738503124293, "loss": 2.368, "step": 14768 }, { "epoch": 0.18, "learning_rate": 0.0001862722585526811, "loss": 2.3957, "step": 14776 }, { "epoch": 0.18, "learning_rate": 0.00018625712442444395, "loss": 2.3962, "step": 14784 }, { "epoch": 0.18, "learning_rate": 0.0001862419826480493, "loss": 2.3944, "step": 14792 }, { "epoch": 0.18, "learning_rate": 0.0001862268332250158, "loss": 2.3789, "step": 14800 }, { "epoch": 0.19, "learning_rate": 0.00018621167615686282, "loss": 2.364, "step": 14808 }, { "epoch": 0.19, "learning_rate": 0.00018619651144511062, "loss": 2.3748, "step": 14816 }, { "epoch": 0.19, "learning_rate": 0.00018618133909128006, "loss": 2.3811, "step": 14824 }, { "epoch": 0.19, "learning_rate": 0.00018616615909689284, "loss": 2.3867, "step": 14832 }, { "epoch": 0.19, "learning_rate": 0.00018615097146347146, "loss": 2.3912, "step": 14840 }, { "epoch": 0.19, "learning_rate": 0.0001861357761925391, "loss": 2.3685, "step": 14848 }, { "epoch": 0.19, "learning_rate": 0.00018612057328561984, "loss": 2.4118, "step": 14856 }, { "epoch": 0.19, "learning_rate": 0.00018610536274423837, "loss": 2.3947, "step": 14864 }, { "epoch": 0.19, "learning_rate": 0.0001860901445699203, "loss": 2.3841, "step": 14872 }, { "epoch": 0.19, "learning_rate": 0.00018607491876419184, "loss": 2.3682, "step": 14880 }, { "epoch": 0.19, "learning_rate": 0.0001860596853285801, "loss": 2.386, "step": 14888 }, { "epoch": 0.19, "learning_rate": 0.0001860444442646129, "loss": 2.3677, "step": 14896 }, { "epoch": 0.19, "learning_rate": 0.00018602919557381885, "loss": 2.3731, "step": 14904 }, { "epoch": 0.19, "learning_rate": 0.00018601393925772724, "loss": 2.3954, "step": 14912 }, { "epoch": 0.19, "learning_rate": 0.00018599867531786827, "loss": 2.3908, "step": 14920 }, { "epoch": 0.19, "learning_rate": 0.00018598340375577282, "loss": 2.3884, "step": 14928 }, { "epoch": 0.19, "learning_rate": 0.00018596812457297247, "loss": 2.3663, "step": 14936 }, { "epoch": 0.19, "learning_rate": 0.00018595283777099973, "loss": 2.3876, "step": 14944 }, { "epoch": 0.19, "learning_rate": 0.00018593754335138773, "loss": 2.3872, "step": 14952 }, { "epoch": 0.19, "learning_rate": 0.0001859222413156704, "loss": 2.4022, "step": 14960 }, { "epoch": 0.19, "learning_rate": 0.0001859069316653825, "loss": 2.3823, "step": 14968 }, { "epoch": 0.19, "learning_rate": 0.00018589161440205943, "loss": 2.3755, "step": 14976 }, { "epoch": 0.19, "learning_rate": 0.00018587628952723744, "loss": 2.3939, "step": 14984 }, { "epoch": 0.19, "learning_rate": 0.0001858609570424536, "loss": 2.3759, "step": 14992 }, { "epoch": 0.19, "learning_rate": 0.0001858456169492456, "loss": 2.3976, "step": 15000 }, { "epoch": 0.19, "learning_rate": 0.00018583026924915197, "loss": 2.3807, "step": 15008 }, { "epoch": 0.19, "learning_rate": 0.00018581491394371202, "loss": 2.3762, "step": 15016 }, { "epoch": 0.19, "learning_rate": 0.0001857995510344658, "loss": 2.3826, "step": 15024 }, { "epoch": 0.19, "learning_rate": 0.0001857841805229541, "loss": 2.407, "step": 15032 }, { "epoch": 0.19, "learning_rate": 0.00018576880241071852, "loss": 2.3696, "step": 15040 }, { "epoch": 0.19, "learning_rate": 0.0001857534166993014, "loss": 2.3774, "step": 15048 }, { "epoch": 0.19, "learning_rate": 0.00018573802339024584, "loss": 2.368, "step": 15056 }, { "epoch": 0.19, "learning_rate": 0.00018572262248509568, "loss": 2.3773, "step": 15064 }, { "epoch": 0.19, "learning_rate": 0.00018570721398539553, "loss": 2.3665, "step": 15072 }, { "epoch": 0.19, "learning_rate": 0.0001856917978926908, "loss": 2.3755, "step": 15080 }, { "epoch": 0.19, "learning_rate": 0.00018567637420852762, "loss": 2.41, "step": 15088 }, { "epoch": 0.19, "learning_rate": 0.00018566094293445297, "loss": 2.4029, "step": 15096 }, { "epoch": 0.19, "learning_rate": 0.00018564550407201442, "loss": 2.3754, "step": 15104 }, { "epoch": 0.19, "learning_rate": 0.00018563005762276045, "loss": 2.3788, "step": 15112 }, { "epoch": 0.19, "learning_rate": 0.00018561460358824022, "loss": 2.3852, "step": 15120 }, { "epoch": 0.19, "learning_rate": 0.00018559914197000376, "loss": 2.3849, "step": 15128 }, { "epoch": 0.19, "learning_rate": 0.00018558367276960168, "loss": 2.4004, "step": 15136 }, { "epoch": 0.19, "learning_rate": 0.00018556819598858555, "loss": 2.3679, "step": 15144 }, { "epoch": 0.19, "learning_rate": 0.00018555271162850752, "loss": 2.3715, "step": 15152 }, { "epoch": 0.19, "learning_rate": 0.00018553721969092062, "loss": 2.3428, "step": 15160 }, { "epoch": 0.19, "learning_rate": 0.0001855217201773786, "loss": 2.3644, "step": 15168 }, { "epoch": 0.19, "learning_rate": 0.00018550621308943598, "loss": 2.4002, "step": 15176 }, { "epoch": 0.19, "learning_rate": 0.00018549069842864805, "loss": 2.3878, "step": 15184 }, { "epoch": 0.19, "learning_rate": 0.0001854751761965708, "loss": 2.3729, "step": 15192 }, { "epoch": 0.19, "learning_rate": 0.00018545964639476105, "loss": 2.3946, "step": 15200 }, { "epoch": 0.19, "learning_rate": 0.00018544410902477634, "loss": 2.3885, "step": 15208 }, { "epoch": 0.19, "learning_rate": 0.000185428564088175, "loss": 2.383, "step": 15216 }, { "epoch": 0.19, "learning_rate": 0.00018541301158651608, "loss": 2.3915, "step": 15224 }, { "epoch": 0.19, "learning_rate": 0.0001853974515213594, "loss": 2.3809, "step": 15232 }, { "epoch": 0.19, "learning_rate": 0.00018538188389426554, "loss": 2.3801, "step": 15240 }, { "epoch": 0.19, "learning_rate": 0.0001853663087067959, "loss": 2.3656, "step": 15248 }, { "epoch": 0.19, "learning_rate": 0.00018535072596051255, "loss": 2.3878, "step": 15256 }, { "epoch": 0.19, "learning_rate": 0.0001853351356569783, "loss": 2.4025, "step": 15264 }, { "epoch": 0.19, "learning_rate": 0.00018531953779775683, "loss": 2.3873, "step": 15272 }, { "epoch": 0.19, "learning_rate": 0.00018530393238441251, "loss": 2.3677, "step": 15280 }, { "epoch": 0.19, "learning_rate": 0.00018528831941851047, "loss": 2.3819, "step": 15288 }, { "epoch": 0.19, "learning_rate": 0.00018527269890161662, "loss": 2.3778, "step": 15296 }, { "epoch": 0.19, "learning_rate": 0.00018525707083529757, "loss": 2.3795, "step": 15304 }, { "epoch": 0.19, "learning_rate": 0.00018524143522112075, "loss": 2.381, "step": 15312 }, { "epoch": 0.19, "learning_rate": 0.0001852257920606543, "loss": 2.3834, "step": 15320 }, { "epoch": 0.19, "learning_rate": 0.0001852101413554672, "loss": 2.3797, "step": 15328 }, { "epoch": 0.19, "learning_rate": 0.00018519448310712905, "loss": 2.3915, "step": 15336 }, { "epoch": 0.19, "learning_rate": 0.00018517881731721034, "loss": 2.3796, "step": 15344 }, { "epoch": 0.19, "learning_rate": 0.00018516314398728224, "loss": 2.3695, "step": 15352 }, { "epoch": 0.19, "learning_rate": 0.00018514746311891668, "loss": 2.3761, "step": 15360 }, { "epoch": 0.19, "learning_rate": 0.00018513177471368638, "loss": 2.398, "step": 15368 }, { "epoch": 0.19, "learning_rate": 0.0001851160787731648, "loss": 2.3725, "step": 15376 }, { "epoch": 0.19, "learning_rate": 0.00018510037529892613, "loss": 2.3802, "step": 15384 }, { "epoch": 0.19, "learning_rate": 0.00018508466429254542, "loss": 2.3788, "step": 15392 }, { "epoch": 0.19, "learning_rate": 0.00018506894575559825, "loss": 2.3796, "step": 15400 }, { "epoch": 0.19, "learning_rate": 0.00018505321968966128, "loss": 2.3792, "step": 15408 }, { "epoch": 0.19, "learning_rate": 0.0001850374860963116, "loss": 2.3848, "step": 15416 }, { "epoch": 0.19, "learning_rate": 0.00018502174497712724, "loss": 2.3791, "step": 15424 }, { "epoch": 0.19, "learning_rate": 0.00018500599633368693, "loss": 2.3767, "step": 15432 }, { "epoch": 0.19, "learning_rate": 0.00018499024016757027, "loss": 2.3721, "step": 15440 }, { "epoch": 0.19, "learning_rate": 0.00018497447648035736, "loss": 2.3896, "step": 15448 }, { "epoch": 0.19, "learning_rate": 0.00018495870527362936, "loss": 2.4002, "step": 15456 }, { "epoch": 0.19, "learning_rate": 0.00018494292654896793, "loss": 2.3835, "step": 15464 }, { "epoch": 0.19, "learning_rate": 0.0001849271403079556, "loss": 2.3942, "step": 15472 }, { "epoch": 0.19, "learning_rate": 0.0001849113465521757, "loss": 2.4037, "step": 15480 }, { "epoch": 0.19, "learning_rate": 0.00018489554528321216, "loss": 2.3669, "step": 15488 }, { "epoch": 0.19, "learning_rate": 0.00018487973650264985, "loss": 2.4058, "step": 15496 }, { "epoch": 0.19, "learning_rate": 0.00018486392021207422, "loss": 2.3779, "step": 15504 }, { "epoch": 0.19, "learning_rate": 0.00018484809641307163, "loss": 2.3867, "step": 15512 }, { "epoch": 0.19, "learning_rate": 0.0001848322651072291, "loss": 2.3882, "step": 15520 }, { "epoch": 0.19, "learning_rate": 0.00018481642629613435, "loss": 2.3751, "step": 15528 }, { "epoch": 0.19, "learning_rate": 0.000184800579981376, "loss": 2.3875, "step": 15536 }, { "epoch": 0.19, "learning_rate": 0.00018478472616454333, "loss": 2.3588, "step": 15544 }, { "epoch": 0.19, "learning_rate": 0.00018476886484722636, "loss": 2.3829, "step": 15552 }, { "epoch": 0.19, "learning_rate": 0.00018475299603101593, "loss": 2.3881, "step": 15560 }, { "epoch": 0.19, "learning_rate": 0.00018473711971750355, "loss": 2.4098, "step": 15568 }, { "epoch": 0.19, "learning_rate": 0.0001847212359082816, "loss": 2.3789, "step": 15576 }, { "epoch": 0.19, "learning_rate": 0.000184705344604943, "loss": 2.3727, "step": 15584 }, { "epoch": 0.19, "learning_rate": 0.00018468944580908171, "loss": 2.3799, "step": 15592 }, { "epoch": 0.2, "learning_rate": 0.0001846735395222922, "loss": 2.3727, "step": 15600 }, { "epoch": 0.2, "learning_rate": 0.0001846576257461698, "loss": 2.3747, "step": 15608 }, { "epoch": 0.2, "learning_rate": 0.00018464170448231055, "loss": 2.3403, "step": 15616 }, { "epoch": 0.2, "learning_rate": 0.0001846257757323113, "loss": 2.383, "step": 15624 }, { "epoch": 0.2, "learning_rate": 0.00018460983949776958, "loss": 2.3975, "step": 15632 }, { "epoch": 0.2, "learning_rate": 0.00018459389578028373, "loss": 2.3895, "step": 15640 }, { "epoch": 0.2, "learning_rate": 0.00018457794458145283, "loss": 2.3725, "step": 15648 }, { "epoch": 0.2, "learning_rate": 0.00018456198590287664, "loss": 2.3772, "step": 15656 }, { "epoch": 0.2, "learning_rate": 0.00018454601974615575, "loss": 2.3967, "step": 15664 }, { "epoch": 0.2, "learning_rate": 0.0001845300461128915, "loss": 2.3875, "step": 15672 }, { "epoch": 0.2, "learning_rate": 0.00018451406500468595, "loss": 2.3831, "step": 15680 }, { "epoch": 0.2, "learning_rate": 0.00018449807642314188, "loss": 2.3767, "step": 15688 }, { "epoch": 0.2, "learning_rate": 0.00018448208036986286, "loss": 2.3836, "step": 15696 }, { "epoch": 0.2, "learning_rate": 0.00018446607684645324, "loss": 2.3718, "step": 15704 }, { "epoch": 0.2, "learning_rate": 0.00018445006585451806, "loss": 2.3818, "step": 15712 }, { "epoch": 0.2, "learning_rate": 0.0001844340473956631, "loss": 2.394, "step": 15720 }, { "epoch": 0.2, "learning_rate": 0.000184418021471495, "loss": 2.3908, "step": 15728 }, { "epoch": 0.2, "learning_rate": 0.00018440198808362097, "loss": 2.3763, "step": 15736 }, { "epoch": 0.2, "learning_rate": 0.00018438594723364917, "loss": 2.3853, "step": 15744 }, { "epoch": 0.2, "learning_rate": 0.0001843698989231883, "loss": 2.3745, "step": 15752 }, { "epoch": 0.2, "learning_rate": 0.00018435384315384804, "loss": 2.3803, "step": 15760 }, { "epoch": 0.2, "learning_rate": 0.0001843377799272386, "loss": 2.3671, "step": 15768 }, { "epoch": 0.2, "learning_rate": 0.00018432170924497106, "loss": 2.3745, "step": 15776 }, { "epoch": 0.2, "learning_rate": 0.0001843056311086572, "loss": 2.3819, "step": 15784 }, { "epoch": 0.2, "learning_rate": 0.00018428954551990957, "loss": 2.3738, "step": 15792 }, { "epoch": 0.2, "learning_rate": 0.00018427345248034146, "loss": 2.3784, "step": 15800 }, { "epoch": 0.2, "learning_rate": 0.00018425735199156698, "loss": 2.391, "step": 15808 }, { "epoch": 0.2, "learning_rate": 0.0001842412440552008, "loss": 2.3849, "step": 15816 }, { "epoch": 0.2, "learning_rate": 0.00018422512867285855, "loss": 2.3773, "step": 15824 }, { "epoch": 0.2, "learning_rate": 0.00018420900584615647, "loss": 2.3881, "step": 15832 }, { "epoch": 0.2, "learning_rate": 0.0001841928755767116, "loss": 2.392, "step": 15840 }, { "epoch": 0.2, "learning_rate": 0.0001841767378661417, "loss": 2.393, "step": 15848 }, { "epoch": 0.2, "learning_rate": 0.00018416059271606527, "loss": 2.3561, "step": 15856 }, { "epoch": 0.2, "learning_rate": 0.00018414444012810163, "loss": 2.3845, "step": 15864 }, { "epoch": 0.2, "learning_rate": 0.00018412828010387077, "loss": 2.3522, "step": 15872 }, { "epoch": 0.2, "learning_rate": 0.00018411211264499346, "loss": 2.3897, "step": 15880 }, { "epoch": 0.2, "learning_rate": 0.0001840959377530912, "loss": 2.3724, "step": 15888 }, { "epoch": 0.2, "learning_rate": 0.00018407975542978624, "loss": 2.4019, "step": 15896 }, { "epoch": 0.2, "learning_rate": 0.00018406356567670154, "loss": 2.3802, "step": 15904 }, { "epoch": 0.2, "learning_rate": 0.0001840473684954609, "loss": 2.3986, "step": 15912 }, { "epoch": 0.2, "learning_rate": 0.00018403116388768877, "loss": 2.3751, "step": 15920 }, { "epoch": 0.2, "learning_rate": 0.00018401495185501037, "loss": 2.3934, "step": 15928 }, { "epoch": 0.2, "learning_rate": 0.0001839987323990517, "loss": 2.3873, "step": 15936 }, { "epoch": 0.2, "learning_rate": 0.00018398250552143945, "loss": 2.3821, "step": 15944 }, { "epoch": 0.2, "learning_rate": 0.00018396627122380116, "loss": 2.3839, "step": 15952 }, { "epoch": 0.2, "learning_rate": 0.0001839500295077649, "loss": 2.3619, "step": 15960 }, { "epoch": 0.2, "learning_rate": 0.00018393378037495975, "loss": 2.3718, "step": 15968 }, { "epoch": 0.2, "learning_rate": 0.00018391752382701537, "loss": 2.3725, "step": 15976 }, { "epoch": 0.2, "learning_rate": 0.0001839012598655622, "loss": 2.3796, "step": 15984 }, { "epoch": 0.2, "learning_rate": 0.00018388498849223136, "loss": 2.3857, "step": 15992 }, { "epoch": 0.2, "learning_rate": 0.0001838687097086549, "loss": 2.3749, "step": 16000 }, { "epoch": 0.2, "learning_rate": 0.00018385242351646533, "loss": 2.3798, "step": 16008 }, { "epoch": 0.2, "learning_rate": 0.00018383612991729623, "loss": 2.3691, "step": 16016 }, { "epoch": 0.2, "learning_rate": 0.00018381982891278164, "loss": 2.3696, "step": 16024 }, { "epoch": 0.2, "learning_rate": 0.00018380352050455652, "loss": 2.3618, "step": 16032 }, { "epoch": 0.2, "learning_rate": 0.00018378720469425648, "loss": 2.3924, "step": 16040 }, { "epoch": 0.2, "learning_rate": 0.0001837708814835179, "loss": 2.3676, "step": 16048 }, { "epoch": 0.2, "learning_rate": 0.00018375455087397792, "loss": 2.3559, "step": 16056 }, { "epoch": 0.2, "learning_rate": 0.0001837382128672744, "loss": 2.384, "step": 16064 }, { "epoch": 0.2, "learning_rate": 0.00018372186746504597, "loss": 2.3827, "step": 16072 }, { "epoch": 0.2, "learning_rate": 0.00018370551466893195, "loss": 2.3815, "step": 16080 }, { "epoch": 0.2, "learning_rate": 0.00018368915448057244, "loss": 2.3795, "step": 16088 }, { "epoch": 0.2, "learning_rate": 0.0001836727869016083, "loss": 2.3768, "step": 16096 }, { "epoch": 0.2, "learning_rate": 0.0001836564119336811, "loss": 2.3837, "step": 16104 }, { "epoch": 0.2, "learning_rate": 0.00018364002957843312, "loss": 2.3766, "step": 16112 }, { "epoch": 0.2, "learning_rate": 0.00018362363983750744, "loss": 2.3723, "step": 16120 }, { "epoch": 0.2, "learning_rate": 0.00018360724271254783, "loss": 2.3822, "step": 16128 }, { "epoch": 0.2, "learning_rate": 0.0001835908382051989, "loss": 2.3849, "step": 16136 }, { "epoch": 0.2, "learning_rate": 0.00018357442631710587, "loss": 2.3693, "step": 16144 }, { "epoch": 0.2, "learning_rate": 0.00018355800704991478, "loss": 2.387, "step": 16152 }, { "epoch": 0.2, "learning_rate": 0.0001835415804052724, "loss": 2.3625, "step": 16160 }, { "epoch": 0.2, "learning_rate": 0.00018352514638482622, "loss": 2.3718, "step": 16168 }, { "epoch": 0.2, "learning_rate": 0.00018350870499022443, "loss": 2.3725, "step": 16176 }, { "epoch": 0.2, "learning_rate": 0.0001834922562231161, "loss": 2.3827, "step": 16184 }, { "epoch": 0.2, "learning_rate": 0.00018347580008515086, "loss": 2.3833, "step": 16192 }, { "epoch": 0.2, "learning_rate": 0.00018345933657797924, "loss": 2.3621, "step": 16200 }, { "epoch": 0.2, "learning_rate": 0.00018344286570325238, "loss": 2.3729, "step": 16208 }, { "epoch": 0.2, "learning_rate": 0.00018342638746262225, "loss": 2.3715, "step": 16216 }, { "epoch": 0.2, "learning_rate": 0.00018340990185774153, "loss": 2.367, "step": 16224 }, { "epoch": 0.2, "learning_rate": 0.0001833934088902636, "loss": 2.3655, "step": 16232 }, { "epoch": 0.2, "learning_rate": 0.0001833769085618426, "loss": 2.367, "step": 16240 }, { "epoch": 0.2, "learning_rate": 0.0001833604008741335, "loss": 2.3616, "step": 16248 }, { "epoch": 0.2, "learning_rate": 0.00018334388582879187, "loss": 2.3609, "step": 16256 }, { "epoch": 0.2, "learning_rate": 0.00018332736342747404, "loss": 2.3617, "step": 16264 }, { "epoch": 0.2, "learning_rate": 0.00018331083367183722, "loss": 2.3633, "step": 16272 }, { "epoch": 0.2, "learning_rate": 0.0001832942965635391, "loss": 2.3614, "step": 16280 }, { "epoch": 0.2, "learning_rate": 0.0001832777521042384, "loss": 2.3657, "step": 16288 }, { "epoch": 0.2, "learning_rate": 0.00018326120029559437, "loss": 2.3888, "step": 16296 }, { "epoch": 0.2, "learning_rate": 0.00018324464113926708, "loss": 2.3891, "step": 16304 }, { "epoch": 0.2, "learning_rate": 0.0001832280746369173, "loss": 2.3752, "step": 16312 }, { "epoch": 0.2, "learning_rate": 0.00018321150079020655, "loss": 2.3781, "step": 16320 }, { "epoch": 0.2, "learning_rate": 0.00018319491960079714, "loss": 2.3646, "step": 16328 }, { "epoch": 0.2, "learning_rate": 0.000183178331070352, "loss": 2.3754, "step": 16336 }, { "epoch": 0.2, "learning_rate": 0.00018316173520053494, "loss": 2.3706, "step": 16344 }, { "epoch": 0.2, "learning_rate": 0.0001831451319930104, "loss": 2.3674, "step": 16352 }, { "epoch": 0.2, "learning_rate": 0.00018312852144944356, "loss": 2.3666, "step": 16360 }, { "epoch": 0.2, "learning_rate": 0.0001831119035715004, "loss": 2.3627, "step": 16368 }, { "epoch": 0.2, "learning_rate": 0.0001830952783608476, "loss": 2.3828, "step": 16376 }, { "epoch": 0.2, "learning_rate": 0.00018307864581915253, "loss": 2.3803, "step": 16384 }, { "epoch": 0.2, "learning_rate": 0.0001830620059480834, "loss": 2.3684, "step": 16392 }, { "epoch": 0.2, "learning_rate": 0.00018304535874930905, "loss": 2.3804, "step": 16400 }, { "epoch": 0.21, "learning_rate": 0.00018302870422449912, "loss": 2.3843, "step": 16408 }, { "epoch": 0.21, "learning_rate": 0.00018301204237532396, "loss": 2.3739, "step": 16416 }, { "epoch": 0.21, "learning_rate": 0.00018299537320345466, "loss": 2.398, "step": 16424 }, { "epoch": 0.21, "learning_rate": 0.00018297869671056303, "loss": 2.3739, "step": 16432 }, { "epoch": 0.21, "learning_rate": 0.00018296201289832163, "loss": 2.3642, "step": 16440 }, { "epoch": 0.21, "learning_rate": 0.0001829453217684038, "loss": 2.3537, "step": 16448 }, { "epoch": 0.21, "learning_rate": 0.0001829286233224835, "loss": 2.3654, "step": 16456 }, { "epoch": 0.21, "learning_rate": 0.0001829119175622355, "loss": 2.3842, "step": 16464 }, { "epoch": 0.21, "learning_rate": 0.00018289520448933538, "loss": 2.372, "step": 16472 }, { "epoch": 0.21, "learning_rate": 0.00018287848410545923, "loss": 2.385, "step": 16480 }, { "epoch": 0.21, "learning_rate": 0.0001828617564122841, "loss": 2.4041, "step": 16488 }, { "epoch": 0.21, "learning_rate": 0.00018284502141148766, "loss": 2.3851, "step": 16496 }, { "epoch": 0.21, "learning_rate": 0.00018282827910474832, "loss": 2.3728, "step": 16504 }, { "epoch": 0.21, "learning_rate": 0.00018281152949374527, "loss": 2.3858, "step": 16512 }, { "epoch": 0.21, "learning_rate": 0.0001827947725801584, "loss": 2.3586, "step": 16520 }, { "epoch": 0.21, "learning_rate": 0.0001827780083656683, "loss": 2.3819, "step": 16528 }, { "epoch": 0.21, "learning_rate": 0.00018276123685195632, "loss": 2.3959, "step": 16536 }, { "epoch": 0.21, "learning_rate": 0.00018274445804070458, "loss": 2.3927, "step": 16544 }, { "epoch": 0.21, "learning_rate": 0.00018272767193359594, "loss": 2.3581, "step": 16552 }, { "epoch": 0.21, "learning_rate": 0.00018271087853231386, "loss": 2.3796, "step": 16560 }, { "epoch": 0.21, "learning_rate": 0.00018269407783854267, "loss": 2.3681, "step": 16568 }, { "epoch": 0.21, "learning_rate": 0.0001826772698539674, "loss": 2.3837, "step": 16576 }, { "epoch": 0.21, "learning_rate": 0.00018266045458027375, "loss": 2.3791, "step": 16584 }, { "epoch": 0.21, "learning_rate": 0.00018264363201914822, "loss": 2.3623, "step": 16592 }, { "epoch": 0.21, "learning_rate": 0.00018262680217227806, "loss": 2.3698, "step": 16600 }, { "epoch": 0.21, "learning_rate": 0.00018260996504135114, "loss": 2.3674, "step": 16608 }, { "epoch": 0.21, "learning_rate": 0.00018259312062805615, "loss": 2.3728, "step": 16616 }, { "epoch": 0.21, "learning_rate": 0.0001825762689340825, "loss": 2.3722, "step": 16624 }, { "epoch": 0.21, "learning_rate": 0.0001825594099611203, "loss": 2.3819, "step": 16632 }, { "epoch": 0.21, "learning_rate": 0.0001825425437108605, "loss": 2.3665, "step": 16640 }, { "epoch": 0.21, "learning_rate": 0.00018252567018499453, "loss": 2.3813, "step": 16648 }, { "epoch": 0.21, "learning_rate": 0.0001825087893852148, "loss": 2.361, "step": 16656 }, { "epoch": 0.21, "learning_rate": 0.0001824919013132144, "loss": 2.3604, "step": 16664 }, { "epoch": 0.21, "learning_rate": 0.00018247500597068703, "loss": 2.3613, "step": 16672 }, { "epoch": 0.21, "learning_rate": 0.00018245810335932723, "loss": 2.3853, "step": 16680 }, { "epoch": 0.21, "learning_rate": 0.00018244119348083024, "loss": 2.3532, "step": 16688 }, { "epoch": 0.21, "learning_rate": 0.00018242427633689202, "loss": 2.3426, "step": 16696 }, { "epoch": 0.21, "learning_rate": 0.00018240735192920923, "loss": 2.3635, "step": 16704 }, { "epoch": 0.21, "learning_rate": 0.00018239042025947936, "loss": 2.3453, "step": 16712 }, { "epoch": 0.21, "learning_rate": 0.00018237348132940054, "loss": 2.3877, "step": 16720 }, { "epoch": 0.21, "learning_rate": 0.0001823565351406716, "loss": 2.3681, "step": 16728 }, { "epoch": 0.21, "learning_rate": 0.0001823395816949922, "loss": 2.371, "step": 16736 }, { "epoch": 0.21, "learning_rate": 0.0001823226209940626, "loss": 2.3846, "step": 16744 }, { "epoch": 0.21, "learning_rate": 0.000182305653039584, "loss": 2.3735, "step": 16752 }, { "epoch": 0.21, "learning_rate": 0.00018228867783325804, "loss": 2.3651, "step": 16760 }, { "epoch": 0.21, "learning_rate": 0.00018227169537678734, "loss": 2.3645, "step": 16768 }, { "epoch": 0.21, "learning_rate": 0.0001822547056718751, "loss": 2.3768, "step": 16776 }, { "epoch": 0.21, "learning_rate": 0.0001822377087202253, "loss": 2.3717, "step": 16784 }, { "epoch": 0.21, "learning_rate": 0.00018222070452354264, "loss": 2.3736, "step": 16792 }, { "epoch": 0.21, "learning_rate": 0.00018220369308353255, "loss": 2.3747, "step": 16800 }, { "epoch": 0.21, "learning_rate": 0.00018218667440190114, "loss": 2.3809, "step": 16808 }, { "epoch": 0.21, "learning_rate": 0.00018216964848035533, "loss": 2.368, "step": 16816 }, { "epoch": 0.21, "learning_rate": 0.00018215261532060273, "loss": 2.3652, "step": 16824 }, { "epoch": 0.21, "learning_rate": 0.00018213557492435166, "loss": 2.3799, "step": 16832 }, { "epoch": 0.21, "learning_rate": 0.00018211852729331114, "loss": 2.3597, "step": 16840 }, { "epoch": 0.21, "learning_rate": 0.00018210147242919098, "loss": 2.378, "step": 16848 }, { "epoch": 0.21, "learning_rate": 0.00018208441033370167, "loss": 2.365, "step": 16856 }, { "epoch": 0.21, "learning_rate": 0.00018206734100855451, "loss": 2.3826, "step": 16864 }, { "epoch": 0.21, "learning_rate": 0.00018205026445546136, "loss": 2.3758, "step": 16872 }, { "epoch": 0.21, "learning_rate": 0.00018203318067613495, "loss": 2.3749, "step": 16880 }, { "epoch": 0.21, "learning_rate": 0.0001820160896722887, "loss": 2.3445, "step": 16888 }, { "epoch": 0.21, "learning_rate": 0.0001819989914456367, "loss": 2.3681, "step": 16896 }, { "epoch": 0.21, "learning_rate": 0.00018198188599789384, "loss": 2.3507, "step": 16904 }, { "epoch": 0.21, "learning_rate": 0.00018196477333077567, "loss": 2.3637, "step": 16912 }, { "epoch": 0.21, "learning_rate": 0.00018194765344599852, "loss": 2.3783, "step": 16920 }, { "epoch": 0.21, "learning_rate": 0.00018193052634527942, "loss": 2.3551, "step": 16928 }, { "epoch": 0.21, "learning_rate": 0.0001819133920303361, "loss": 2.3797, "step": 16936 }, { "epoch": 0.21, "learning_rate": 0.00018189625050288706, "loss": 2.3521, "step": 16944 }, { "epoch": 0.21, "learning_rate": 0.00018187910176465147, "loss": 2.3728, "step": 16952 }, { "epoch": 0.21, "learning_rate": 0.00018186194581734923, "loss": 2.3808, "step": 16960 }, { "epoch": 0.21, "learning_rate": 0.00018184478266270108, "loss": 2.365, "step": 16968 }, { "epoch": 0.21, "learning_rate": 0.00018182761230242826, "loss": 2.353, "step": 16976 }, { "epoch": 0.21, "learning_rate": 0.00018181043473825293, "loss": 2.3863, "step": 16984 }, { "epoch": 0.21, "learning_rate": 0.00018179324997189792, "loss": 2.3677, "step": 16992 }, { "epoch": 0.21, "learning_rate": 0.00018177605800508674, "loss": 2.3686, "step": 17000 }, { "epoch": 0.21, "learning_rate": 0.00018175885883954364, "loss": 2.3806, "step": 17008 }, { "epoch": 0.21, "learning_rate": 0.00018174165247699362, "loss": 2.3568, "step": 17016 }, { "epoch": 0.21, "learning_rate": 0.00018172443891916235, "loss": 2.3748, "step": 17024 }, { "epoch": 0.21, "learning_rate": 0.00018170721816777627, "loss": 2.3875, "step": 17032 }, { "epoch": 0.21, "learning_rate": 0.00018168999022456255, "loss": 2.3762, "step": 17040 }, { "epoch": 0.21, "learning_rate": 0.000181672755091249, "loss": 2.3734, "step": 17048 }, { "epoch": 0.21, "learning_rate": 0.00018165551276956424, "loss": 2.3755, "step": 17056 }, { "epoch": 0.21, "learning_rate": 0.0001816382632612376, "loss": 2.3695, "step": 17064 }, { "epoch": 0.21, "learning_rate": 0.00018162100656799905, "loss": 2.3571, "step": 17072 }, { "epoch": 0.21, "learning_rate": 0.00018160374269157937, "loss": 2.361, "step": 17080 }, { "epoch": 0.21, "learning_rate": 0.00018158647163371002, "loss": 2.3679, "step": 17088 }, { "epoch": 0.21, "learning_rate": 0.0001815691933961232, "loss": 2.3724, "step": 17096 }, { "epoch": 0.21, "learning_rate": 0.00018155190798055184, "loss": 2.3684, "step": 17104 }, { "epoch": 0.21, "learning_rate": 0.00018153461538872952, "loss": 2.3734, "step": 17112 }, { "epoch": 0.21, "learning_rate": 0.0001815173156223906, "loss": 2.3753, "step": 17120 }, { "epoch": 0.21, "learning_rate": 0.00018150000868327022, "loss": 2.364, "step": 17128 }, { "epoch": 0.21, "learning_rate": 0.00018148269457310406, "loss": 2.3685, "step": 17136 }, { "epoch": 0.21, "learning_rate": 0.00018146537329362869, "loss": 2.356, "step": 17144 }, { "epoch": 0.21, "learning_rate": 0.00018144804484658132, "loss": 2.3608, "step": 17152 }, { "epoch": 0.21, "learning_rate": 0.0001814307092336999, "loss": 2.3891, "step": 17160 }, { "epoch": 0.21, "learning_rate": 0.0001814133664567231, "loss": 2.3568, "step": 17168 }, { "epoch": 0.21, "learning_rate": 0.0001813960165173903, "loss": 2.3695, "step": 17176 }, { "epoch": 0.21, "learning_rate": 0.0001813786594174416, "loss": 2.3599, "step": 17184 }, { "epoch": 0.21, "learning_rate": 0.0001813612951586178, "loss": 2.3915, "step": 17192 }, { "epoch": 0.21, "learning_rate": 0.00018134392374266045, "loss": 2.366, "step": 17200 }, { "epoch": 0.22, "learning_rate": 0.0001813265451713118, "loss": 2.3685, "step": 17208 }, { "epoch": 0.22, "learning_rate": 0.00018130915944631487, "loss": 2.3817, "step": 17216 }, { "epoch": 0.22, "learning_rate": 0.00018129176656941323, "loss": 2.373, "step": 17224 }, { "epoch": 0.22, "learning_rate": 0.00018127436654235142, "loss": 2.3615, "step": 17232 }, { "epoch": 0.22, "learning_rate": 0.0001812569593668745, "loss": 2.3635, "step": 17240 }, { "epoch": 0.22, "learning_rate": 0.00018123954504472832, "loss": 2.3688, "step": 17248 }, { "epoch": 0.22, "learning_rate": 0.00018122212357765945, "loss": 2.3604, "step": 17256 }, { "epoch": 0.22, "learning_rate": 0.0001812046949674151, "loss": 2.3814, "step": 17264 }, { "epoch": 0.22, "learning_rate": 0.00018118725921574338, "loss": 2.3913, "step": 17272 }, { "epoch": 0.22, "learning_rate": 0.00018116981632439286, "loss": 2.3708, "step": 17280 }, { "epoch": 0.22, "learning_rate": 0.0001811523662951131, "loss": 2.3765, "step": 17288 }, { "epoch": 0.22, "learning_rate": 0.00018113490912965416, "loss": 2.3437, "step": 17296 }, { "epoch": 0.22, "learning_rate": 0.00018111744482976686, "loss": 2.3527, "step": 17304 }, { "epoch": 0.22, "learning_rate": 0.00018109997339720284, "loss": 2.3859, "step": 17312 }, { "epoch": 0.22, "learning_rate": 0.00018108249483371437, "loss": 2.376, "step": 17320 }, { "epoch": 0.22, "learning_rate": 0.00018106500914105445, "loss": 2.3711, "step": 17328 }, { "epoch": 0.22, "learning_rate": 0.0001810475163209768, "loss": 2.3689, "step": 17336 }, { "epoch": 0.22, "learning_rate": 0.00018103001637523585, "loss": 2.351, "step": 17344 }, { "epoch": 0.22, "learning_rate": 0.0001810125093055867, "loss": 2.3794, "step": 17352 }, { "epoch": 0.22, "learning_rate": 0.00018099499511378526, "loss": 2.343, "step": 17360 }, { "epoch": 0.22, "learning_rate": 0.00018097747380158808, "loss": 2.3409, "step": 17368 }, { "epoch": 0.22, "learning_rate": 0.00018095994537075245, "loss": 2.3678, "step": 17376 }, { "epoch": 0.22, "learning_rate": 0.00018094240982303642, "loss": 2.3556, "step": 17384 }, { "epoch": 0.22, "learning_rate": 0.00018092486716019863, "loss": 2.3367, "step": 17392 }, { "epoch": 0.22, "learning_rate": 0.00018090731738399857, "loss": 2.3833, "step": 17400 }, { "epoch": 0.22, "learning_rate": 0.0001808897604961963, "loss": 2.3603, "step": 17408 }, { "epoch": 0.22, "learning_rate": 0.0001808721964985528, "loss": 2.3486, "step": 17416 }, { "epoch": 0.22, "learning_rate": 0.00018085462539282955, "loss": 2.3676, "step": 17424 }, { "epoch": 0.22, "learning_rate": 0.0001808370471807889, "loss": 2.3633, "step": 17432 }, { "epoch": 0.22, "learning_rate": 0.00018081946186419373, "loss": 2.374, "step": 17440 }, { "epoch": 0.22, "learning_rate": 0.0001808018694448079, "loss": 2.3513, "step": 17448 }, { "epoch": 0.22, "learning_rate": 0.0001807842699243957, "loss": 2.3595, "step": 17456 }, { "epoch": 0.22, "learning_rate": 0.00018076666330472233, "loss": 2.3797, "step": 17464 }, { "epoch": 0.22, "learning_rate": 0.00018074904958755356, "loss": 2.3481, "step": 17472 }, { "epoch": 0.22, "learning_rate": 0.00018073142877465608, "loss": 2.3589, "step": 17480 }, { "epoch": 0.22, "learning_rate": 0.00018071380086779704, "loss": 2.3441, "step": 17488 }, { "epoch": 0.22, "learning_rate": 0.00018069616586874446, "loss": 2.368, "step": 17496 }, { "epoch": 0.22, "learning_rate": 0.00018067852377926704, "loss": 2.3802, "step": 17504 }, { "epoch": 0.22, "learning_rate": 0.00018066087460113419, "loss": 2.3592, "step": 17512 }, { "epoch": 0.22, "learning_rate": 0.00018064321833611598, "loss": 2.3723, "step": 17520 }, { "epoch": 0.22, "learning_rate": 0.00018062555498598326, "loss": 2.3701, "step": 17528 }, { "epoch": 0.22, "learning_rate": 0.00018060788455250758, "loss": 2.3631, "step": 17536 }, { "epoch": 0.22, "learning_rate": 0.00018059020703746115, "loss": 2.36, "step": 17544 }, { "epoch": 0.22, "learning_rate": 0.0001805725224426169, "loss": 2.3722, "step": 17552 }, { "epoch": 0.22, "learning_rate": 0.0001805548307697486, "loss": 2.355, "step": 17560 }, { "epoch": 0.22, "learning_rate": 0.00018053713202063055, "loss": 2.375, "step": 17568 }, { "epoch": 0.22, "learning_rate": 0.00018051942619703784, "loss": 2.3581, "step": 17576 }, { "epoch": 0.22, "learning_rate": 0.00018050171330074623, "loss": 2.3616, "step": 17584 }, { "epoch": 0.22, "learning_rate": 0.0001804839933335323, "loss": 2.345, "step": 17592 }, { "epoch": 0.22, "learning_rate": 0.0001804662662971732, "loss": 2.367, "step": 17600 }, { "epoch": 0.22, "learning_rate": 0.00018044853219344688, "loss": 2.3672, "step": 17608 }, { "epoch": 0.22, "learning_rate": 0.00018043079102413197, "loss": 2.3736, "step": 17616 }, { "epoch": 0.22, "learning_rate": 0.0001804130427910078, "loss": 2.3985, "step": 17624 }, { "epoch": 0.22, "learning_rate": 0.00018039528749585443, "loss": 2.3715, "step": 17632 }, { "epoch": 0.22, "learning_rate": 0.0001803775251404526, "loss": 2.3789, "step": 17640 }, { "epoch": 0.22, "learning_rate": 0.00018035975572658377, "loss": 2.3686, "step": 17648 }, { "epoch": 0.22, "learning_rate": 0.00018034197925603015, "loss": 2.367, "step": 17656 }, { "epoch": 0.22, "learning_rate": 0.00018032419573057456, "loss": 2.3625, "step": 17664 }, { "epoch": 0.22, "learning_rate": 0.0001803064051520006, "loss": 2.3787, "step": 17672 }, { "epoch": 0.22, "learning_rate": 0.00018028860752209263, "loss": 2.3771, "step": 17680 }, { "epoch": 0.22, "learning_rate": 0.00018027080284263556, "loss": 2.3664, "step": 17688 }, { "epoch": 0.22, "learning_rate": 0.00018025299111541516, "loss": 2.3747, "step": 17696 }, { "epoch": 0.22, "learning_rate": 0.00018023517234221783, "loss": 2.3469, "step": 17704 }, { "epoch": 0.22, "learning_rate": 0.00018021734652483068, "loss": 2.3606, "step": 17712 }, { "epoch": 0.22, "learning_rate": 0.00018019951366504157, "loss": 2.3712, "step": 17720 }, { "epoch": 0.22, "learning_rate": 0.00018018167376463899, "loss": 2.368, "step": 17728 }, { "epoch": 0.22, "learning_rate": 0.0001801638268254122, "loss": 2.3606, "step": 17736 }, { "epoch": 0.22, "learning_rate": 0.00018014597284915116, "loss": 2.3681, "step": 17744 }, { "epoch": 0.22, "learning_rate": 0.0001801281118376465, "loss": 2.3725, "step": 17752 }, { "epoch": 0.22, "learning_rate": 0.0001801102437926896, "loss": 2.354, "step": 17760 }, { "epoch": 0.22, "learning_rate": 0.0001800923687160725, "loss": 2.3515, "step": 17768 }, { "epoch": 0.22, "learning_rate": 0.00018007448660958803, "loss": 2.3513, "step": 17776 }, { "epoch": 0.22, "learning_rate": 0.00018005659747502957, "loss": 2.3711, "step": 17784 }, { "epoch": 0.22, "learning_rate": 0.00018003870131419136, "loss": 2.3651, "step": 17792 }, { "epoch": 0.22, "learning_rate": 0.0001800207981288683, "loss": 2.3764, "step": 17800 }, { "epoch": 0.22, "learning_rate": 0.0001800028879208559, "loss": 2.3589, "step": 17808 }, { "epoch": 0.22, "learning_rate": 0.00017998497069195052, "loss": 2.3654, "step": 17816 }, { "epoch": 0.22, "learning_rate": 0.00017996704644394912, "loss": 2.3619, "step": 17824 }, { "epoch": 0.22, "learning_rate": 0.00017994911517864946, "loss": 2.3661, "step": 17832 }, { "epoch": 0.22, "learning_rate": 0.00017993117689784984, "loss": 2.3719, "step": 17840 }, { "epoch": 0.22, "learning_rate": 0.00017991323160334945, "loss": 2.3806, "step": 17848 }, { "epoch": 0.22, "learning_rate": 0.0001798952792969481, "loss": 2.3697, "step": 17856 }, { "epoch": 0.22, "learning_rate": 0.00017987731998044627, "loss": 2.3605, "step": 17864 }, { "epoch": 0.22, "learning_rate": 0.0001798593536556452, "loss": 2.3587, "step": 17872 }, { "epoch": 0.22, "learning_rate": 0.0001798413803243468, "loss": 2.3695, "step": 17880 }, { "epoch": 0.22, "learning_rate": 0.00017982339998835368, "loss": 2.3715, "step": 17888 }, { "epoch": 0.22, "learning_rate": 0.0001798054126494692, "loss": 2.3741, "step": 17896 }, { "epoch": 0.22, "learning_rate": 0.00017978741830949738, "loss": 2.3634, "step": 17904 }, { "epoch": 0.22, "learning_rate": 0.00017976941697024295, "loss": 2.337, "step": 17912 }, { "epoch": 0.22, "learning_rate": 0.0001797514086335113, "loss": 2.3751, "step": 17920 }, { "epoch": 0.22, "learning_rate": 0.00017973339330110862, "loss": 2.3771, "step": 17928 }, { "epoch": 0.22, "learning_rate": 0.0001797153709748417, "loss": 2.3653, "step": 17936 }, { "epoch": 0.22, "learning_rate": 0.00017969734165651814, "loss": 2.3601, "step": 17944 }, { "epoch": 0.22, "learning_rate": 0.0001796793053479461, "loss": 2.3713, "step": 17952 }, { "epoch": 0.22, "learning_rate": 0.00017966126205093457, "loss": 2.3614, "step": 17960 }, { "epoch": 0.22, "learning_rate": 0.00017964321176729318, "loss": 2.3672, "step": 17968 }, { "epoch": 0.22, "learning_rate": 0.00017962515449883225, "loss": 2.3607, "step": 17976 }, { "epoch": 0.22, "learning_rate": 0.0001796070902473629, "loss": 2.3666, "step": 17984 }, { "epoch": 0.22, "learning_rate": 0.00017958901901469676, "loss": 2.3635, "step": 17992 }, { "epoch": 0.23, "learning_rate": 0.00017957094080264634, "loss": 2.3672, "step": 18000 }, { "epoch": 0.23, "learning_rate": 0.00017955285561302477, "loss": 2.3717, "step": 18008 }, { "epoch": 0.23, "learning_rate": 0.0001795347634476459, "loss": 2.368, "step": 18016 }, { "epoch": 0.23, "learning_rate": 0.00017951666430832423, "loss": 2.3663, "step": 18024 }, { "epoch": 0.23, "learning_rate": 0.00017949855819687506, "loss": 2.367, "step": 18032 }, { "epoch": 0.23, "learning_rate": 0.0001794804451151143, "loss": 2.3878, "step": 18040 }, { "epoch": 0.23, "learning_rate": 0.00017946232506485857, "loss": 2.3693, "step": 18048 }, { "epoch": 0.23, "learning_rate": 0.00017944419804792527, "loss": 2.347, "step": 18056 }, { "epoch": 0.23, "learning_rate": 0.00017942606406613242, "loss": 2.346, "step": 18064 }, { "epoch": 0.23, "learning_rate": 0.0001794079231212987, "loss": 2.3581, "step": 18072 }, { "epoch": 0.23, "learning_rate": 0.00017938977521524355, "loss": 2.3576, "step": 18080 }, { "epoch": 0.23, "learning_rate": 0.00017937162034978714, "loss": 2.3717, "step": 18088 }, { "epoch": 0.23, "learning_rate": 0.0001793534585267503, "loss": 2.3828, "step": 18096 }, { "epoch": 0.23, "learning_rate": 0.00017933528974795456, "loss": 2.3749, "step": 18104 }, { "epoch": 0.23, "learning_rate": 0.0001793171140152221, "loss": 2.3684, "step": 18112 }, { "epoch": 0.23, "learning_rate": 0.00017929893133037593, "loss": 2.3748, "step": 18120 }, { "epoch": 0.23, "learning_rate": 0.00017928074169523957, "loss": 2.3783, "step": 18128 }, { "epoch": 0.23, "learning_rate": 0.0001792625451116374, "loss": 2.355, "step": 18136 }, { "epoch": 0.23, "learning_rate": 0.00017924434158139442, "loss": 2.3709, "step": 18144 }, { "epoch": 0.23, "learning_rate": 0.00017922613110633634, "loss": 2.3436, "step": 18152 }, { "epoch": 0.23, "learning_rate": 0.0001792079136882896, "loss": 2.3698, "step": 18160 }, { "epoch": 0.23, "learning_rate": 0.0001791896893290812, "loss": 2.3607, "step": 18168 }, { "epoch": 0.23, "learning_rate": 0.00017917145803053906, "loss": 2.353, "step": 18176 }, { "epoch": 0.23, "learning_rate": 0.00017915321979449162, "loss": 2.3529, "step": 18184 }, { "epoch": 0.23, "learning_rate": 0.00017913497462276808, "loss": 2.3774, "step": 18192 }, { "epoch": 0.23, "learning_rate": 0.0001791167225171983, "loss": 2.363, "step": 18200 }, { "epoch": 0.23, "learning_rate": 0.00017909846347961294, "loss": 2.3738, "step": 18208 }, { "epoch": 0.23, "learning_rate": 0.00017908019751184317, "loss": 2.362, "step": 18216 }, { "epoch": 0.23, "learning_rate": 0.000179061924615721, "loss": 2.374, "step": 18224 }, { "epoch": 0.23, "learning_rate": 0.0001790436447930792, "loss": 2.3554, "step": 18232 }, { "epoch": 0.23, "learning_rate": 0.00017902535804575104, "loss": 2.3519, "step": 18240 }, { "epoch": 0.23, "learning_rate": 0.00017900706437557054, "loss": 2.3493, "step": 18248 }, { "epoch": 0.23, "learning_rate": 0.00017898876378437251, "loss": 2.3605, "step": 18256 }, { "epoch": 0.23, "learning_rate": 0.00017897045627399241, "loss": 2.355, "step": 18264 }, { "epoch": 0.23, "learning_rate": 0.00017895214184626633, "loss": 2.3568, "step": 18272 }, { "epoch": 0.23, "learning_rate": 0.00017893382050303112, "loss": 2.3796, "step": 18280 }, { "epoch": 0.23, "learning_rate": 0.00017891549224612435, "loss": 2.3619, "step": 18288 }, { "epoch": 0.23, "learning_rate": 0.00017889715707738416, "loss": 2.3586, "step": 18296 }, { "epoch": 0.23, "learning_rate": 0.00017887881499864953, "loss": 2.3753, "step": 18304 }, { "epoch": 0.23, "learning_rate": 0.00017886046601176006, "loss": 2.3635, "step": 18312 }, { "epoch": 0.23, "learning_rate": 0.000178842110118556, "loss": 2.3602, "step": 18320 }, { "epoch": 0.23, "learning_rate": 0.0001788237473208784, "loss": 2.3755, "step": 18328 }, { "epoch": 0.23, "learning_rate": 0.00017880537762056894, "loss": 2.3766, "step": 18336 }, { "epoch": 0.23, "learning_rate": 0.00017878700101946993, "loss": 2.3753, "step": 18344 }, { "epoch": 0.23, "learning_rate": 0.0001787686175194245, "loss": 2.3663, "step": 18352 }, { "epoch": 0.23, "learning_rate": 0.00017875022712227642, "loss": 2.3524, "step": 18360 }, { "epoch": 0.23, "learning_rate": 0.00017873182982987008, "loss": 2.335, "step": 18368 }, { "epoch": 0.23, "learning_rate": 0.0001787134256440507, "loss": 2.3788, "step": 18376 }, { "epoch": 0.23, "learning_rate": 0.0001786950145666641, "loss": 2.3763, "step": 18384 }, { "epoch": 0.23, "learning_rate": 0.00017867659659955674, "loss": 2.3478, "step": 18392 }, { "epoch": 0.23, "learning_rate": 0.0001786581717445759, "loss": 2.3608, "step": 18400 }, { "epoch": 0.23, "learning_rate": 0.00017863974000356946, "loss": 2.3671, "step": 18408 }, { "epoch": 0.23, "learning_rate": 0.00017862130137838604, "loss": 2.3752, "step": 18416 }, { "epoch": 0.23, "learning_rate": 0.00017860285587087494, "loss": 2.3711, "step": 18424 }, { "epoch": 0.23, "learning_rate": 0.0001785844034828861, "loss": 2.3499, "step": 18432 }, { "epoch": 0.23, "learning_rate": 0.00017856594421627022, "loss": 2.3592, "step": 18440 }, { "epoch": 0.23, "learning_rate": 0.00017854747807287866, "loss": 2.365, "step": 18448 }, { "epoch": 0.23, "learning_rate": 0.00017852900505456346, "loss": 2.3702, "step": 18456 }, { "epoch": 0.23, "learning_rate": 0.00017851052516317735, "loss": 2.3503, "step": 18464 }, { "epoch": 0.23, "learning_rate": 0.00017849203840057375, "loss": 2.3636, "step": 18472 }, { "epoch": 0.23, "learning_rate": 0.0001784735447686068, "loss": 2.3577, "step": 18480 }, { "epoch": 0.23, "learning_rate": 0.00017845504426913133, "loss": 2.3783, "step": 18488 }, { "epoch": 0.23, "learning_rate": 0.00017843653690400278, "loss": 2.3564, "step": 18496 }, { "epoch": 0.23, "learning_rate": 0.0001784180226750774, "loss": 2.3723, "step": 18504 }, { "epoch": 0.23, "learning_rate": 0.000178399501584212, "loss": 2.3573, "step": 18512 }, { "epoch": 0.23, "learning_rate": 0.00017838097363326416, "loss": 2.3641, "step": 18520 }, { "epoch": 0.23, "learning_rate": 0.0001783624388240921, "loss": 2.3603, "step": 18528 }, { "epoch": 0.23, "learning_rate": 0.00017834389715855485, "loss": 2.351, "step": 18536 }, { "epoch": 0.23, "learning_rate": 0.00017832534863851195, "loss": 2.3676, "step": 18544 }, { "epoch": 0.23, "learning_rate": 0.00017830679326582373, "loss": 2.3389, "step": 18552 }, { "epoch": 0.23, "learning_rate": 0.00017828823104235118, "loss": 2.368, "step": 18560 }, { "epoch": 0.23, "learning_rate": 0.00017826966196995603, "loss": 2.3504, "step": 18568 }, { "epoch": 0.23, "learning_rate": 0.0001782510860505006, "loss": 2.3597, "step": 18576 }, { "epoch": 0.23, "learning_rate": 0.00017823250328584798, "loss": 2.3658, "step": 18584 }, { "epoch": 0.23, "learning_rate": 0.0001782139136778619, "loss": 2.3667, "step": 18592 }, { "epoch": 0.23, "learning_rate": 0.0001781953172284068, "loss": 2.3673, "step": 18600 }, { "epoch": 0.23, "learning_rate": 0.0001781767139393478, "loss": 2.3695, "step": 18608 }, { "epoch": 0.23, "learning_rate": 0.0001781581038125507, "loss": 2.3714, "step": 18616 }, { "epoch": 0.23, "learning_rate": 0.000178139486849882, "loss": 2.3517, "step": 18624 }, { "epoch": 0.23, "learning_rate": 0.00017812086305320885, "loss": 2.3468, "step": 18632 }, { "epoch": 0.23, "learning_rate": 0.00017810223242439917, "loss": 2.3598, "step": 18640 }, { "epoch": 0.23, "learning_rate": 0.00017808359496532144, "loss": 2.3608, "step": 18648 }, { "epoch": 0.23, "learning_rate": 0.00017806495067784493, "loss": 2.354, "step": 18656 }, { "epoch": 0.23, "learning_rate": 0.00017804629956383948, "loss": 2.359, "step": 18664 }, { "epoch": 0.23, "learning_rate": 0.00017802764162517582, "loss": 2.3571, "step": 18672 }, { "epoch": 0.23, "learning_rate": 0.00017800897686372517, "loss": 2.3655, "step": 18680 }, { "epoch": 0.23, "learning_rate": 0.00017799030528135949, "loss": 2.3576, "step": 18688 }, { "epoch": 0.23, "learning_rate": 0.00017797162687995143, "loss": 2.348, "step": 18696 }, { "epoch": 0.23, "learning_rate": 0.00017795294166137438, "loss": 2.3568, "step": 18704 }, { "epoch": 0.23, "learning_rate": 0.0001779342496275023, "loss": 2.342, "step": 18712 }, { "epoch": 0.23, "learning_rate": 0.0001779155507802099, "loss": 2.3503, "step": 18720 }, { "epoch": 0.23, "learning_rate": 0.0001778968451213726, "loss": 2.3769, "step": 18728 }, { "epoch": 0.23, "learning_rate": 0.0001778781326528665, "loss": 2.3731, "step": 18736 }, { "epoch": 0.23, "learning_rate": 0.00017785941337656827, "loss": 2.3486, "step": 18744 }, { "epoch": 0.23, "learning_rate": 0.0001778406872943554, "loss": 2.3552, "step": 18752 }, { "epoch": 0.23, "learning_rate": 0.00017782195440810598, "loss": 2.3627, "step": 18760 }, { "epoch": 0.23, "learning_rate": 0.00017780321471969884, "loss": 2.3813, "step": 18768 }, { "epoch": 0.23, "learning_rate": 0.0001777844682310135, "loss": 2.3415, "step": 18776 }, { "epoch": 0.23, "learning_rate": 0.00017776571494393007, "loss": 2.3774, "step": 18784 }, { "epoch": 0.23, "learning_rate": 0.0001777469548603294, "loss": 2.3631, "step": 18792 }, { "epoch": 0.23, "learning_rate": 0.00017772818798209304, "loss": 2.3417, "step": 18800 }, { "epoch": 0.24, "learning_rate": 0.00017770941431110318, "loss": 2.3654, "step": 18808 }, { "epoch": 0.24, "learning_rate": 0.00017769063384924272, "loss": 2.3642, "step": 18816 }, { "epoch": 0.24, "learning_rate": 0.0001776718465983953, "loss": 2.3471, "step": 18824 }, { "epoch": 0.24, "learning_rate": 0.000177653052560445, "loss": 2.3692, "step": 18832 }, { "epoch": 0.24, "learning_rate": 0.00017763425173727697, "loss": 2.3617, "step": 18840 }, { "epoch": 0.24, "learning_rate": 0.0001776154441307767, "loss": 2.3598, "step": 18848 }, { "epoch": 0.24, "learning_rate": 0.0001775966297428305, "loss": 2.3466, "step": 18856 }, { "epoch": 0.24, "learning_rate": 0.0001775778085753254, "loss": 2.3757, "step": 18864 }, { "epoch": 0.24, "learning_rate": 0.000177558980630149, "loss": 2.354, "step": 18872 }, { "epoch": 0.24, "learning_rate": 0.0001775401459091896, "loss": 2.3602, "step": 18880 }, { "epoch": 0.24, "learning_rate": 0.00017752130441433633, "loss": 2.3486, "step": 18888 }, { "epoch": 0.24, "learning_rate": 0.0001775024561474788, "loss": 2.3768, "step": 18896 }, { "epoch": 0.24, "learning_rate": 0.00017748360111050743, "loss": 2.3586, "step": 18904 }, { "epoch": 0.24, "learning_rate": 0.00017746473930531324, "loss": 2.3485, "step": 18912 }, { "epoch": 0.24, "learning_rate": 0.00017744587073378798, "loss": 2.3452, "step": 18920 }, { "epoch": 0.24, "learning_rate": 0.00017742699539782407, "loss": 2.368, "step": 18928 }, { "epoch": 0.24, "learning_rate": 0.00017740811329931453, "loss": 2.3618, "step": 18936 }, { "epoch": 0.24, "learning_rate": 0.00017738922444015322, "loss": 2.3616, "step": 18944 }, { "epoch": 0.24, "learning_rate": 0.00017737032882223454, "loss": 2.3601, "step": 18952 }, { "epoch": 0.24, "learning_rate": 0.00017735142644745362, "loss": 2.3789, "step": 18960 }, { "epoch": 0.24, "learning_rate": 0.00017733251731770627, "loss": 2.3681, "step": 18968 }, { "epoch": 0.24, "learning_rate": 0.00017731360143488897, "loss": 2.3673, "step": 18976 }, { "epoch": 0.24, "learning_rate": 0.00017729467880089883, "loss": 2.3599, "step": 18984 }, { "epoch": 0.24, "learning_rate": 0.00017727574941763373, "loss": 2.3417, "step": 18992 }, { "epoch": 0.24, "learning_rate": 0.00017725681328699215, "loss": 2.3678, "step": 19000 }, { "epoch": 0.24, "learning_rate": 0.00017723787041087335, "loss": 2.352, "step": 19008 }, { "epoch": 0.24, "learning_rate": 0.00017721892079117707, "loss": 2.3614, "step": 19016 }, { "epoch": 0.24, "learning_rate": 0.00017719996442980398, "loss": 2.3612, "step": 19024 }, { "epoch": 0.24, "learning_rate": 0.00017718100132865523, "loss": 2.3615, "step": 19032 }, { "epoch": 0.24, "learning_rate": 0.00017716203148963267, "loss": 2.3527, "step": 19040 }, { "epoch": 0.24, "learning_rate": 0.00017714305491463894, "loss": 2.3635, "step": 19048 }, { "epoch": 0.24, "learning_rate": 0.00017712407160557726, "loss": 2.3474, "step": 19056 }, { "epoch": 0.24, "learning_rate": 0.00017710508156435154, "loss": 2.3694, "step": 19064 }, { "epoch": 0.24, "learning_rate": 0.0001770860847928664, "loss": 2.3654, "step": 19072 }, { "epoch": 0.24, "learning_rate": 0.00017706708129302704, "loss": 2.3675, "step": 19080 }, { "epoch": 0.24, "learning_rate": 0.00017704807106673945, "loss": 2.3614, "step": 19088 }, { "epoch": 0.24, "learning_rate": 0.00017702905411591025, "loss": 2.3551, "step": 19096 }, { "epoch": 0.24, "learning_rate": 0.00017701003044244678, "loss": 2.3585, "step": 19104 }, { "epoch": 0.24, "learning_rate": 0.00017699100004825693, "loss": 2.3714, "step": 19112 }, { "epoch": 0.24, "learning_rate": 0.00017697196293524936, "loss": 2.3416, "step": 19120 }, { "epoch": 0.24, "learning_rate": 0.00017695291910533337, "loss": 2.3811, "step": 19128 }, { "epoch": 0.24, "learning_rate": 0.00017693386856041903, "loss": 2.3385, "step": 19136 }, { "epoch": 0.24, "learning_rate": 0.0001769148113024169, "loss": 2.3523, "step": 19144 }, { "epoch": 0.24, "learning_rate": 0.00017689574733323834, "loss": 2.3547, "step": 19152 }, { "epoch": 0.24, "learning_rate": 0.00017687667665479542, "loss": 2.372, "step": 19160 }, { "epoch": 0.24, "learning_rate": 0.00017685759926900073, "loss": 2.3551, "step": 19168 }, { "epoch": 0.24, "learning_rate": 0.0001768385151777677, "loss": 2.3483, "step": 19176 }, { "epoch": 0.24, "learning_rate": 0.0001768194243830103, "loss": 2.3489, "step": 19184 }, { "epoch": 0.24, "learning_rate": 0.00017680032688664328, "loss": 2.3497, "step": 19192 }, { "epoch": 0.24, "learning_rate": 0.000176781222690582, "loss": 2.3784, "step": 19200 }, { "epoch": 0.24, "learning_rate": 0.00017676211179674242, "loss": 2.3566, "step": 19208 }, { "epoch": 0.24, "learning_rate": 0.0001767429942070414, "loss": 2.3713, "step": 19216 }, { "epoch": 0.24, "learning_rate": 0.0001767238699233962, "loss": 2.364, "step": 19224 }, { "epoch": 0.24, "learning_rate": 0.00017670473894772492, "loss": 2.3437, "step": 19232 }, { "epoch": 0.24, "learning_rate": 0.00017668560128194635, "loss": 2.3489, "step": 19240 }, { "epoch": 0.24, "learning_rate": 0.00017666645692797977, "loss": 2.3529, "step": 19248 }, { "epoch": 0.24, "learning_rate": 0.00017664730588774533, "loss": 2.3495, "step": 19256 }, { "epoch": 0.24, "learning_rate": 0.00017662814816316378, "loss": 2.3709, "step": 19264 }, { "epoch": 0.24, "learning_rate": 0.00017660898375615645, "loss": 2.3841, "step": 19272 }, { "epoch": 0.24, "learning_rate": 0.00017658981266864554, "loss": 2.3774, "step": 19280 }, { "epoch": 0.24, "learning_rate": 0.00017657063490255373, "loss": 2.3625, "step": 19288 }, { "epoch": 0.24, "learning_rate": 0.0001765514504598044, "loss": 2.3602, "step": 19296 }, { "epoch": 0.24, "learning_rate": 0.0001765322593423217, "loss": 2.3767, "step": 19304 }, { "epoch": 0.24, "learning_rate": 0.00017651306155203042, "loss": 2.3594, "step": 19312 }, { "epoch": 0.24, "learning_rate": 0.00017649385709085592, "loss": 2.3774, "step": 19320 }, { "epoch": 0.24, "learning_rate": 0.00017647464596072437, "loss": 2.3725, "step": 19328 }, { "epoch": 0.24, "learning_rate": 0.00017645542816356244, "loss": 2.3644, "step": 19336 }, { "epoch": 0.24, "learning_rate": 0.00017643620370129764, "loss": 2.3864, "step": 19344 }, { "epoch": 0.24, "learning_rate": 0.00017641697257585808, "loss": 2.3797, "step": 19352 }, { "epoch": 0.24, "learning_rate": 0.00017639773478917247, "loss": 2.3655, "step": 19360 }, { "epoch": 0.24, "learning_rate": 0.00017637849034317032, "loss": 2.3545, "step": 19368 }, { "epoch": 0.24, "learning_rate": 0.00017635923923978172, "loss": 2.3781, "step": 19376 }, { "epoch": 0.24, "learning_rate": 0.00017633998148093745, "loss": 2.3663, "step": 19384 }, { "epoch": 0.24, "learning_rate": 0.0001763207170685689, "loss": 2.353, "step": 19392 }, { "epoch": 0.24, "learning_rate": 0.00017630144600460824, "loss": 2.361, "step": 19400 }, { "epoch": 0.24, "learning_rate": 0.0001762821682909882, "loss": 2.3603, "step": 19408 }, { "epoch": 0.24, "learning_rate": 0.0001762628839296423, "loss": 2.3727, "step": 19416 }, { "epoch": 0.24, "learning_rate": 0.00017624359292250458, "loss": 2.3707, "step": 19424 }, { "epoch": 0.24, "learning_rate": 0.00017622429527150985, "loss": 2.3632, "step": 19432 }, { "epoch": 0.24, "learning_rate": 0.00017620499097859357, "loss": 2.3458, "step": 19440 }, { "epoch": 0.24, "learning_rate": 0.00017618568004569183, "loss": 2.3635, "step": 19448 }, { "epoch": 0.24, "learning_rate": 0.0001761663624747414, "loss": 2.3594, "step": 19456 }, { "epoch": 0.24, "learning_rate": 0.00017614703826767972, "loss": 2.3644, "step": 19464 }, { "epoch": 0.24, "learning_rate": 0.00017612770742644491, "loss": 2.3531, "step": 19472 }, { "epoch": 0.24, "learning_rate": 0.00017610836995297577, "loss": 2.363, "step": 19480 }, { "epoch": 0.24, "learning_rate": 0.0001760890258492117, "loss": 2.3618, "step": 19488 }, { "epoch": 0.24, "learning_rate": 0.00017606967511709282, "loss": 2.3622, "step": 19496 }, { "epoch": 0.24, "learning_rate": 0.00017605031775855994, "loss": 2.3803, "step": 19504 }, { "epoch": 0.24, "learning_rate": 0.0001760309537755544, "loss": 2.3765, "step": 19512 }, { "epoch": 0.24, "learning_rate": 0.00017601158317001833, "loss": 2.3459, "step": 19520 }, { "epoch": 0.24, "learning_rate": 0.00017599220594389457, "loss": 2.3813, "step": 19528 }, { "epoch": 0.24, "learning_rate": 0.00017597282209912645, "loss": 2.3752, "step": 19536 }, { "epoch": 0.24, "learning_rate": 0.00017595343163765808, "loss": 2.3742, "step": 19544 }, { "epoch": 0.24, "learning_rate": 0.00017593403456143424, "loss": 2.3635, "step": 19552 }, { "epoch": 0.24, "learning_rate": 0.00017591463087240038, "loss": 2.3537, "step": 19560 }, { "epoch": 0.24, "learning_rate": 0.0001758952205725025, "loss": 2.3463, "step": 19568 }, { "epoch": 0.24, "learning_rate": 0.00017587580366368736, "loss": 2.3652, "step": 19576 }, { "epoch": 0.24, "learning_rate": 0.00017585638014790242, "loss": 2.3784, "step": 19584 }, { "epoch": 0.24, "learning_rate": 0.00017583695002709572, "loss": 2.37, "step": 19592 }, { "epoch": 0.24, "learning_rate": 0.00017581751330321595, "loss": 2.3507, "step": 19600 }, { "epoch": 0.25, "learning_rate": 0.00017579806997821256, "loss": 2.3713, "step": 19608 }, { "epoch": 0.25, "learning_rate": 0.0001757786200540356, "loss": 2.3637, "step": 19616 }, { "epoch": 0.25, "learning_rate": 0.00017575916353263572, "loss": 2.3668, "step": 19624 }, { "epoch": 0.25, "learning_rate": 0.00017573970041596438, "loss": 2.3752, "step": 19632 }, { "epoch": 0.25, "learning_rate": 0.00017572023070597362, "loss": 2.3644, "step": 19640 }, { "epoch": 0.25, "learning_rate": 0.00017570075440461608, "loss": 2.3576, "step": 19648 }, { "epoch": 0.25, "learning_rate": 0.0001756812715138451, "loss": 2.3859, "step": 19656 }, { "epoch": 0.25, "learning_rate": 0.00017566178203561487, "loss": 2.3603, "step": 19664 }, { "epoch": 0.25, "learning_rate": 0.00017564228597187988, "loss": 2.3396, "step": 19672 }, { "epoch": 0.25, "learning_rate": 0.0001756227833245956, "loss": 2.3573, "step": 19680 }, { "epoch": 0.25, "learning_rate": 0.00017560327409571797, "loss": 2.3511, "step": 19688 }, { "epoch": 0.25, "learning_rate": 0.00017558375828720366, "loss": 2.3829, "step": 19696 }, { "epoch": 0.25, "learning_rate": 0.00017556423590101003, "loss": 2.3708, "step": 19704 }, { "epoch": 0.25, "learning_rate": 0.00017554470693909507, "loss": 2.3486, "step": 19712 }, { "epoch": 0.25, "learning_rate": 0.0001755251714034174, "loss": 2.362, "step": 19720 }, { "epoch": 0.25, "learning_rate": 0.00017550562929593628, "loss": 2.3758, "step": 19728 }, { "epoch": 0.25, "learning_rate": 0.00017548608061861176, "loss": 2.3544, "step": 19736 }, { "epoch": 0.25, "learning_rate": 0.0001754665253734044, "loss": 2.371, "step": 19744 }, { "epoch": 0.25, "learning_rate": 0.0001754469635622755, "loss": 2.3826, "step": 19752 }, { "epoch": 0.25, "learning_rate": 0.00017542739518718698, "loss": 2.3571, "step": 19760 }, { "epoch": 0.25, "learning_rate": 0.0001754078202501015, "loss": 2.3608, "step": 19768 }, { "epoch": 0.25, "learning_rate": 0.00017538823875298224, "loss": 2.3789, "step": 19776 }, { "epoch": 0.25, "learning_rate": 0.0001753686506977931, "loss": 2.3562, "step": 19784 }, { "epoch": 0.25, "learning_rate": 0.00017534905608649874, "loss": 2.3731, "step": 19792 }, { "epoch": 0.25, "learning_rate": 0.00017532945492106436, "loss": 2.3503, "step": 19800 }, { "epoch": 0.25, "learning_rate": 0.0001753098472034558, "loss": 2.3792, "step": 19808 }, { "epoch": 0.25, "learning_rate": 0.00017529023293563967, "loss": 2.3617, "step": 19816 }, { "epoch": 0.25, "learning_rate": 0.0001752706121195831, "loss": 2.3721, "step": 19824 }, { "epoch": 0.25, "learning_rate": 0.00017525098475725396, "loss": 2.3495, "step": 19832 }, { "epoch": 0.25, "learning_rate": 0.0001752313508506208, "loss": 2.3503, "step": 19840 }, { "epoch": 0.25, "learning_rate": 0.00017521171040165277, "loss": 2.3765, "step": 19848 }, { "epoch": 0.25, "learning_rate": 0.0001751920634123197, "loss": 2.3723, "step": 19856 }, { "epoch": 0.25, "learning_rate": 0.00017517240988459208, "loss": 2.3673, "step": 19864 }, { "epoch": 0.25, "learning_rate": 0.00017515274982044104, "loss": 2.3582, "step": 19872 }, { "epoch": 0.25, "learning_rate": 0.00017513308322183833, "loss": 2.3634, "step": 19880 }, { "epoch": 0.25, "learning_rate": 0.00017511341009075648, "loss": 2.3637, "step": 19888 }, { "epoch": 0.25, "learning_rate": 0.0001750937304291685, "loss": 2.3578, "step": 19896 }, { "epoch": 0.25, "learning_rate": 0.00017507404423904824, "loss": 2.3792, "step": 19904 }, { "epoch": 0.25, "learning_rate": 0.00017505435152237006, "loss": 2.3734, "step": 19912 }, { "epoch": 0.25, "learning_rate": 0.00017503465228110905, "loss": 2.3611, "step": 19920 }, { "epoch": 0.25, "learning_rate": 0.00017501494651724094, "loss": 2.3591, "step": 19928 }, { "epoch": 0.25, "learning_rate": 0.00017499523423274204, "loss": 2.3544, "step": 19936 }, { "epoch": 0.25, "learning_rate": 0.00017497551542958946, "loss": 2.3551, "step": 19944 }, { "epoch": 0.25, "learning_rate": 0.00017495579010976087, "loss": 2.3635, "step": 19952 }, { "epoch": 0.25, "learning_rate": 0.00017493605827523457, "loss": 2.3465, "step": 19960 }, { "epoch": 0.25, "learning_rate": 0.00017491631992798957, "loss": 2.3459, "step": 19968 }, { "epoch": 0.25, "learning_rate": 0.00017489657507000552, "loss": 2.3583, "step": 19976 }, { "epoch": 0.25, "learning_rate": 0.0001748768237032627, "loss": 2.3568, "step": 19984 }, { "epoch": 0.25, "learning_rate": 0.0001748570658297421, "loss": 2.3692, "step": 19992 }, { "epoch": 0.25, "learning_rate": 0.0001748373014514253, "loss": 2.351, "step": 20000 }, { "epoch": 0.25, "learning_rate": 0.0001748175305702945, "loss": 2.3703, "step": 20008 }, { "epoch": 0.25, "learning_rate": 0.00017479775318833275, "loss": 2.3765, "step": 20016 }, { "epoch": 0.25, "learning_rate": 0.00017477796930752344, "loss": 2.3469, "step": 20024 }, { "epoch": 0.25, "learning_rate": 0.00017475817892985093, "loss": 2.3684, "step": 20032 }, { "epoch": 0.25, "learning_rate": 0.00017473838205729993, "loss": 2.3591, "step": 20040 }, { "epoch": 0.25, "learning_rate": 0.00017471857869185608, "loss": 2.3401, "step": 20048 }, { "epoch": 0.25, "learning_rate": 0.00017469876883550553, "loss": 2.3562, "step": 20056 }, { "epoch": 0.25, "learning_rate": 0.00017467895249023504, "loss": 2.3558, "step": 20064 }, { "epoch": 0.25, "learning_rate": 0.00017465912965803208, "loss": 2.3774, "step": 20072 }, { "epoch": 0.25, "learning_rate": 0.00017463930034088485, "loss": 2.3807, "step": 20080 }, { "epoch": 0.25, "learning_rate": 0.00017461946454078205, "loss": 2.359, "step": 20088 }, { "epoch": 0.25, "learning_rate": 0.0001745996222597131, "loss": 2.3857, "step": 20096 }, { "epoch": 0.25, "learning_rate": 0.00017457977349966805, "loss": 2.3659, "step": 20104 }, { "epoch": 0.25, "learning_rate": 0.0001745599182626377, "loss": 2.3506, "step": 20112 }, { "epoch": 0.25, "learning_rate": 0.00017454005655061333, "loss": 2.3504, "step": 20120 }, { "epoch": 0.25, "learning_rate": 0.000174520188365587, "loss": 2.3779, "step": 20128 }, { "epoch": 0.25, "learning_rate": 0.00017450031370955138, "loss": 2.3579, "step": 20136 }, { "epoch": 0.25, "learning_rate": 0.00017448043258449977, "loss": 2.3399, "step": 20144 }, { "epoch": 0.25, "learning_rate": 0.0001744605449924261, "loss": 2.3628, "step": 20152 }, { "epoch": 0.25, "learning_rate": 0.00017444065093532505, "loss": 2.3445, "step": 20160 }, { "epoch": 0.25, "learning_rate": 0.00017442075041519187, "loss": 2.3727, "step": 20168 }, { "epoch": 0.25, "learning_rate": 0.00017440084343402245, "loss": 2.3636, "step": 20176 }, { "epoch": 0.25, "learning_rate": 0.00017438092999381332, "loss": 2.3718, "step": 20184 }, { "epoch": 0.25, "learning_rate": 0.00017436101009656174, "loss": 2.355, "step": 20192 }, { "epoch": 0.25, "learning_rate": 0.00017434108374426554, "loss": 2.3559, "step": 20200 }, { "epoch": 0.25, "learning_rate": 0.0001743211509389232, "loss": 2.3768, "step": 20208 }, { "epoch": 0.25, "learning_rate": 0.00017430121168253388, "loss": 2.3529, "step": 20216 }, { "epoch": 0.25, "learning_rate": 0.00017428126597709737, "loss": 2.3641, "step": 20224 }, { "epoch": 0.25, "learning_rate": 0.00017426131382461415, "loss": 2.3489, "step": 20232 }, { "epoch": 0.25, "learning_rate": 0.00017424135522708527, "loss": 2.3587, "step": 20240 }, { "epoch": 0.25, "learning_rate": 0.00017422139018651245, "loss": 2.3844, "step": 20248 }, { "epoch": 0.25, "learning_rate": 0.0001742014187048981, "loss": 2.3504, "step": 20256 }, { "epoch": 0.25, "learning_rate": 0.00017418144078424526, "loss": 2.3695, "step": 20264 }, { "epoch": 0.25, "learning_rate": 0.0001741614564265576, "loss": 2.368, "step": 20272 }, { "epoch": 0.25, "learning_rate": 0.0001741414656338394, "loss": 2.3634, "step": 20280 }, { "epoch": 0.25, "learning_rate": 0.0001741214684080956, "loss": 2.3665, "step": 20288 }, { "epoch": 0.25, "learning_rate": 0.00017410146475133192, "loss": 2.3592, "step": 20296 }, { "epoch": 0.25, "learning_rate": 0.00017408145466555448, "loss": 2.3603, "step": 20304 }, { "epoch": 0.25, "learning_rate": 0.00017406143815277026, "loss": 2.3426, "step": 20312 }, { "epoch": 0.25, "learning_rate": 0.0001740414152149868, "loss": 2.3596, "step": 20320 }, { "epoch": 0.25, "learning_rate": 0.00017402138585421225, "loss": 2.3716, "step": 20328 }, { "epoch": 0.25, "learning_rate": 0.0001740013500724555, "loss": 2.3583, "step": 20336 }, { "epoch": 0.25, "learning_rate": 0.00017398130787172597, "loss": 2.3814, "step": 20344 }, { "epoch": 0.25, "learning_rate": 0.0001739612592540338, "loss": 2.3608, "step": 20352 }, { "epoch": 0.25, "learning_rate": 0.00017394120422138977, "loss": 2.3618, "step": 20360 }, { "epoch": 0.25, "learning_rate": 0.00017392114277580523, "loss": 2.3501, "step": 20368 }, { "epoch": 0.25, "learning_rate": 0.0001739010749192923, "loss": 2.3855, "step": 20376 }, { "epoch": 0.25, "learning_rate": 0.00017388100065386363, "loss": 2.3531, "step": 20384 }, { "epoch": 0.25, "learning_rate": 0.00017386091998153254, "loss": 2.3401, "step": 20392 }, { "epoch": 0.26, "learning_rate": 0.00017384083290431307, "loss": 2.3539, "step": 20400 }, { "epoch": 0.26, "learning_rate": 0.00017382073942421978, "loss": 2.3492, "step": 20408 }, { "epoch": 0.26, "learning_rate": 0.00017380063954326795, "loss": 2.375, "step": 20416 }, { "epoch": 0.26, "learning_rate": 0.00017378053326347348, "loss": 2.364, "step": 20424 }, { "epoch": 0.26, "learning_rate": 0.00017376042058685296, "loss": 2.3499, "step": 20432 }, { "epoch": 0.26, "learning_rate": 0.0001737403015154235, "loss": 2.3574, "step": 20440 }, { "epoch": 0.26, "learning_rate": 0.000173720176051203, "loss": 2.3583, "step": 20448 }, { "epoch": 0.26, "learning_rate": 0.00017370004419620992, "loss": 2.3536, "step": 20456 }, { "epoch": 0.26, "learning_rate": 0.0001736799059524633, "loss": 2.3585, "step": 20464 }, { "epoch": 0.26, "learning_rate": 0.00017365976132198297, "loss": 2.3634, "step": 20472 }, { "epoch": 0.26, "learning_rate": 0.00017363961030678927, "loss": 2.3562, "step": 20480 }, { "epoch": 0.26, "learning_rate": 0.00017361945290890333, "loss": 2.3574, "step": 20488 }, { "epoch": 0.26, "learning_rate": 0.00017359928913034667, "loss": 2.3597, "step": 20496 }, { "epoch": 0.26, "learning_rate": 0.0001735791189731417, "loss": 2.3698, "step": 20504 }, { "epoch": 0.26, "learning_rate": 0.00017355894243931136, "loss": 2.3545, "step": 20512 }, { "epoch": 0.26, "learning_rate": 0.00017353875953087926, "loss": 2.3419, "step": 20520 }, { "epoch": 0.26, "learning_rate": 0.0001735185702498696, "loss": 2.3703, "step": 20528 }, { "epoch": 0.26, "learning_rate": 0.00017349837459830727, "loss": 2.3631, "step": 20536 }, { "epoch": 0.26, "learning_rate": 0.00017347817257821774, "loss": 2.3385, "step": 20544 }, { "epoch": 0.26, "learning_rate": 0.00017345796419162722, "loss": 2.3378, "step": 20552 }, { "epoch": 0.26, "learning_rate": 0.00017343774944056245, "loss": 2.3522, "step": 20560 }, { "epoch": 0.26, "learning_rate": 0.00017341752832705087, "loss": 2.3528, "step": 20568 }, { "epoch": 0.26, "learning_rate": 0.0001733973008531205, "loss": 2.3652, "step": 20576 }, { "epoch": 0.26, "learning_rate": 0.00017337706702080015, "loss": 2.3476, "step": 20584 }, { "epoch": 0.26, "learning_rate": 0.0001733568268321191, "loss": 2.3499, "step": 20592 }, { "epoch": 0.26, "learning_rate": 0.00017333658028910727, "loss": 2.3661, "step": 20600 }, { "epoch": 0.26, "learning_rate": 0.00017331632739379533, "loss": 2.3412, "step": 20608 }, { "epoch": 0.26, "learning_rate": 0.0001732960681482145, "loss": 2.3603, "step": 20616 }, { "epoch": 0.26, "learning_rate": 0.00017327580255439674, "loss": 2.3723, "step": 20624 }, { "epoch": 0.26, "learning_rate": 0.00017325553061437452, "loss": 2.3664, "step": 20632 }, { "epoch": 0.26, "learning_rate": 0.000173235252330181, "loss": 2.3541, "step": 20640 }, { "epoch": 0.26, "learning_rate": 0.00017321496770384995, "loss": 2.3506, "step": 20648 }, { "epoch": 0.26, "learning_rate": 0.00017319467673741586, "loss": 2.3671, "step": 20656 }, { "epoch": 0.26, "learning_rate": 0.00017317437943291378, "loss": 2.366, "step": 20664 }, { "epoch": 0.26, "learning_rate": 0.0001731540757923794, "loss": 2.3544, "step": 20672 }, { "epoch": 0.26, "learning_rate": 0.00017313376581784906, "loss": 2.3636, "step": 20680 }, { "epoch": 0.26, "learning_rate": 0.00017311344951135974, "loss": 2.3882, "step": 20688 }, { "epoch": 0.26, "learning_rate": 0.00017309312687494905, "loss": 2.3519, "step": 20696 }, { "epoch": 0.26, "learning_rate": 0.0001730727979106553, "loss": 2.3672, "step": 20704 }, { "epoch": 0.26, "learning_rate": 0.0001730524626205172, "loss": 2.3559, "step": 20712 }, { "epoch": 0.26, "learning_rate": 0.00017303212100657446, "loss": 2.3584, "step": 20720 }, { "epoch": 0.26, "learning_rate": 0.00017301177307086713, "loss": 2.3725, "step": 20728 }, { "epoch": 0.26, "learning_rate": 0.00017299141881543602, "loss": 2.3512, "step": 20736 }, { "epoch": 0.26, "learning_rate": 0.00017297105824232246, "loss": 2.3546, "step": 20744 }, { "epoch": 0.26, "learning_rate": 0.00017295069135356866, "loss": 2.3544, "step": 20752 }, { "epoch": 0.26, "learning_rate": 0.0001729303181512172, "loss": 2.3528, "step": 20760 }, { "epoch": 0.26, "learning_rate": 0.00017290993863731136, "loss": 2.3577, "step": 20768 }, { "epoch": 0.26, "learning_rate": 0.00017288955281389516, "loss": 2.358, "step": 20776 }, { "epoch": 0.26, "learning_rate": 0.00017286916068301317, "loss": 2.3479, "step": 20784 }, { "epoch": 0.26, "learning_rate": 0.00017284876224671062, "loss": 2.3588, "step": 20792 }, { "epoch": 0.26, "learning_rate": 0.00017282835750703332, "loss": 2.3663, "step": 20800 }, { "epoch": 0.26, "learning_rate": 0.00017280794646602776, "loss": 2.3518, "step": 20808 }, { "epoch": 0.26, "learning_rate": 0.0001727875291257411, "loss": 2.3629, "step": 20816 }, { "epoch": 0.26, "learning_rate": 0.000172767105488221, "loss": 2.3465, "step": 20824 }, { "epoch": 0.26, "learning_rate": 0.0001727466755555159, "loss": 2.3512, "step": 20832 }, { "epoch": 0.26, "learning_rate": 0.00017272623932967476, "loss": 2.3667, "step": 20840 }, { "epoch": 0.26, "learning_rate": 0.00017270579681274723, "loss": 2.3549, "step": 20848 }, { "epoch": 0.26, "learning_rate": 0.00017268534800678363, "loss": 2.3753, "step": 20856 }, { "epoch": 0.26, "learning_rate": 0.0001726648929138348, "loss": 2.3611, "step": 20864 }, { "epoch": 0.26, "learning_rate": 0.0001726444315359523, "loss": 2.3641, "step": 20872 }, { "epoch": 0.26, "learning_rate": 0.00017262396387518827, "loss": 2.3571, "step": 20880 }, { "epoch": 0.26, "learning_rate": 0.00017260348993359553, "loss": 2.3429, "step": 20888 }, { "epoch": 0.26, "learning_rate": 0.00017258300971322745, "loss": 2.3627, "step": 20896 }, { "epoch": 0.26, "learning_rate": 0.00017256252321613813, "loss": 2.3658, "step": 20904 }, { "epoch": 0.26, "learning_rate": 0.0001725420304443822, "loss": 2.3496, "step": 20912 }, { "epoch": 0.26, "learning_rate": 0.00017252153140001503, "loss": 2.367, "step": 20920 }, { "epoch": 0.26, "learning_rate": 0.0001725010260850925, "loss": 2.3561, "step": 20928 }, { "epoch": 0.26, "learning_rate": 0.00017248051450167128, "loss": 2.3691, "step": 20936 }, { "epoch": 0.26, "learning_rate": 0.00017245999665180842, "loss": 2.3788, "step": 20944 }, { "epoch": 0.26, "learning_rate": 0.00017243947253756182, "loss": 2.3731, "step": 20952 }, { "epoch": 0.26, "learning_rate": 0.00017241894216098996, "loss": 2.3693, "step": 20960 }, { "epoch": 0.26, "learning_rate": 0.00017239840552415184, "loss": 2.3532, "step": 20968 }, { "epoch": 0.26, "learning_rate": 0.00017237786262910726, "loss": 2.364, "step": 20976 }, { "epoch": 0.26, "learning_rate": 0.0001723573134779165, "loss": 2.344, "step": 20984 }, { "epoch": 0.26, "learning_rate": 0.00017233675807264048, "loss": 2.352, "step": 20992 }, { "epoch": 0.26, "learning_rate": 0.00017231619641534088, "loss": 2.3354, "step": 21000 }, { "epoch": 0.26, "learning_rate": 0.0001722956285080799, "loss": 2.3586, "step": 21008 }, { "epoch": 0.26, "learning_rate": 0.00017227505435292036, "loss": 2.3695, "step": 21016 }, { "epoch": 0.26, "learning_rate": 0.00017225447395192574, "loss": 2.3683, "step": 21024 }, { "epoch": 0.26, "learning_rate": 0.00017223388730716014, "loss": 2.3712, "step": 21032 }, { "epoch": 0.26, "learning_rate": 0.00017221329442068824, "loss": 2.3521, "step": 21040 }, { "epoch": 0.26, "learning_rate": 0.0001721926952945755, "loss": 2.3694, "step": 21048 }, { "epoch": 0.26, "learning_rate": 0.00017217208993088775, "loss": 2.3718, "step": 21056 }, { "epoch": 0.26, "learning_rate": 0.00017215147833169172, "loss": 2.359, "step": 21064 }, { "epoch": 0.26, "learning_rate": 0.00017213086049905455, "loss": 2.3636, "step": 21072 }, { "epoch": 0.26, "learning_rate": 0.00017211023643504413, "loss": 2.3312, "step": 21080 }, { "epoch": 0.26, "learning_rate": 0.00017208960614172893, "loss": 2.3831, "step": 21088 }, { "epoch": 0.26, "learning_rate": 0.0001720689696211781, "loss": 2.3657, "step": 21096 }, { "epoch": 0.26, "learning_rate": 0.00017204832687546127, "loss": 2.3433, "step": 21104 }, { "epoch": 0.26, "learning_rate": 0.00017202767790664884, "loss": 2.3646, "step": 21112 }, { "epoch": 0.26, "learning_rate": 0.00017200702271681178, "loss": 2.3587, "step": 21120 }, { "epoch": 0.26, "learning_rate": 0.00017198636130802173, "loss": 2.3693, "step": 21128 }, { "epoch": 0.26, "learning_rate": 0.00017196569368235084, "loss": 2.3746, "step": 21136 }, { "epoch": 0.26, "learning_rate": 0.00017194501984187202, "loss": 2.3536, "step": 21144 }, { "epoch": 0.26, "learning_rate": 0.0001719243397886587, "loss": 2.3687, "step": 21152 }, { "epoch": 0.26, "learning_rate": 0.00017190365352478496, "loss": 2.388, "step": 21160 }, { "epoch": 0.26, "learning_rate": 0.00017188296105232555, "loss": 2.3701, "step": 21168 }, { "epoch": 0.26, "learning_rate": 0.00017186226237335582, "loss": 2.3608, "step": 21176 }, { "epoch": 0.26, "learning_rate": 0.0001718415574899517, "loss": 2.3408, "step": 21184 }, { "epoch": 0.26, "learning_rate": 0.00017182084640418973, "loss": 2.3441, "step": 21192 }, { "epoch": 0.27, "learning_rate": 0.0001718001291181472, "loss": 2.3467, "step": 21200 }, { "epoch": 0.27, "learning_rate": 0.0001717794056339019, "loss": 2.3735, "step": 21208 }, { "epoch": 0.27, "learning_rate": 0.00017175867595353226, "loss": 2.3646, "step": 21216 }, { "epoch": 0.27, "learning_rate": 0.00017173794007911737, "loss": 2.3566, "step": 21224 }, { "epoch": 0.27, "learning_rate": 0.0001717171980127369, "loss": 2.3412, "step": 21232 }, { "epoch": 0.27, "learning_rate": 0.00017169644975647118, "loss": 2.368, "step": 21240 }, { "epoch": 0.27, "learning_rate": 0.0001716756953124012, "loss": 2.3452, "step": 21248 }, { "epoch": 0.27, "learning_rate": 0.0001716549346826084, "loss": 2.3668, "step": 21256 }, { "epoch": 0.27, "learning_rate": 0.000171634167869175, "loss": 2.3482, "step": 21264 }, { "epoch": 0.27, "learning_rate": 0.00017161339487418385, "loss": 2.3584, "step": 21272 }, { "epoch": 0.27, "learning_rate": 0.00017159261569971824, "loss": 2.3733, "step": 21280 }, { "epoch": 0.27, "learning_rate": 0.00017157183034786238, "loss": 2.3621, "step": 21288 }, { "epoch": 0.27, "learning_rate": 0.00017155103882070073, "loss": 2.3795, "step": 21296 }, { "epoch": 0.27, "learning_rate": 0.0001715302411203187, "loss": 2.3466, "step": 21304 }, { "epoch": 0.27, "learning_rate": 0.0001715094372488021, "loss": 2.3504, "step": 21312 }, { "epoch": 0.27, "learning_rate": 0.00017148862720823752, "loss": 2.36, "step": 21320 }, { "epoch": 0.27, "learning_rate": 0.000171467811000712, "loss": 2.359, "step": 21328 }, { "epoch": 0.27, "learning_rate": 0.00017144698862831337, "loss": 2.3521, "step": 21336 }, { "epoch": 0.27, "learning_rate": 0.00017142616009312996, "loss": 2.376, "step": 21344 }, { "epoch": 0.27, "learning_rate": 0.00017140532539725075, "loss": 2.3709, "step": 21352 }, { "epoch": 0.27, "learning_rate": 0.0001713844845427653, "loss": 2.3589, "step": 21360 }, { "epoch": 0.27, "learning_rate": 0.00017136363753176393, "loss": 2.3604, "step": 21368 }, { "epoch": 0.27, "learning_rate": 0.0001713427843663374, "loss": 2.3421, "step": 21376 }, { "epoch": 0.27, "learning_rate": 0.00017132192504857715, "loss": 2.3505, "step": 21384 }, { "epoch": 0.27, "learning_rate": 0.00017130105958057531, "loss": 2.368, "step": 21392 }, { "epoch": 0.27, "learning_rate": 0.00017128018796442457, "loss": 2.3544, "step": 21400 }, { "epoch": 0.27, "learning_rate": 0.00017125931020221818, "loss": 2.3421, "step": 21408 }, { "epoch": 0.27, "learning_rate": 0.00017123842629605013, "loss": 2.3609, "step": 21416 }, { "epoch": 0.27, "learning_rate": 0.0001712175362480149, "loss": 2.3649, "step": 21424 }, { "epoch": 0.27, "learning_rate": 0.00017119664006020764, "loss": 2.362, "step": 21432 }, { "epoch": 0.27, "learning_rate": 0.00017117573773472417, "loss": 2.361, "step": 21440 }, { "epoch": 0.27, "learning_rate": 0.00017115482927366083, "loss": 2.3711, "step": 21448 }, { "epoch": 0.27, "learning_rate": 0.00017113391467911464, "loss": 2.3486, "step": 21456 }, { "epoch": 0.27, "learning_rate": 0.0001711129939531832, "loss": 2.3584, "step": 21464 }, { "epoch": 0.27, "learning_rate": 0.00017109206709796477, "loss": 2.361, "step": 21472 }, { "epoch": 0.27, "learning_rate": 0.00017107113411555814, "loss": 2.3648, "step": 21480 }, { "epoch": 0.27, "learning_rate": 0.00017105019500806285, "loss": 2.3331, "step": 21488 }, { "epoch": 0.27, "learning_rate": 0.00017102924977757892, "loss": 2.3595, "step": 21496 }, { "epoch": 0.27, "learning_rate": 0.00017100829842620706, "loss": 2.3584, "step": 21504 }, { "epoch": 0.27, "learning_rate": 0.00017098734095604855, "loss": 2.3472, "step": 21512 }, { "epoch": 0.27, "learning_rate": 0.0001709663773692053, "loss": 2.3614, "step": 21520 }, { "epoch": 0.27, "learning_rate": 0.00017094540766777983, "loss": 2.3515, "step": 21528 }, { "epoch": 0.27, "learning_rate": 0.00017092443185387534, "loss": 2.3551, "step": 21536 }, { "epoch": 0.27, "learning_rate": 0.00017090344992959556, "loss": 2.3527, "step": 21544 }, { "epoch": 0.27, "learning_rate": 0.00017088246189704486, "loss": 2.3484, "step": 21552 }, { "epoch": 0.27, "learning_rate": 0.00017086146775832818, "loss": 2.3581, "step": 21560 }, { "epoch": 0.27, "learning_rate": 0.00017084046751555119, "loss": 2.3426, "step": 21568 }, { "epoch": 0.27, "learning_rate": 0.00017081946117082, "loss": 2.3368, "step": 21576 }, { "epoch": 0.27, "learning_rate": 0.0001707984487262415, "loss": 2.3484, "step": 21584 }, { "epoch": 0.27, "learning_rate": 0.0001707774301839231, "loss": 2.3585, "step": 21592 }, { "epoch": 0.27, "learning_rate": 0.0001707564055459728, "loss": 2.3544, "step": 21600 }, { "epoch": 0.27, "learning_rate": 0.0001707353748144993, "loss": 2.3731, "step": 21608 }, { "epoch": 0.27, "learning_rate": 0.0001707143379916119, "loss": 2.3689, "step": 21616 }, { "epoch": 0.27, "learning_rate": 0.00017069329507942034, "loss": 2.354, "step": 21624 }, { "epoch": 0.27, "learning_rate": 0.00017067224608003528, "loss": 2.3552, "step": 21632 }, { "epoch": 0.27, "learning_rate": 0.00017065119099556769, "loss": 2.3687, "step": 21640 }, { "epoch": 0.27, "learning_rate": 0.0001706301298281293, "loss": 2.3573, "step": 21648 }, { "epoch": 0.27, "learning_rate": 0.00017060906257983244, "loss": 2.3725, "step": 21656 }, { "epoch": 0.27, "learning_rate": 0.00017058798925279005, "loss": 2.3824, "step": 21664 }, { "epoch": 0.27, "learning_rate": 0.00017056690984911562, "loss": 2.369, "step": 21672 }, { "epoch": 0.27, "learning_rate": 0.00017054582437092336, "loss": 2.3629, "step": 21680 }, { "epoch": 0.27, "learning_rate": 0.00017052473282032796, "loss": 2.3764, "step": 21688 }, { "epoch": 0.27, "learning_rate": 0.00017050363519944482, "loss": 2.353, "step": 21696 }, { "epoch": 0.27, "learning_rate": 0.00017048253151038988, "loss": 2.3595, "step": 21704 }, { "epoch": 0.27, "learning_rate": 0.0001704614217552798, "loss": 2.3739, "step": 21712 }, { "epoch": 0.27, "learning_rate": 0.00017044030593623167, "loss": 2.3635, "step": 21720 }, { "epoch": 0.27, "learning_rate": 0.0001704191840553633, "loss": 2.3805, "step": 21728 }, { "epoch": 0.27, "learning_rate": 0.00017039805611479317, "loss": 2.3468, "step": 21736 }, { "epoch": 0.27, "learning_rate": 0.00017037692211664026, "loss": 2.3738, "step": 21744 }, { "epoch": 0.27, "learning_rate": 0.00017035578206302411, "loss": 2.3571, "step": 21752 }, { "epoch": 0.27, "learning_rate": 0.00017033463595606506, "loss": 2.3456, "step": 21760 }, { "epoch": 0.27, "learning_rate": 0.00017031348379788392, "loss": 2.3619, "step": 21768 }, { "epoch": 0.27, "learning_rate": 0.00017029232559060206, "loss": 2.3699, "step": 21776 }, { "epoch": 0.27, "learning_rate": 0.00017027116133634164, "loss": 2.3569, "step": 21784 }, { "epoch": 0.27, "learning_rate": 0.0001702499910372252, "loss": 2.3819, "step": 21792 }, { "epoch": 0.27, "learning_rate": 0.00017022881469537607, "loss": 2.3633, "step": 21800 }, { "epoch": 0.27, "learning_rate": 0.00017020763231291808, "loss": 2.3789, "step": 21808 }, { "epoch": 0.27, "learning_rate": 0.00017018644389197573, "loss": 2.3709, "step": 21816 }, { "epoch": 0.27, "learning_rate": 0.00017016524943467412, "loss": 2.3684, "step": 21824 }, { "epoch": 0.27, "learning_rate": 0.00017014404894313888, "loss": 2.3515, "step": 21832 }, { "epoch": 0.27, "learning_rate": 0.00017012284241949634, "loss": 2.3462, "step": 21840 }, { "epoch": 0.27, "learning_rate": 0.00017010162986587338, "loss": 2.3505, "step": 21848 }, { "epoch": 0.27, "learning_rate": 0.0001700804112843975, "loss": 2.3732, "step": 21856 }, { "epoch": 0.27, "learning_rate": 0.0001700591866771968, "loss": 2.3474, "step": 21864 }, { "epoch": 0.27, "learning_rate": 0.00017003795604639998, "loss": 2.3502, "step": 21872 }, { "epoch": 0.27, "learning_rate": 0.00017001671939413638, "loss": 2.369, "step": 21880 }, { "epoch": 0.27, "learning_rate": 0.0001699954767225359, "loss": 2.3612, "step": 21888 }, { "epoch": 0.27, "learning_rate": 0.00016997422803372903, "loss": 2.383, "step": 21896 }, { "epoch": 0.27, "learning_rate": 0.00016995297332984697, "loss": 2.361, "step": 21904 }, { "epoch": 0.27, "learning_rate": 0.00016993171261302134, "loss": 2.3653, "step": 21912 }, { "epoch": 0.27, "learning_rate": 0.00016991044588538453, "loss": 2.3646, "step": 21920 }, { "epoch": 0.27, "learning_rate": 0.00016988917314906952, "loss": 2.3656, "step": 21928 }, { "epoch": 0.27, "learning_rate": 0.00016986789440620977, "loss": 2.3614, "step": 21936 }, { "epoch": 0.27, "learning_rate": 0.00016984660965893943, "loss": 2.3484, "step": 21944 }, { "epoch": 0.27, "learning_rate": 0.00016982531890939327, "loss": 2.3467, "step": 21952 }, { "epoch": 0.27, "learning_rate": 0.0001698040221597066, "loss": 2.3713, "step": 21960 }, { "epoch": 0.27, "learning_rate": 0.00016978271941201536, "loss": 2.3651, "step": 21968 }, { "epoch": 0.27, "learning_rate": 0.00016976141066845613, "loss": 2.3661, "step": 21976 }, { "epoch": 0.27, "learning_rate": 0.00016974009593116604, "loss": 2.3643, "step": 21984 }, { "epoch": 0.27, "learning_rate": 0.00016971877520228284, "loss": 2.3611, "step": 21992 }, { "epoch": 0.28, "learning_rate": 0.00016969744848394484, "loss": 2.3636, "step": 22000 }, { "epoch": 0.28, "learning_rate": 0.00016967611577829104, "loss": 2.3562, "step": 22008 }, { "epoch": 0.28, "learning_rate": 0.000169654777087461, "loss": 2.3769, "step": 22016 }, { "epoch": 0.28, "learning_rate": 0.0001696334324135948, "loss": 2.3671, "step": 22024 }, { "epoch": 0.28, "learning_rate": 0.00016961208175883324, "loss": 2.3611, "step": 22032 }, { "epoch": 0.28, "learning_rate": 0.00016959072512531765, "loss": 2.3582, "step": 22040 }, { "epoch": 0.28, "learning_rate": 0.00016956936251519002, "loss": 2.3397, "step": 22048 }, { "epoch": 0.28, "learning_rate": 0.00016954799393059284, "loss": 2.3583, "step": 22056 }, { "epoch": 0.28, "learning_rate": 0.0001695266193736693, "loss": 2.3723, "step": 22064 }, { "epoch": 0.28, "learning_rate": 0.00016950523884656313, "loss": 2.3695, "step": 22072 }, { "epoch": 0.28, "learning_rate": 0.00016948385235141867, "loss": 2.3528, "step": 22080 }, { "epoch": 0.28, "learning_rate": 0.00016946245989038088, "loss": 2.365, "step": 22088 }, { "epoch": 0.28, "learning_rate": 0.0001694410614655953, "loss": 2.3471, "step": 22096 }, { "epoch": 0.28, "learning_rate": 0.00016941965707920807, "loss": 2.3646, "step": 22104 }, { "epoch": 0.28, "learning_rate": 0.00016939824673336596, "loss": 2.3495, "step": 22112 }, { "epoch": 0.28, "learning_rate": 0.0001693768304302162, "loss": 2.3508, "step": 22120 }, { "epoch": 0.28, "learning_rate": 0.00016935540817190686, "loss": 2.3792, "step": 22128 }, { "epoch": 0.28, "learning_rate": 0.00016933397996058634, "loss": 2.3712, "step": 22136 }, { "epoch": 0.28, "learning_rate": 0.0001693125457984039, "loss": 2.3504, "step": 22144 }, { "epoch": 0.28, "learning_rate": 0.00016929110568750913, "loss": 2.3512, "step": 22152 }, { "epoch": 0.28, "learning_rate": 0.0001692696596300525, "loss": 2.3535, "step": 22160 }, { "epoch": 0.28, "learning_rate": 0.0001692482076281848, "loss": 2.3641, "step": 22168 }, { "epoch": 0.28, "learning_rate": 0.00016922674968405759, "loss": 2.3936, "step": 22176 }, { "epoch": 0.28, "learning_rate": 0.000169205285799823, "loss": 2.3403, "step": 22184 }, { "epoch": 0.28, "learning_rate": 0.0001691838159776337, "loss": 2.3827, "step": 22192 }, { "epoch": 0.28, "learning_rate": 0.00016916234021964308, "loss": 2.3686, "step": 22200 }, { "epoch": 0.28, "learning_rate": 0.00016914085852800487, "loss": 2.3668, "step": 22208 }, { "epoch": 0.28, "learning_rate": 0.00016911937090487373, "loss": 2.3742, "step": 22216 }, { "epoch": 0.28, "learning_rate": 0.00016909787735240465, "loss": 2.351, "step": 22224 }, { "epoch": 0.28, "learning_rate": 0.00016907637787275334, "loss": 2.3903, "step": 22232 }, { "epoch": 0.28, "learning_rate": 0.00016905487246807608, "loss": 2.3518, "step": 22240 }, { "epoch": 0.28, "learning_rate": 0.00016903336114052975, "loss": 2.3531, "step": 22248 }, { "epoch": 0.28, "learning_rate": 0.0001690118438922718, "loss": 2.3678, "step": 22256 }, { "epoch": 0.28, "learning_rate": 0.00016899032072546023, "loss": 2.36, "step": 22264 }, { "epoch": 0.28, "learning_rate": 0.00016896879164225378, "loss": 2.3821, "step": 22272 }, { "epoch": 0.28, "learning_rate": 0.0001689472566448117, "loss": 2.374, "step": 22280 }, { "epoch": 0.28, "learning_rate": 0.00016892571573529379, "loss": 2.3602, "step": 22288 }, { "epoch": 0.28, "learning_rate": 0.00016890416891586043, "loss": 2.3696, "step": 22296 }, { "epoch": 0.28, "learning_rate": 0.0001688826161886727, "loss": 2.3799, "step": 22304 }, { "epoch": 0.28, "learning_rate": 0.00016886105755589226, "loss": 2.3509, "step": 22312 }, { "epoch": 0.28, "learning_rate": 0.00016883949301968126, "loss": 2.3687, "step": 22320 }, { "epoch": 0.28, "learning_rate": 0.00016881792258220248, "loss": 2.3816, "step": 22328 }, { "epoch": 0.28, "learning_rate": 0.0001687963462456194, "loss": 2.3513, "step": 22336 }, { "epoch": 0.28, "learning_rate": 0.00016877476401209592, "loss": 2.3722, "step": 22344 }, { "epoch": 0.28, "learning_rate": 0.00016875317588379662, "loss": 2.3862, "step": 22352 }, { "epoch": 0.28, "learning_rate": 0.00016873158186288674, "loss": 2.3885, "step": 22360 }, { "epoch": 0.28, "learning_rate": 0.00016870998195153195, "loss": 2.3662, "step": 22368 }, { "epoch": 0.28, "learning_rate": 0.00016868837615189865, "loss": 2.3477, "step": 22376 }, { "epoch": 0.28, "learning_rate": 0.0001686667644661538, "loss": 2.3491, "step": 22384 }, { "epoch": 0.28, "learning_rate": 0.00016864514689646486, "loss": 2.3741, "step": 22392 }, { "epoch": 0.28, "learning_rate": 0.000168623523445, "loss": 2.3728, "step": 22400 }, { "epoch": 0.28, "learning_rate": 0.00016860189411392794, "loss": 2.3623, "step": 22408 }, { "epoch": 0.28, "learning_rate": 0.0001685802589054179, "loss": 2.3462, "step": 22416 }, { "epoch": 0.28, "learning_rate": 0.0001685586178216399, "loss": 2.3754, "step": 22424 }, { "epoch": 0.28, "learning_rate": 0.0001685369708647643, "loss": 2.3521, "step": 22432 }, { "epoch": 0.28, "learning_rate": 0.00016851531803696224, "loss": 2.3654, "step": 22440 }, { "epoch": 0.28, "learning_rate": 0.0001684936593404053, "loss": 2.3576, "step": 22448 }, { "epoch": 0.28, "learning_rate": 0.0001684719947772658, "loss": 2.3722, "step": 22456 }, { "epoch": 0.28, "learning_rate": 0.00016845032434971655, "loss": 2.3473, "step": 22464 }, { "epoch": 0.28, "learning_rate": 0.00016842864805993095, "loss": 2.361, "step": 22472 }, { "epoch": 0.28, "learning_rate": 0.00016840696591008302, "loss": 2.3534, "step": 22480 }, { "epoch": 0.28, "learning_rate": 0.00016838527790234738, "loss": 2.3708, "step": 22488 }, { "epoch": 0.28, "learning_rate": 0.00016836358403889918, "loss": 2.3316, "step": 22496 }, { "epoch": 0.28, "learning_rate": 0.00016834188432191422, "loss": 2.3883, "step": 22504 }, { "epoch": 0.28, "learning_rate": 0.00016832017875356885, "loss": 2.3649, "step": 22512 }, { "epoch": 0.28, "learning_rate": 0.00016829846733604, "loss": 2.3415, "step": 22520 }, { "epoch": 0.28, "learning_rate": 0.0001682767500715052, "loss": 2.3627, "step": 22528 }, { "epoch": 0.28, "learning_rate": 0.0001682550269621426, "loss": 2.3526, "step": 22536 }, { "epoch": 0.28, "learning_rate": 0.0001682332980101309, "loss": 2.3444, "step": 22544 }, { "epoch": 0.28, "learning_rate": 0.0001682115632176494, "loss": 2.3688, "step": 22552 }, { "epoch": 0.28, "learning_rate": 0.0001681898225868779, "loss": 2.356, "step": 22560 }, { "epoch": 0.28, "learning_rate": 0.0001681680761199969, "loss": 2.3715, "step": 22568 }, { "epoch": 0.28, "learning_rate": 0.00016814632381918751, "loss": 2.3462, "step": 22576 }, { "epoch": 0.28, "learning_rate": 0.00016812456568663132, "loss": 2.3519, "step": 22584 }, { "epoch": 0.28, "learning_rate": 0.0001681028017245105, "loss": 2.383, "step": 22592 }, { "epoch": 0.28, "learning_rate": 0.00016808103193500793, "loss": 2.3523, "step": 22600 }, { "epoch": 0.28, "learning_rate": 0.00016805925632030696, "loss": 2.3505, "step": 22608 }, { "epoch": 0.28, "learning_rate": 0.00016803747488259156, "loss": 2.3571, "step": 22616 }, { "epoch": 0.28, "learning_rate": 0.00016801568762404628, "loss": 2.366, "step": 22624 }, { "epoch": 0.28, "learning_rate": 0.00016799389454685626, "loss": 2.3635, "step": 22632 }, { "epoch": 0.28, "learning_rate": 0.00016797209565320726, "loss": 2.3707, "step": 22640 }, { "epoch": 0.28, "learning_rate": 0.00016795029094528554, "loss": 2.3546, "step": 22648 }, { "epoch": 0.28, "learning_rate": 0.00016792848042527798, "loss": 2.3388, "step": 22656 }, { "epoch": 0.28, "learning_rate": 0.0001679066640953721, "loss": 2.3613, "step": 22664 }, { "epoch": 0.28, "learning_rate": 0.0001678848419577559, "loss": 2.3609, "step": 22672 }, { "epoch": 0.28, "learning_rate": 0.00016786301401461805, "loss": 2.3542, "step": 22680 }, { "epoch": 0.28, "learning_rate": 0.0001678411802681478, "loss": 2.3655, "step": 22688 }, { "epoch": 0.28, "learning_rate": 0.0001678193407205349, "loss": 2.3626, "step": 22696 }, { "epoch": 0.28, "learning_rate": 0.00016779749537396973, "loss": 2.3452, "step": 22704 }, { "epoch": 0.28, "learning_rate": 0.00016777564423064328, "loss": 2.3502, "step": 22712 }, { "epoch": 0.28, "learning_rate": 0.00016775378729274709, "loss": 2.3817, "step": 22720 }, { "epoch": 0.28, "learning_rate": 0.0001677319245624733, "loss": 2.361, "step": 22728 }, { "epoch": 0.28, "learning_rate": 0.00016771005604201462, "loss": 2.351, "step": 22736 }, { "epoch": 0.28, "learning_rate": 0.00016768818173356427, "loss": 2.3419, "step": 22744 }, { "epoch": 0.28, "learning_rate": 0.00016766630163931622, "loss": 2.3564, "step": 22752 }, { "epoch": 0.28, "learning_rate": 0.0001676444157614648, "loss": 2.3648, "step": 22760 }, { "epoch": 0.28, "learning_rate": 0.00016762252410220519, "loss": 2.3581, "step": 22768 }, { "epoch": 0.28, "learning_rate": 0.00016760062666373288, "loss": 2.347, "step": 22776 }, { "epoch": 0.28, "learning_rate": 0.00016757872344824411, "loss": 2.3686, "step": 22784 }, { "epoch": 0.28, "learning_rate": 0.00016755681445793563, "loss": 2.3588, "step": 22792 }, { "epoch": 0.28, "learning_rate": 0.0001675348996950048, "loss": 2.3629, "step": 22800 }, { "epoch": 0.29, "learning_rate": 0.00016751297916164953, "loss": 2.3817, "step": 22808 }, { "epoch": 0.29, "learning_rate": 0.00016749105286006835, "loss": 2.3339, "step": 22816 }, { "epoch": 0.29, "learning_rate": 0.00016746912079246032, "loss": 2.3611, "step": 22824 }, { "epoch": 0.29, "learning_rate": 0.00016744718296102514, "loss": 2.3589, "step": 22832 }, { "epoch": 0.29, "learning_rate": 0.00016742523936796297, "loss": 2.3602, "step": 22840 }, { "epoch": 0.29, "learning_rate": 0.0001674032900154747, "loss": 2.3483, "step": 22848 }, { "epoch": 0.29, "learning_rate": 0.00016738133490576176, "loss": 2.3679, "step": 22856 }, { "epoch": 0.29, "learning_rate": 0.00016735937404102605, "loss": 2.3581, "step": 22864 }, { "epoch": 0.29, "learning_rate": 0.0001673374074234701, "loss": 2.3889, "step": 22872 }, { "epoch": 0.29, "learning_rate": 0.00016731543505529707, "loss": 2.3844, "step": 22880 }, { "epoch": 0.29, "learning_rate": 0.0001672934569387107, "loss": 2.3568, "step": 22888 }, { "epoch": 0.29, "learning_rate": 0.00016727147307591523, "loss": 2.3638, "step": 22896 }, { "epoch": 0.29, "learning_rate": 0.00016724948346911553, "loss": 2.354, "step": 22904 }, { "epoch": 0.29, "learning_rate": 0.00016722748812051706, "loss": 2.3641, "step": 22912 }, { "epoch": 0.29, "learning_rate": 0.00016720548703232576, "loss": 2.3637, "step": 22920 }, { "epoch": 0.29, "learning_rate": 0.0001671834802067483, "loss": 2.3566, "step": 22928 }, { "epoch": 0.29, "learning_rate": 0.00016716146764599174, "loss": 2.3524, "step": 22936 }, { "epoch": 0.29, "learning_rate": 0.0001671394493522639, "loss": 2.332, "step": 22944 }, { "epoch": 0.29, "learning_rate": 0.00016711742532777308, "loss": 2.3691, "step": 22952 }, { "epoch": 0.29, "learning_rate": 0.0001670953955747281, "loss": 2.3513, "step": 22960 }, { "epoch": 0.29, "learning_rate": 0.00016707336009533848, "loss": 2.3489, "step": 22968 }, { "epoch": 0.29, "learning_rate": 0.00016705131889181425, "loss": 2.362, "step": 22976 }, { "epoch": 0.29, "learning_rate": 0.000167029271966366, "loss": 2.3763, "step": 22984 }, { "epoch": 0.29, "learning_rate": 0.00016700721932120494, "loss": 2.3639, "step": 22992 }, { "epoch": 0.29, "learning_rate": 0.00016698516095854275, "loss": 2.3535, "step": 23000 }, { "epoch": 0.29, "learning_rate": 0.00016696309688059185, "loss": 2.364, "step": 23008 }, { "epoch": 0.29, "learning_rate": 0.0001669410270895651, "loss": 2.3434, "step": 23016 }, { "epoch": 0.29, "learning_rate": 0.00016691895158767596, "loss": 2.3584, "step": 23024 }, { "epoch": 0.29, "learning_rate": 0.00016689687037713854, "loss": 2.3772, "step": 23032 }, { "epoch": 0.29, "learning_rate": 0.0001668747834601674, "loss": 2.3541, "step": 23040 }, { "epoch": 0.29, "learning_rate": 0.0001668526908389777, "loss": 2.3568, "step": 23048 }, { "epoch": 0.29, "learning_rate": 0.00016683059251578527, "loss": 2.3415, "step": 23056 }, { "epoch": 0.29, "learning_rate": 0.0001668084884928065, "loss": 2.3583, "step": 23064 }, { "epoch": 0.29, "learning_rate": 0.00016678637877225815, "loss": 2.3558, "step": 23072 }, { "epoch": 0.29, "learning_rate": 0.00016676426335635782, "loss": 2.3473, "step": 23080 }, { "epoch": 0.29, "learning_rate": 0.0001667421422473235, "loss": 2.3499, "step": 23088 }, { "epoch": 0.29, "learning_rate": 0.00016672001544737382, "loss": 2.3647, "step": 23096 }, { "epoch": 0.29, "learning_rate": 0.00016669788295872804, "loss": 2.3281, "step": 23104 }, { "epoch": 0.29, "learning_rate": 0.0001666757447836058, "loss": 2.361, "step": 23112 }, { "epoch": 0.29, "learning_rate": 0.00016665360092422754, "loss": 2.3783, "step": 23120 }, { "epoch": 0.29, "learning_rate": 0.0001666314513828141, "loss": 2.3494, "step": 23128 }, { "epoch": 0.29, "learning_rate": 0.00016660929616158703, "loss": 2.3425, "step": 23136 }, { "epoch": 0.29, "learning_rate": 0.00016658713526276827, "loss": 2.353, "step": 23144 }, { "epoch": 0.29, "learning_rate": 0.00016656496868858048, "loss": 2.3706, "step": 23152 }, { "epoch": 0.29, "learning_rate": 0.00016654279644124688, "loss": 2.3552, "step": 23160 }, { "epoch": 0.29, "learning_rate": 0.00016652061852299118, "loss": 2.3691, "step": 23168 }, { "epoch": 0.29, "learning_rate": 0.00016649843493603766, "loss": 2.3605, "step": 23176 }, { "epoch": 0.29, "learning_rate": 0.0001664762456826113, "loss": 2.3614, "step": 23184 }, { "epoch": 0.29, "learning_rate": 0.0001664540507649375, "loss": 2.3548, "step": 23192 }, { "epoch": 0.29, "learning_rate": 0.00016643185018524228, "loss": 2.3568, "step": 23200 }, { "epoch": 0.29, "learning_rate": 0.00016640964394575226, "loss": 2.3591, "step": 23208 }, { "epoch": 0.29, "learning_rate": 0.0001663874320486946, "loss": 2.3771, "step": 23216 }, { "epoch": 0.29, "learning_rate": 0.000166365214496297, "loss": 2.3362, "step": 23224 }, { "epoch": 0.29, "learning_rate": 0.00016634299129078775, "loss": 2.3573, "step": 23232 }, { "epoch": 0.29, "learning_rate": 0.00016632076243439575, "loss": 2.3491, "step": 23240 }, { "epoch": 0.29, "learning_rate": 0.0001662985279293504, "loss": 2.3791, "step": 23248 }, { "epoch": 0.29, "learning_rate": 0.00016627628777788174, "loss": 2.3497, "step": 23256 }, { "epoch": 0.29, "learning_rate": 0.00016625404198222026, "loss": 2.3791, "step": 23264 }, { "epoch": 0.29, "learning_rate": 0.00016623179054459715, "loss": 2.3517, "step": 23272 }, { "epoch": 0.29, "learning_rate": 0.00016620953346724405, "loss": 2.37, "step": 23280 }, { "epoch": 0.29, "learning_rate": 0.00016618727075239323, "loss": 2.3703, "step": 23288 }, { "epoch": 0.29, "learning_rate": 0.00016616500240227756, "loss": 2.3514, "step": 23296 }, { "epoch": 0.29, "learning_rate": 0.0001661427284191304, "loss": 2.3604, "step": 23304 }, { "epoch": 0.29, "learning_rate": 0.00016612044880518566, "loss": 2.3929, "step": 23312 }, { "epoch": 0.29, "learning_rate": 0.00016609816356267794, "loss": 2.3677, "step": 23320 }, { "epoch": 0.29, "learning_rate": 0.00016607587269384225, "loss": 2.3498, "step": 23328 }, { "epoch": 0.29, "learning_rate": 0.0001660535762009143, "loss": 2.3682, "step": 23336 }, { "epoch": 0.29, "learning_rate": 0.00016603127408613025, "loss": 2.3444, "step": 23344 }, { "epoch": 0.29, "learning_rate": 0.00016600896635172692, "loss": 2.3704, "step": 23352 }, { "epoch": 0.29, "learning_rate": 0.00016598665299994166, "loss": 2.3707, "step": 23360 }, { "epoch": 0.29, "learning_rate": 0.0001659643340330123, "loss": 2.3491, "step": 23368 }, { "epoch": 0.29, "learning_rate": 0.00016594200945317734, "loss": 2.3676, "step": 23376 }, { "epoch": 0.29, "learning_rate": 0.00016591967926267583, "loss": 2.3657, "step": 23384 }, { "epoch": 0.29, "learning_rate": 0.00016589734346374738, "loss": 2.3764, "step": 23392 }, { "epoch": 0.29, "learning_rate": 0.00016587500205863208, "loss": 2.3708, "step": 23400 }, { "epoch": 0.29, "learning_rate": 0.00016585265504957065, "loss": 2.3501, "step": 23408 }, { "epoch": 0.29, "learning_rate": 0.00016583030243880447, "loss": 2.3565, "step": 23416 }, { "epoch": 0.29, "learning_rate": 0.00016580794422857523, "loss": 2.3661, "step": 23424 }, { "epoch": 0.29, "learning_rate": 0.00016578558042112547, "loss": 2.3465, "step": 23432 }, { "epoch": 0.29, "learning_rate": 0.00016576321101869807, "loss": 2.3455, "step": 23440 }, { "epoch": 0.29, "learning_rate": 0.00016574083602353658, "loss": 2.3842, "step": 23448 }, { "epoch": 0.29, "learning_rate": 0.00016571845543788508, "loss": 2.3526, "step": 23456 }, { "epoch": 0.29, "learning_rate": 0.0001656960692639882, "loss": 2.3627, "step": 23464 }, { "epoch": 0.29, "learning_rate": 0.00016567367750409118, "loss": 2.3439, "step": 23472 }, { "epoch": 0.29, "learning_rate": 0.00016565128016043975, "loss": 2.3557, "step": 23480 }, { "epoch": 0.29, "learning_rate": 0.00016562887723528031, "loss": 2.3578, "step": 23488 }, { "epoch": 0.29, "learning_rate": 0.00016560646873085965, "loss": 2.3724, "step": 23496 }, { "epoch": 0.29, "learning_rate": 0.00016558405464942526, "loss": 2.3647, "step": 23504 }, { "epoch": 0.29, "learning_rate": 0.00016556163499322518, "loss": 2.3543, "step": 23512 }, { "epoch": 0.29, "learning_rate": 0.00016553920976450793, "loss": 2.379, "step": 23520 }, { "epoch": 0.29, "learning_rate": 0.0001655167789655226, "loss": 2.3753, "step": 23528 }, { "epoch": 0.29, "learning_rate": 0.00016549434259851894, "loss": 2.3593, "step": 23536 }, { "epoch": 0.29, "learning_rate": 0.00016547190066574719, "loss": 2.3729, "step": 23544 }, { "epoch": 0.29, "learning_rate": 0.0001654494531694581, "loss": 2.3434, "step": 23552 }, { "epoch": 0.29, "learning_rate": 0.00016542700011190305, "loss": 2.3788, "step": 23560 }, { "epoch": 0.29, "learning_rate": 0.00016540454149533394, "loss": 2.3377, "step": 23568 }, { "epoch": 0.29, "learning_rate": 0.00016538207732200332, "loss": 2.3639, "step": 23576 }, { "epoch": 0.29, "learning_rate": 0.0001653596075941641, "loss": 2.3649, "step": 23584 }, { "epoch": 0.29, "learning_rate": 0.00016533713231406993, "loss": 2.3611, "step": 23592 }, { "epoch": 0.29, "learning_rate": 0.00016531465148397496, "loss": 2.3517, "step": 23600 }, { "epoch": 0.3, "learning_rate": 0.00016529216510613386, "loss": 2.3647, "step": 23608 }, { "epoch": 0.3, "learning_rate": 0.0001652696731828019, "loss": 2.369, "step": 23616 }, { "epoch": 0.3, "learning_rate": 0.00016524717571623492, "loss": 2.3559, "step": 23624 }, { "epoch": 0.3, "learning_rate": 0.00016522467270868924, "loss": 2.3478, "step": 23632 }, { "epoch": 0.3, "learning_rate": 0.00016520216416242184, "loss": 2.3569, "step": 23640 }, { "epoch": 0.3, "learning_rate": 0.00016517965007969014, "loss": 2.362, "step": 23648 }, { "epoch": 0.3, "learning_rate": 0.00016515713046275223, "loss": 2.339, "step": 23656 }, { "epoch": 0.3, "learning_rate": 0.00016513460531386665, "loss": 2.349, "step": 23664 }, { "epoch": 0.3, "learning_rate": 0.00016511207463529255, "loss": 2.3451, "step": 23672 }, { "epoch": 0.3, "learning_rate": 0.00016508953842928967, "loss": 2.3501, "step": 23680 }, { "epoch": 0.3, "learning_rate": 0.00016506699669811823, "loss": 2.3709, "step": 23688 }, { "epoch": 0.3, "learning_rate": 0.00016504444944403905, "loss": 2.3678, "step": 23696 }, { "epoch": 0.3, "learning_rate": 0.0001650218966693135, "loss": 2.3429, "step": 23704 }, { "epoch": 0.3, "learning_rate": 0.00016499933837620348, "loss": 2.3644, "step": 23712 }, { "epoch": 0.3, "learning_rate": 0.00016497677456697144, "loss": 2.3346, "step": 23720 }, { "epoch": 0.3, "learning_rate": 0.00016495420524388046, "loss": 2.3665, "step": 23728 }, { "epoch": 0.3, "learning_rate": 0.00016493163040919405, "loss": 2.354, "step": 23736 }, { "epoch": 0.3, "learning_rate": 0.00016490905006517643, "loss": 2.3642, "step": 23744 }, { "epoch": 0.3, "learning_rate": 0.00016488646421409215, "loss": 2.3749, "step": 23752 }, { "epoch": 0.3, "learning_rate": 0.00016486387285820654, "loss": 2.3801, "step": 23760 }, { "epoch": 0.3, "learning_rate": 0.00016484127599978535, "loss": 2.34, "step": 23768 }, { "epoch": 0.3, "learning_rate": 0.00016481867364109495, "loss": 2.3519, "step": 23776 }, { "epoch": 0.3, "learning_rate": 0.00016479606578440222, "loss": 2.3702, "step": 23784 }, { "epoch": 0.3, "learning_rate": 0.00016477345243197454, "loss": 2.3706, "step": 23792 }, { "epoch": 0.3, "learning_rate": 0.00016475083358607996, "loss": 2.3361, "step": 23800 }, { "epoch": 0.3, "learning_rate": 0.000164728209248987, "loss": 2.3657, "step": 23808 }, { "epoch": 0.3, "learning_rate": 0.00016470557942296476, "loss": 2.357, "step": 23816 }, { "epoch": 0.3, "learning_rate": 0.00016468294411028288, "loss": 2.3648, "step": 23824 }, { "epoch": 0.3, "learning_rate": 0.00016466030331321156, "loss": 2.3444, "step": 23832 }, { "epoch": 0.3, "learning_rate": 0.00016463765703402154, "loss": 2.3488, "step": 23840 }, { "epoch": 0.3, "learning_rate": 0.00016461500527498415, "loss": 2.3555, "step": 23848 }, { "epoch": 0.3, "learning_rate": 0.00016459234803837113, "loss": 2.3417, "step": 23856 }, { "epoch": 0.3, "learning_rate": 0.00016456968532645497, "loss": 2.3533, "step": 23864 }, { "epoch": 0.3, "learning_rate": 0.00016454701714150859, "loss": 2.3653, "step": 23872 }, { "epoch": 0.3, "learning_rate": 0.0001645243434858055, "loss": 2.3464, "step": 23880 }, { "epoch": 0.3, "learning_rate": 0.00016450166436161968, "loss": 2.3649, "step": 23888 }, { "epoch": 0.3, "learning_rate": 0.0001644789797712257, "loss": 2.3424, "step": 23896 }, { "epoch": 0.3, "learning_rate": 0.0001644562897168988, "loss": 2.3538, "step": 23904 }, { "epoch": 0.3, "learning_rate": 0.00016443359420091456, "loss": 2.3689, "step": 23912 }, { "epoch": 0.3, "learning_rate": 0.0001644108932255493, "loss": 2.3539, "step": 23920 }, { "epoch": 0.3, "learning_rate": 0.00016438818679307977, "loss": 2.357, "step": 23928 }, { "epoch": 0.3, "learning_rate": 0.00016436547490578327, "loss": 2.3491, "step": 23936 }, { "epoch": 0.3, "learning_rate": 0.00016434275756593768, "loss": 2.378, "step": 23944 }, { "epoch": 0.3, "learning_rate": 0.00016432003477582144, "loss": 2.359, "step": 23952 }, { "epoch": 0.3, "learning_rate": 0.0001642973065377135, "loss": 2.365, "step": 23960 }, { "epoch": 0.3, "learning_rate": 0.00016427457285389337, "loss": 2.3656, "step": 23968 }, { "epoch": 0.3, "learning_rate": 0.00016425183372664113, "loss": 2.3732, "step": 23976 }, { "epoch": 0.3, "learning_rate": 0.00016422908915823738, "loss": 2.3437, "step": 23984 }, { "epoch": 0.3, "learning_rate": 0.00016420633915096327, "loss": 2.3592, "step": 23992 }, { "epoch": 0.3, "learning_rate": 0.0001641835837071005, "loss": 2.3625, "step": 24000 }, { "epoch": 0.3, "learning_rate": 0.0001641608228289313, "loss": 2.3549, "step": 24008 }, { "epoch": 0.3, "learning_rate": 0.00016413805651873843, "loss": 2.3686, "step": 24016 }, { "epoch": 0.3, "learning_rate": 0.00016411528477880527, "loss": 2.3392, "step": 24024 }, { "epoch": 0.3, "learning_rate": 0.00016409250761141567, "loss": 2.3443, "step": 24032 }, { "epoch": 0.3, "learning_rate": 0.0001640697250188541, "loss": 2.3353, "step": 24040 }, { "epoch": 0.3, "learning_rate": 0.00016404693700340544, "loss": 2.353, "step": 24048 }, { "epoch": 0.3, "learning_rate": 0.0001640241435673553, "loss": 2.3483, "step": 24056 }, { "epoch": 0.3, "learning_rate": 0.00016400134471298964, "loss": 2.3602, "step": 24064 }, { "epoch": 0.3, "learning_rate": 0.00016397854044259512, "loss": 2.3606, "step": 24072 }, { "epoch": 0.3, "learning_rate": 0.00016395573075845882, "loss": 2.3673, "step": 24080 }, { "epoch": 0.3, "learning_rate": 0.00016393291566286846, "loss": 2.3277, "step": 24088 }, { "epoch": 0.3, "learning_rate": 0.0001639100951581123, "loss": 2.3626, "step": 24096 }, { "epoch": 0.3, "learning_rate": 0.00016388726924647905, "loss": 2.3611, "step": 24104 }, { "epoch": 0.3, "learning_rate": 0.000163864437930258, "loss": 2.3727, "step": 24112 }, { "epoch": 0.3, "learning_rate": 0.00016384160121173905, "loss": 2.3576, "step": 24120 }, { "epoch": 0.3, "learning_rate": 0.0001638187590932126, "loss": 2.3507, "step": 24128 }, { "epoch": 0.3, "learning_rate": 0.00016379591157696956, "loss": 2.3467, "step": 24136 }, { "epoch": 0.3, "learning_rate": 0.0001637730586653014, "loss": 2.3667, "step": 24144 }, { "epoch": 0.3, "learning_rate": 0.0001637502003605002, "loss": 2.3465, "step": 24152 }, { "epoch": 0.3, "learning_rate": 0.0001637273366648584, "loss": 2.3501, "step": 24160 }, { "epoch": 0.3, "learning_rate": 0.00016370446758066923, "loss": 2.3741, "step": 24168 }, { "epoch": 0.3, "learning_rate": 0.0001636815931102262, "loss": 2.3718, "step": 24176 }, { "epoch": 0.3, "learning_rate": 0.00016365871325582364, "loss": 2.3344, "step": 24184 }, { "epoch": 0.3, "learning_rate": 0.00016363582801975614, "loss": 2.363, "step": 24192 }, { "epoch": 0.3, "learning_rate": 0.00016361293740431904, "loss": 2.3628, "step": 24200 }, { "epoch": 0.3, "learning_rate": 0.00016359004141180803, "loss": 2.3312, "step": 24208 }, { "epoch": 0.3, "learning_rate": 0.00016356714004451962, "loss": 2.3715, "step": 24216 }, { "epoch": 0.3, "learning_rate": 0.0001635442333047505, "loss": 2.347, "step": 24224 }, { "epoch": 0.3, "learning_rate": 0.00016352132119479827, "loss": 2.3299, "step": 24232 }, { "epoch": 0.3, "learning_rate": 0.0001634984037169607, "loss": 2.3644, "step": 24240 }, { "epoch": 0.3, "learning_rate": 0.00016347548087353644, "loss": 2.3767, "step": 24248 }, { "epoch": 0.3, "learning_rate": 0.00016345255266682443, "loss": 2.3614, "step": 24256 }, { "epoch": 0.3, "learning_rate": 0.0001634296190991243, "loss": 2.3426, "step": 24264 }, { "epoch": 0.3, "learning_rate": 0.00016340668017273611, "loss": 2.3465, "step": 24272 }, { "epoch": 0.3, "learning_rate": 0.00016338373588996048, "loss": 2.3713, "step": 24280 }, { "epoch": 0.3, "learning_rate": 0.00016336078625309866, "loss": 2.342, "step": 24288 }, { "epoch": 0.3, "learning_rate": 0.00016333783126445232, "loss": 2.3604, "step": 24296 }, { "epoch": 0.3, "learning_rate": 0.00016331487092632375, "loss": 2.3597, "step": 24304 }, { "epoch": 0.3, "learning_rate": 0.00016329190524101573, "loss": 2.3383, "step": 24312 }, { "epoch": 0.3, "learning_rate": 0.00016326893421083155, "loss": 2.3325, "step": 24320 }, { "epoch": 0.3, "learning_rate": 0.00016324595783807517, "loss": 2.3749, "step": 24328 }, { "epoch": 0.3, "learning_rate": 0.00016322297612505086, "loss": 2.3572, "step": 24336 }, { "epoch": 0.3, "learning_rate": 0.00016319998907406367, "loss": 2.3476, "step": 24344 }, { "epoch": 0.3, "learning_rate": 0.00016317699668741897, "loss": 2.3465, "step": 24352 }, { "epoch": 0.3, "learning_rate": 0.0001631539989674229, "loss": 2.3665, "step": 24360 }, { "epoch": 0.3, "learning_rate": 0.00016313099591638185, "loss": 2.3642, "step": 24368 }, { "epoch": 0.3, "learning_rate": 0.00016310798753660296, "loss": 2.3656, "step": 24376 }, { "epoch": 0.3, "learning_rate": 0.0001630849738303939, "loss": 2.3449, "step": 24384 }, { "epoch": 0.3, "learning_rate": 0.00016306195480006273, "loss": 2.3582, "step": 24392 }, { "epoch": 0.3, "learning_rate": 0.00016303893044791818, "loss": 2.3552, "step": 24400 }, { "epoch": 0.31, "learning_rate": 0.00016301590077626944, "loss": 2.3693, "step": 24408 }, { "epoch": 0.31, "learning_rate": 0.00016299286578742622, "loss": 2.3662, "step": 24416 }, { "epoch": 0.31, "learning_rate": 0.00016296982548369887, "loss": 2.3623, "step": 24424 }, { "epoch": 0.31, "learning_rate": 0.00016294677986739817, "loss": 2.3417, "step": 24432 }, { "epoch": 0.31, "learning_rate": 0.00016292372894083544, "loss": 2.3441, "step": 24440 }, { "epoch": 0.31, "learning_rate": 0.00016290067270632261, "loss": 2.3478, "step": 24448 }, { "epoch": 0.31, "learning_rate": 0.00016287761116617203, "loss": 2.3561, "step": 24456 }, { "epoch": 0.31, "learning_rate": 0.00016285454432269665, "loss": 2.3321, "step": 24464 }, { "epoch": 0.31, "learning_rate": 0.00016283147217821, "loss": 2.3695, "step": 24472 }, { "epoch": 0.31, "learning_rate": 0.00016280839473502607, "loss": 2.3564, "step": 24480 }, { "epoch": 0.31, "learning_rate": 0.00016278531199545937, "loss": 2.3608, "step": 24488 }, { "epoch": 0.31, "learning_rate": 0.00016276222396182494, "loss": 2.343, "step": 24496 }, { "epoch": 0.31, "learning_rate": 0.00016273913063643842, "loss": 2.3622, "step": 24504 }, { "epoch": 0.31, "learning_rate": 0.00016271603202161597, "loss": 2.3573, "step": 24512 }, { "epoch": 0.31, "learning_rate": 0.00016269292811967417, "loss": 2.3377, "step": 24520 }, { "epoch": 0.31, "learning_rate": 0.00016266981893293028, "loss": 2.3627, "step": 24528 }, { "epoch": 0.31, "learning_rate": 0.000162646704463702, "loss": 2.3667, "step": 24536 }, { "epoch": 0.31, "learning_rate": 0.00016262358471430758, "loss": 2.3495, "step": 24544 }, { "epoch": 0.31, "learning_rate": 0.00016260045968706572, "loss": 2.3558, "step": 24552 }, { "epoch": 0.31, "learning_rate": 0.0001625773293842959, "loss": 2.3618, "step": 24560 }, { "epoch": 0.31, "learning_rate": 0.0001625541938083178, "loss": 2.3511, "step": 24568 }, { "epoch": 0.31, "learning_rate": 0.00016253105296145187, "loss": 2.3406, "step": 24576 }, { "epoch": 0.31, "learning_rate": 0.000162507906846019, "loss": 2.3462, "step": 24584 }, { "epoch": 0.31, "learning_rate": 0.0001624847554643406, "loss": 2.3325, "step": 24592 }, { "epoch": 0.31, "learning_rate": 0.0001624615988187386, "loss": 2.3366, "step": 24600 }, { "epoch": 0.31, "learning_rate": 0.0001624384369115355, "loss": 2.3308, "step": 24608 }, { "epoch": 0.31, "learning_rate": 0.00016241526974505432, "loss": 2.3752, "step": 24616 }, { "epoch": 0.31, "learning_rate": 0.0001623920973216186, "loss": 2.384, "step": 24624 }, { "epoch": 0.31, "learning_rate": 0.0001623689196435524, "loss": 2.3582, "step": 24632 }, { "epoch": 0.31, "learning_rate": 0.00016234573671318025, "loss": 2.3284, "step": 24640 }, { "epoch": 0.31, "learning_rate": 0.00016232254853282732, "loss": 2.3589, "step": 24648 }, { "epoch": 0.31, "learning_rate": 0.00016229935510481927, "loss": 2.3539, "step": 24656 }, { "epoch": 0.31, "learning_rate": 0.00016227615643148226, "loss": 2.3566, "step": 24664 }, { "epoch": 0.31, "learning_rate": 0.00016225295251514298, "loss": 2.3356, "step": 24672 }, { "epoch": 0.31, "learning_rate": 0.00016222974335812861, "loss": 2.3592, "step": 24680 }, { "epoch": 0.31, "learning_rate": 0.00016220652896276692, "loss": 2.3592, "step": 24688 }, { "epoch": 0.31, "learning_rate": 0.00016218330933138626, "loss": 2.3168, "step": 24696 }, { "epoch": 0.31, "learning_rate": 0.0001621600844663153, "loss": 2.3479, "step": 24704 }, { "epoch": 0.31, "learning_rate": 0.00016213685436988344, "loss": 2.3532, "step": 24712 }, { "epoch": 0.31, "learning_rate": 0.00016211361904442054, "loss": 2.381, "step": 24720 }, { "epoch": 0.31, "learning_rate": 0.00016209037849225687, "loss": 2.3638, "step": 24728 }, { "epoch": 0.31, "learning_rate": 0.00016206713271572348, "loss": 2.3467, "step": 24736 }, { "epoch": 0.31, "learning_rate": 0.00016204388171715164, "loss": 2.3445, "step": 24744 }, { "epoch": 0.31, "learning_rate": 0.0001620206254988734, "loss": 2.3513, "step": 24752 }, { "epoch": 0.31, "learning_rate": 0.00016199736406322118, "loss": 2.3738, "step": 24760 }, { "epoch": 0.31, "learning_rate": 0.00016197409741252797, "loss": 2.3668, "step": 24768 }, { "epoch": 0.31, "learning_rate": 0.00016195082554912727, "loss": 2.352, "step": 24776 }, { "epoch": 0.31, "learning_rate": 0.0001619275484753532, "loss": 2.3323, "step": 24784 }, { "epoch": 0.31, "learning_rate": 0.0001619042661935402, "loss": 2.345, "step": 24792 }, { "epoch": 0.31, "learning_rate": 0.00016188097870602347, "loss": 2.3678, "step": 24800 }, { "epoch": 0.31, "learning_rate": 0.0001618576860151385, "loss": 2.3336, "step": 24808 }, { "epoch": 0.31, "learning_rate": 0.00016183438812322144, "loss": 2.3462, "step": 24816 }, { "epoch": 0.31, "learning_rate": 0.000161811085032609, "loss": 2.3648, "step": 24824 }, { "epoch": 0.31, "learning_rate": 0.0001617877767456383, "loss": 2.359, "step": 24832 }, { "epoch": 0.31, "learning_rate": 0.00016176446326464705, "loss": 2.3535, "step": 24840 }, { "epoch": 0.31, "learning_rate": 0.00016174114459197345, "loss": 2.3545, "step": 24848 }, { "epoch": 0.31, "learning_rate": 0.00016171782072995622, "loss": 2.3495, "step": 24856 }, { "epoch": 0.31, "learning_rate": 0.0001616944916809346, "loss": 2.3503, "step": 24864 }, { "epoch": 0.31, "learning_rate": 0.00016167115744724839, "loss": 2.3568, "step": 24872 }, { "epoch": 0.31, "learning_rate": 0.00016164781803123786, "loss": 2.3508, "step": 24880 }, { "epoch": 0.31, "learning_rate": 0.00016162447343524389, "loss": 2.3444, "step": 24888 }, { "epoch": 0.31, "learning_rate": 0.0001616011236616077, "loss": 2.3645, "step": 24896 }, { "epoch": 0.31, "learning_rate": 0.0001615777687126712, "loss": 2.3424, "step": 24904 }, { "epoch": 0.31, "learning_rate": 0.00016155440859077678, "loss": 2.3547, "step": 24912 }, { "epoch": 0.31, "learning_rate": 0.00016153104329826728, "loss": 2.3337, "step": 24920 }, { "epoch": 0.31, "learning_rate": 0.0001615076728374861, "loss": 2.3787, "step": 24928 }, { "epoch": 0.31, "learning_rate": 0.00016148429721077727, "loss": 2.3323, "step": 24936 }, { "epoch": 0.31, "learning_rate": 0.00016146091642048511, "loss": 2.3654, "step": 24944 }, { "epoch": 0.31, "learning_rate": 0.00016143753046895463, "loss": 2.3683, "step": 24952 }, { "epoch": 0.31, "learning_rate": 0.0001614141393585313, "loss": 2.3359, "step": 24960 }, { "epoch": 0.31, "learning_rate": 0.00016139074309156116, "loss": 2.3483, "step": 24968 }, { "epoch": 0.31, "learning_rate": 0.00016136734167039064, "loss": 2.3603, "step": 24976 }, { "epoch": 0.31, "learning_rate": 0.0001613439350973668, "loss": 2.3502, "step": 24984 }, { "epoch": 0.31, "learning_rate": 0.00016132052337483724, "loss": 2.3342, "step": 24992 }, { "epoch": 0.31, "learning_rate": 0.00016129710650515, "loss": 2.3699, "step": 25000 }, { "epoch": 0.31, "learning_rate": 0.00016127368449065358, "loss": 2.344, "step": 25008 }, { "epoch": 0.31, "learning_rate": 0.00016125025733369717, "loss": 2.3424, "step": 25016 }, { "epoch": 0.31, "learning_rate": 0.00016122682503663037, "loss": 2.3594, "step": 25024 }, { "epoch": 0.31, "learning_rate": 0.00016120338760180328, "loss": 2.36, "step": 25032 }, { "epoch": 0.31, "learning_rate": 0.00016117994503156652, "loss": 2.3613, "step": 25040 }, { "epoch": 0.31, "learning_rate": 0.00016115649732827128, "loss": 2.3258, "step": 25048 }, { "epoch": 0.31, "learning_rate": 0.00016113304449426923, "loss": 2.3698, "step": 25056 }, { "epoch": 0.31, "learning_rate": 0.00016110958653191258, "loss": 2.3586, "step": 25064 }, { "epoch": 0.31, "learning_rate": 0.00016108612344355397, "loss": 2.3525, "step": 25072 }, { "epoch": 0.31, "learning_rate": 0.00016106265523154666, "loss": 2.3534, "step": 25080 }, { "epoch": 0.31, "learning_rate": 0.00016103918189824438, "loss": 2.3509, "step": 25088 }, { "epoch": 0.31, "learning_rate": 0.00016101570344600135, "loss": 2.3679, "step": 25096 }, { "epoch": 0.31, "learning_rate": 0.00016099221987717232, "loss": 2.3677, "step": 25104 }, { "epoch": 0.31, "learning_rate": 0.0001609687311941126, "loss": 2.361, "step": 25112 }, { "epoch": 0.31, "learning_rate": 0.00016094523739917794, "loss": 2.3361, "step": 25120 }, { "epoch": 0.31, "learning_rate": 0.00016092173849472464, "loss": 2.3544, "step": 25128 }, { "epoch": 0.31, "learning_rate": 0.00016089823448310947, "loss": 2.3409, "step": 25136 }, { "epoch": 0.31, "learning_rate": 0.00016087472536668984, "loss": 2.3485, "step": 25144 }, { "epoch": 0.31, "learning_rate": 0.0001608512111478235, "loss": 2.353, "step": 25152 }, { "epoch": 0.31, "learning_rate": 0.00016082769182886885, "loss": 2.3376, "step": 25160 }, { "epoch": 0.31, "learning_rate": 0.0001608041674121847, "loss": 2.3499, "step": 25168 }, { "epoch": 0.31, "learning_rate": 0.00016078063790013044, "loss": 2.3453, "step": 25176 }, { "epoch": 0.31, "learning_rate": 0.0001607571032950659, "loss": 2.3383, "step": 25184 }, { "epoch": 0.31, "learning_rate": 0.0001607335635993515, "loss": 2.3628, "step": 25192 }, { "epoch": 0.32, "learning_rate": 0.00016071001881534818, "loss": 2.3678, "step": 25200 }, { "epoch": 0.32, "learning_rate": 0.0001606864689454173, "loss": 2.3337, "step": 25208 }, { "epoch": 0.32, "learning_rate": 0.0001606629139919208, "loss": 2.3558, "step": 25216 }, { "epoch": 0.32, "learning_rate": 0.00016063935395722108, "loss": 2.3316, "step": 25224 }, { "epoch": 0.32, "learning_rate": 0.0001606157888436811, "loss": 2.3502, "step": 25232 }, { "epoch": 0.32, "learning_rate": 0.0001605922186536643, "loss": 2.3596, "step": 25240 }, { "epoch": 0.32, "learning_rate": 0.00016056864338953467, "loss": 2.3441, "step": 25248 }, { "epoch": 0.32, "learning_rate": 0.00016054506305365662, "loss": 2.3555, "step": 25256 }, { "epoch": 0.32, "learning_rate": 0.00016052147764839515, "loss": 2.3349, "step": 25264 }, { "epoch": 0.32, "learning_rate": 0.00016049788717611575, "loss": 2.3601, "step": 25272 }, { "epoch": 0.32, "learning_rate": 0.00016047429163918442, "loss": 2.3557, "step": 25280 }, { "epoch": 0.32, "learning_rate": 0.00016045069103996765, "loss": 2.3347, "step": 25288 }, { "epoch": 0.32, "learning_rate": 0.00016042708538083238, "loss": 2.3745, "step": 25296 }, { "epoch": 0.32, "learning_rate": 0.00016040347466414622, "loss": 2.3502, "step": 25304 }, { "epoch": 0.32, "learning_rate": 0.00016037985889227714, "loss": 2.3538, "step": 25312 }, { "epoch": 0.32, "learning_rate": 0.00016035623806759367, "loss": 2.3558, "step": 25320 }, { "epoch": 0.32, "learning_rate": 0.0001603326121924649, "loss": 2.3514, "step": 25328 }, { "epoch": 0.32, "learning_rate": 0.0001603089812692603, "loss": 2.3545, "step": 25336 }, { "epoch": 0.32, "learning_rate": 0.00016028534530034992, "loss": 2.3417, "step": 25344 }, { "epoch": 0.32, "learning_rate": 0.00016026170428810437, "loss": 2.3681, "step": 25352 }, { "epoch": 0.32, "learning_rate": 0.00016023805823489468, "loss": 2.3764, "step": 25360 }, { "epoch": 0.32, "learning_rate": 0.0001602144071430924, "loss": 2.3735, "step": 25368 }, { "epoch": 0.32, "learning_rate": 0.00016019075101506963, "loss": 2.3288, "step": 25376 }, { "epoch": 0.32, "learning_rate": 0.00016016708985319892, "loss": 2.3661, "step": 25384 }, { "epoch": 0.32, "learning_rate": 0.00016014342365985336, "loss": 2.3376, "step": 25392 }, { "epoch": 0.32, "learning_rate": 0.00016011975243740653, "loss": 2.369, "step": 25400 }, { "epoch": 0.32, "learning_rate": 0.00016009607618823254, "loss": 2.3474, "step": 25408 }, { "epoch": 0.32, "learning_rate": 0.00016007239491470595, "loss": 2.3394, "step": 25416 }, { "epoch": 0.32, "learning_rate": 0.0001600487086192019, "loss": 2.3354, "step": 25424 }, { "epoch": 0.32, "learning_rate": 0.00016002501730409595, "loss": 2.3636, "step": 25432 }, { "epoch": 0.32, "learning_rate": 0.00016000132097176422, "loss": 2.3228, "step": 25440 }, { "epoch": 0.32, "learning_rate": 0.0001599776196245833, "loss": 2.3397, "step": 25448 }, { "epoch": 0.32, "learning_rate": 0.00015995391326493037, "loss": 2.3327, "step": 25456 }, { "epoch": 0.32, "learning_rate": 0.00015993020189518294, "loss": 2.36, "step": 25464 }, { "epoch": 0.32, "learning_rate": 0.00015990648551771923, "loss": 2.3627, "step": 25472 }, { "epoch": 0.32, "learning_rate": 0.00015988276413491777, "loss": 2.3344, "step": 25480 }, { "epoch": 0.32, "learning_rate": 0.00015985903774915774, "loss": 2.3618, "step": 25488 }, { "epoch": 0.32, "learning_rate": 0.00015983530636281873, "loss": 2.364, "step": 25496 }, { "epoch": 0.32, "learning_rate": 0.00015981156997828087, "loss": 2.3557, "step": 25504 }, { "epoch": 0.32, "learning_rate": 0.00015978782859792483, "loss": 2.3556, "step": 25512 }, { "epoch": 0.32, "learning_rate": 0.00015976408222413165, "loss": 2.3487, "step": 25520 }, { "epoch": 0.32, "learning_rate": 0.00015974033085928302, "loss": 2.3641, "step": 25528 }, { "epoch": 0.32, "learning_rate": 0.00015971657450576104, "loss": 2.3469, "step": 25536 }, { "epoch": 0.32, "learning_rate": 0.00015969281316594836, "loss": 2.3521, "step": 25544 }, { "epoch": 0.32, "learning_rate": 0.00015966904684222807, "loss": 2.3417, "step": 25552 }, { "epoch": 0.32, "learning_rate": 0.00015964527553698386, "loss": 2.3446, "step": 25560 }, { "epoch": 0.32, "learning_rate": 0.00015962149925259977, "loss": 2.3452, "step": 25568 }, { "epoch": 0.32, "learning_rate": 0.0001595977179914605, "loss": 2.3637, "step": 25576 }, { "epoch": 0.32, "learning_rate": 0.00015957393175595113, "loss": 2.3543, "step": 25584 }, { "epoch": 0.32, "learning_rate": 0.00015955014054845737, "loss": 2.3542, "step": 25592 }, { "epoch": 0.32, "learning_rate": 0.00015952634437136522, "loss": 2.351, "step": 25600 }, { "epoch": 0.32, "learning_rate": 0.0001595025432270614, "loss": 2.3437, "step": 25608 }, { "epoch": 0.32, "learning_rate": 0.00015947873711793294, "loss": 2.3741, "step": 25616 }, { "epoch": 0.32, "learning_rate": 0.00015945492604636755, "loss": 2.3573, "step": 25624 }, { "epoch": 0.32, "learning_rate": 0.00015943111001475333, "loss": 2.3406, "step": 25632 }, { "epoch": 0.32, "learning_rate": 0.00015940728902547882, "loss": 2.362, "step": 25640 }, { "epoch": 0.32, "learning_rate": 0.0001593834630809332, "loss": 2.3443, "step": 25648 }, { "epoch": 0.32, "learning_rate": 0.00015935963218350604, "loss": 2.3741, "step": 25656 }, { "epoch": 0.32, "learning_rate": 0.00015933579633558746, "loss": 2.3339, "step": 25664 }, { "epoch": 0.32, "learning_rate": 0.00015931195553956805, "loss": 2.3407, "step": 25672 }, { "epoch": 0.32, "learning_rate": 0.00015928810979783895, "loss": 2.3564, "step": 25680 }, { "epoch": 0.32, "learning_rate": 0.00015926425911279171, "loss": 2.3782, "step": 25688 }, { "epoch": 0.32, "learning_rate": 0.00015924040348681842, "loss": 2.3478, "step": 25696 }, { "epoch": 0.32, "learning_rate": 0.00015921654292231166, "loss": 2.3544, "step": 25704 }, { "epoch": 0.32, "learning_rate": 0.00015919267742166453, "loss": 2.3387, "step": 25712 }, { "epoch": 0.32, "learning_rate": 0.00015916880698727058, "loss": 2.3613, "step": 25720 }, { "epoch": 0.32, "learning_rate": 0.00015914493162152396, "loss": 2.3464, "step": 25728 }, { "epoch": 0.32, "learning_rate": 0.0001591210513268191, "loss": 2.3402, "step": 25736 }, { "epoch": 0.32, "learning_rate": 0.00015909716610555113, "loss": 2.3524, "step": 25744 }, { "epoch": 0.32, "learning_rate": 0.00015907327596011563, "loss": 2.3427, "step": 25752 }, { "epoch": 0.32, "learning_rate": 0.0001590493808929086, "loss": 2.347, "step": 25760 }, { "epoch": 0.32, "learning_rate": 0.00015902548090632662, "loss": 2.3587, "step": 25768 }, { "epoch": 0.32, "learning_rate": 0.00015900157600276667, "loss": 2.3541, "step": 25776 }, { "epoch": 0.32, "learning_rate": 0.0001589776661846263, "loss": 2.3557, "step": 25784 }, { "epoch": 0.32, "learning_rate": 0.00015895375145430355, "loss": 2.3426, "step": 25792 }, { "epoch": 0.32, "learning_rate": 0.0001589298318141969, "loss": 2.3521, "step": 25800 }, { "epoch": 0.32, "learning_rate": 0.00015890590726670538, "loss": 2.3145, "step": 25808 }, { "epoch": 0.32, "learning_rate": 0.0001588819778142285, "loss": 2.3619, "step": 25816 }, { "epoch": 0.32, "learning_rate": 0.00015885804345916623, "loss": 2.328, "step": 25824 }, { "epoch": 0.32, "learning_rate": 0.000158834104203919, "loss": 2.3757, "step": 25832 }, { "epoch": 0.32, "learning_rate": 0.00015881016005088786, "loss": 2.329, "step": 25840 }, { "epoch": 0.32, "learning_rate": 0.0001587862110024742, "loss": 2.3689, "step": 25848 }, { "epoch": 0.32, "learning_rate": 0.0001587622570610801, "loss": 2.3612, "step": 25856 }, { "epoch": 0.32, "learning_rate": 0.00015873829822910784, "loss": 2.3493, "step": 25864 }, { "epoch": 0.32, "learning_rate": 0.00015871433450896045, "loss": 2.3461, "step": 25872 }, { "epoch": 0.32, "learning_rate": 0.00015869036590304133, "loss": 2.3466, "step": 25880 }, { "epoch": 0.32, "learning_rate": 0.00015866639241375442, "loss": 2.3555, "step": 25888 }, { "epoch": 0.32, "learning_rate": 0.00015864241404350412, "loss": 2.3412, "step": 25896 }, { "epoch": 0.32, "learning_rate": 0.00015861843079469532, "loss": 2.3376, "step": 25904 }, { "epoch": 0.32, "learning_rate": 0.0001585944426697334, "loss": 2.3717, "step": 25912 }, { "epoch": 0.32, "learning_rate": 0.0001585704496710242, "loss": 2.3511, "step": 25920 }, { "epoch": 0.32, "learning_rate": 0.00015854645180097415, "loss": 2.3541, "step": 25928 }, { "epoch": 0.32, "learning_rate": 0.00015852244906199, "loss": 2.3503, "step": 25936 }, { "epoch": 0.32, "learning_rate": 0.00015849844145647923, "loss": 2.3597, "step": 25944 }, { "epoch": 0.32, "learning_rate": 0.00015847442898684957, "loss": 2.3428, "step": 25952 }, { "epoch": 0.32, "learning_rate": 0.00015845041165550932, "loss": 2.3713, "step": 25960 }, { "epoch": 0.32, "learning_rate": 0.00015842638946486734, "loss": 2.3428, "step": 25968 }, { "epoch": 0.32, "learning_rate": 0.0001584023624173329, "loss": 2.3439, "step": 25976 }, { "epoch": 0.32, "learning_rate": 0.00015837833051531575, "loss": 2.3665, "step": 25984 }, { "epoch": 0.32, "learning_rate": 0.00015835429376122618, "loss": 2.3568, "step": 25992 }, { "epoch": 0.33, "learning_rate": 0.00015833025215747498, "loss": 2.3508, "step": 26000 }, { "epoch": 0.33, "learning_rate": 0.0001583062057064733, "loss": 2.37, "step": 26008 }, { "epoch": 0.33, "learning_rate": 0.00015828215441063292, "loss": 2.3413, "step": 26016 }, { "epoch": 0.33, "learning_rate": 0.000158258098272366, "loss": 2.3753, "step": 26024 }, { "epoch": 0.33, "learning_rate": 0.0001582340372940853, "loss": 2.3664, "step": 26032 }, { "epoch": 0.33, "learning_rate": 0.00015820997147820398, "loss": 2.3182, "step": 26040 }, { "epoch": 0.33, "learning_rate": 0.00015818590082713568, "loss": 2.3373, "step": 26048 }, { "epoch": 0.33, "learning_rate": 0.00015816182534329455, "loss": 2.3565, "step": 26056 }, { "epoch": 0.33, "learning_rate": 0.00015813774502909525, "loss": 2.3632, "step": 26064 }, { "epoch": 0.33, "learning_rate": 0.0001581136598869529, "loss": 2.3606, "step": 26072 }, { "epoch": 0.33, "learning_rate": 0.0001580895699192831, "loss": 2.3742, "step": 26080 }, { "epoch": 0.33, "learning_rate": 0.0001580654751285019, "loss": 2.3302, "step": 26088 }, { "epoch": 0.33, "learning_rate": 0.00015804137551702588, "loss": 2.3556, "step": 26096 }, { "epoch": 0.33, "learning_rate": 0.00015801727108727217, "loss": 2.3447, "step": 26104 }, { "epoch": 0.33, "learning_rate": 0.0001579931618416582, "loss": 2.3368, "step": 26112 }, { "epoch": 0.33, "learning_rate": 0.00015796904778260209, "loss": 2.374, "step": 26120 }, { "epoch": 0.33, "learning_rate": 0.00015794492891252226, "loss": 2.3352, "step": 26128 }, { "epoch": 0.33, "learning_rate": 0.00015792080523383773, "loss": 2.3634, "step": 26136 }, { "epoch": 0.33, "learning_rate": 0.000157896676748968, "loss": 2.3441, "step": 26144 }, { "epoch": 0.33, "learning_rate": 0.00015787254346033292, "loss": 2.3276, "step": 26152 }, { "epoch": 0.33, "learning_rate": 0.00015784840537035305, "loss": 2.3567, "step": 26160 }, { "epoch": 0.33, "learning_rate": 0.00015782426248144924, "loss": 2.3533, "step": 26168 }, { "epoch": 0.33, "learning_rate": 0.00015780011479604288, "loss": 2.3451, "step": 26176 }, { "epoch": 0.33, "learning_rate": 0.00015777596231655587, "loss": 2.3481, "step": 26184 }, { "epoch": 0.33, "learning_rate": 0.00015775180504541054, "loss": 2.3433, "step": 26192 }, { "epoch": 0.33, "learning_rate": 0.00015772764298502972, "loss": 2.327, "step": 26200 }, { "epoch": 0.33, "learning_rate": 0.0001577034761378368, "loss": 2.3611, "step": 26208 }, { "epoch": 0.33, "learning_rate": 0.0001576793045062555, "loss": 2.3377, "step": 26216 }, { "epoch": 0.33, "learning_rate": 0.0001576551280927101, "loss": 2.3541, "step": 26224 }, { "epoch": 0.33, "learning_rate": 0.0001576309468996254, "loss": 2.3543, "step": 26232 }, { "epoch": 0.33, "learning_rate": 0.00015760676092942661, "loss": 2.3363, "step": 26240 }, { "epoch": 0.33, "learning_rate": 0.00015758257018453947, "loss": 2.365, "step": 26248 }, { "epoch": 0.33, "learning_rate": 0.00015755837466739016, "loss": 2.3608, "step": 26256 }, { "epoch": 0.33, "learning_rate": 0.00015753417438040535, "loss": 2.3474, "step": 26264 }, { "epoch": 0.33, "learning_rate": 0.00015750996932601218, "loss": 2.3553, "step": 26272 }, { "epoch": 0.33, "learning_rate": 0.00015748575950663834, "loss": 2.346, "step": 26280 }, { "epoch": 0.33, "learning_rate": 0.00015746154492471182, "loss": 2.3306, "step": 26288 }, { "epoch": 0.33, "learning_rate": 0.0001574373255826613, "loss": 2.3284, "step": 26296 }, { "epoch": 0.33, "learning_rate": 0.0001574131014829158, "loss": 2.352, "step": 26304 }, { "epoch": 0.33, "learning_rate": 0.00015738887262790494, "loss": 2.3187, "step": 26312 }, { "epoch": 0.33, "learning_rate": 0.00015736463902005864, "loss": 2.3556, "step": 26320 }, { "epoch": 0.33, "learning_rate": 0.00015734040066180745, "loss": 2.3584, "step": 26328 }, { "epoch": 0.33, "learning_rate": 0.00015731615755558225, "loss": 2.3371, "step": 26336 }, { "epoch": 0.33, "learning_rate": 0.00015729190970381463, "loss": 2.3758, "step": 26344 }, { "epoch": 0.33, "learning_rate": 0.0001572676571089364, "loss": 2.3543, "step": 26352 }, { "epoch": 0.33, "learning_rate": 0.00015724339977338003, "loss": 2.3462, "step": 26360 }, { "epoch": 0.33, "learning_rate": 0.0001572191376995783, "loss": 2.336, "step": 26368 }, { "epoch": 0.33, "learning_rate": 0.00015719487088996465, "loss": 2.3513, "step": 26376 }, { "epoch": 0.33, "learning_rate": 0.00015717059934697292, "loss": 2.3433, "step": 26384 }, { "epoch": 0.33, "learning_rate": 0.00015714632307303728, "loss": 2.3628, "step": 26392 }, { "epoch": 0.33, "learning_rate": 0.0001571220420705926, "loss": 2.3407, "step": 26400 }, { "epoch": 0.33, "learning_rate": 0.00015709775634207413, "loss": 2.3131, "step": 26408 }, { "epoch": 0.33, "learning_rate": 0.00015707346588991755, "loss": 2.3613, "step": 26416 }, { "epoch": 0.33, "learning_rate": 0.0001570491707165591, "loss": 2.3444, "step": 26424 }, { "epoch": 0.33, "learning_rate": 0.0001570248708244354, "loss": 2.3195, "step": 26432 }, { "epoch": 0.33, "learning_rate": 0.00015700056621598363, "loss": 2.3584, "step": 26440 }, { "epoch": 0.33, "learning_rate": 0.00015697625689364137, "loss": 2.3682, "step": 26448 }, { "epoch": 0.33, "learning_rate": 0.00015695194285984677, "loss": 2.3372, "step": 26456 }, { "epoch": 0.33, "learning_rate": 0.00015692762411703828, "loss": 2.3702, "step": 26464 }, { "epoch": 0.33, "learning_rate": 0.00015690330066765504, "loss": 2.3328, "step": 26472 }, { "epoch": 0.33, "learning_rate": 0.0001568789725141365, "loss": 2.3444, "step": 26480 }, { "epoch": 0.33, "learning_rate": 0.00015685463965892264, "loss": 2.339, "step": 26488 }, { "epoch": 0.33, "learning_rate": 0.0001568303021044539, "loss": 2.3607, "step": 26496 }, { "epoch": 0.33, "learning_rate": 0.00015680595985317127, "loss": 2.3462, "step": 26504 }, { "epoch": 0.33, "learning_rate": 0.00015678161290751604, "loss": 2.3455, "step": 26512 }, { "epoch": 0.33, "learning_rate": 0.00015675726126993013, "loss": 2.3634, "step": 26520 }, { "epoch": 0.33, "learning_rate": 0.00015673290494285587, "loss": 2.3436, "step": 26528 }, { "epoch": 0.33, "learning_rate": 0.00015670854392873601, "loss": 2.3242, "step": 26536 }, { "epoch": 0.33, "learning_rate": 0.00015668417823001387, "loss": 2.3532, "step": 26544 }, { "epoch": 0.33, "learning_rate": 0.00015665980784913318, "loss": 2.3646, "step": 26552 }, { "epoch": 0.33, "learning_rate": 0.00015663543278853818, "loss": 2.3541, "step": 26560 }, { "epoch": 0.33, "learning_rate": 0.0001566110530506735, "loss": 2.3552, "step": 26568 }, { "epoch": 0.33, "learning_rate": 0.0001565866686379843, "loss": 2.3261, "step": 26576 }, { "epoch": 0.33, "learning_rate": 0.00015656227955291625, "loss": 2.3554, "step": 26584 }, { "epoch": 0.33, "learning_rate": 0.00015653788579791535, "loss": 2.3611, "step": 26592 }, { "epoch": 0.33, "learning_rate": 0.0001565134873754282, "loss": 2.3374, "step": 26600 }, { "epoch": 0.33, "learning_rate": 0.0001564890842879019, "loss": 2.3489, "step": 26608 }, { "epoch": 0.33, "learning_rate": 0.00015646467653778381, "loss": 2.3733, "step": 26616 }, { "epoch": 0.33, "learning_rate": 0.00015644026412752195, "loss": 2.3396, "step": 26624 }, { "epoch": 0.33, "learning_rate": 0.00015641584705956474, "loss": 2.368, "step": 26632 }, { "epoch": 0.33, "learning_rate": 0.0001563914253363611, "loss": 2.3337, "step": 26640 }, { "epoch": 0.33, "learning_rate": 0.00015636699896036036, "loss": 2.3404, "step": 26648 }, { "epoch": 0.33, "learning_rate": 0.00015634256793401233, "loss": 2.3482, "step": 26656 }, { "epoch": 0.33, "learning_rate": 0.00015631813225976734, "loss": 2.3404, "step": 26664 }, { "epoch": 0.33, "learning_rate": 0.00015629369194007618, "loss": 2.3383, "step": 26672 }, { "epoch": 0.33, "learning_rate": 0.00015626924697738993, "loss": 2.3398, "step": 26680 }, { "epoch": 0.33, "learning_rate": 0.00015624479737416048, "loss": 2.3386, "step": 26688 }, { "epoch": 0.33, "learning_rate": 0.00015622034313283987, "loss": 2.3544, "step": 26696 }, { "epoch": 0.33, "learning_rate": 0.0001561958842558807, "loss": 2.367, "step": 26704 }, { "epoch": 0.33, "learning_rate": 0.00015617142074573616, "loss": 2.3442, "step": 26712 }, { "epoch": 0.33, "learning_rate": 0.00015614695260485973, "loss": 2.3491, "step": 26720 }, { "epoch": 0.33, "learning_rate": 0.0001561224798357054, "loss": 2.3523, "step": 26728 }, { "epoch": 0.33, "learning_rate": 0.0001560980024407277, "loss": 2.3193, "step": 26736 }, { "epoch": 0.33, "learning_rate": 0.00015607352042238158, "loss": 2.3346, "step": 26744 }, { "epoch": 0.33, "learning_rate": 0.00015604903378312244, "loss": 2.3652, "step": 26752 }, { "epoch": 0.33, "learning_rate": 0.00015602454252540608, "loss": 2.3316, "step": 26760 }, { "epoch": 0.33, "learning_rate": 0.00015600004665168894, "loss": 2.3361, "step": 26768 }, { "epoch": 0.33, "learning_rate": 0.00015597554616442774, "loss": 2.3498, "step": 26776 }, { "epoch": 0.33, "learning_rate": 0.00015595104106607983, "loss": 2.3353, "step": 26784 }, { "epoch": 0.33, "learning_rate": 0.00015592653135910282, "loss": 2.3532, "step": 26792 }, { "epoch": 0.34, "learning_rate": 0.00015590201704595495, "loss": 2.3302, "step": 26800 }, { "epoch": 0.34, "learning_rate": 0.0001558774981290949, "loss": 2.3484, "step": 26808 }, { "epoch": 0.34, "learning_rate": 0.0001558529746109817, "loss": 2.3495, "step": 26816 }, { "epoch": 0.34, "learning_rate": 0.000155828446494075, "loss": 2.3646, "step": 26824 }, { "epoch": 0.34, "learning_rate": 0.00015580391378083478, "loss": 2.3281, "step": 26832 }, { "epoch": 0.34, "learning_rate": 0.00015577937647372157, "loss": 2.33, "step": 26840 }, { "epoch": 0.34, "learning_rate": 0.00015575483457519625, "loss": 2.3452, "step": 26848 }, { "epoch": 0.34, "learning_rate": 0.00015573028808772032, "loss": 2.3138, "step": 26856 }, { "epoch": 0.34, "learning_rate": 0.00015570573701375562, "loss": 2.3516, "step": 26864 }, { "epoch": 0.34, "learning_rate": 0.0001556811813557645, "loss": 2.3445, "step": 26872 }, { "epoch": 0.34, "learning_rate": 0.00015565662111620965, "loss": 2.3429, "step": 26880 }, { "epoch": 0.34, "learning_rate": 0.00015563205629755449, "loss": 2.3573, "step": 26888 }, { "epoch": 0.34, "learning_rate": 0.0001556074869022626, "loss": 2.3477, "step": 26896 }, { "epoch": 0.34, "learning_rate": 0.00015558291293279824, "loss": 2.3274, "step": 26904 }, { "epoch": 0.34, "learning_rate": 0.00015555833439162597, "loss": 2.3406, "step": 26912 }, { "epoch": 0.34, "learning_rate": 0.00015553375128121092, "loss": 2.3379, "step": 26920 }, { "epoch": 0.34, "learning_rate": 0.00015550916360401864, "loss": 2.3392, "step": 26928 }, { "epoch": 0.34, "learning_rate": 0.00015548457136251508, "loss": 2.3623, "step": 26936 }, { "epoch": 0.34, "learning_rate": 0.00015545997455916675, "loss": 2.3331, "step": 26944 }, { "epoch": 0.34, "learning_rate": 0.0001554353731964406, "loss": 2.3389, "step": 26952 }, { "epoch": 0.34, "learning_rate": 0.00015541076727680395, "loss": 2.352, "step": 26960 }, { "epoch": 0.34, "learning_rate": 0.00015538615680272465, "loss": 2.3686, "step": 26968 }, { "epoch": 0.34, "learning_rate": 0.00015536154177667096, "loss": 2.3361, "step": 26976 }, { "epoch": 0.34, "learning_rate": 0.00015533692220111173, "loss": 2.3631, "step": 26984 }, { "epoch": 0.34, "learning_rate": 0.00015531229807851606, "loss": 2.3459, "step": 26992 }, { "epoch": 0.34, "learning_rate": 0.00015528766941135365, "loss": 2.3276, "step": 27000 }, { "epoch": 0.34, "learning_rate": 0.00015526303620209462, "loss": 2.3583, "step": 27008 }, { "epoch": 0.34, "learning_rate": 0.0001552383984532095, "loss": 2.3418, "step": 27016 }, { "epoch": 0.34, "learning_rate": 0.0001552137561671694, "loss": 2.3421, "step": 27024 }, { "epoch": 0.34, "learning_rate": 0.00015518910934644574, "loss": 2.3628, "step": 27032 }, { "epoch": 0.34, "learning_rate": 0.00015516445799351045, "loss": 2.3553, "step": 27040 }, { "epoch": 0.34, "learning_rate": 0.00015513980211083594, "loss": 2.3505, "step": 27048 }, { "epoch": 0.34, "learning_rate": 0.00015511514170089504, "loss": 2.362, "step": 27056 }, { "epoch": 0.34, "learning_rate": 0.00015509047676616112, "loss": 2.3502, "step": 27064 }, { "epoch": 0.34, "learning_rate": 0.0001550658073091078, "loss": 2.3353, "step": 27072 }, { "epoch": 0.34, "learning_rate": 0.00015504113333220942, "loss": 2.3458, "step": 27080 }, { "epoch": 0.34, "learning_rate": 0.0001550164548379406, "loss": 2.349, "step": 27088 }, { "epoch": 0.34, "learning_rate": 0.0001549917718287764, "loss": 2.3257, "step": 27096 }, { "epoch": 0.34, "learning_rate": 0.0001549670843071924, "loss": 2.3582, "step": 27104 }, { "epoch": 0.34, "learning_rate": 0.00015494239227566468, "loss": 2.3337, "step": 27112 }, { "epoch": 0.34, "learning_rate": 0.00015491769573666966, "loss": 2.3431, "step": 27120 }, { "epoch": 0.34, "learning_rate": 0.0001548929946926843, "loss": 2.3536, "step": 27128 }, { "epoch": 0.34, "learning_rate": 0.0001548682891461859, "loss": 2.3524, "step": 27136 }, { "epoch": 0.34, "learning_rate": 0.00015484357909965237, "loss": 2.3405, "step": 27144 }, { "epoch": 0.34, "learning_rate": 0.00015481886455556197, "loss": 2.3395, "step": 27152 }, { "epoch": 0.34, "learning_rate": 0.00015479414551639338, "loss": 2.3419, "step": 27160 }, { "epoch": 0.34, "learning_rate": 0.0001547694219846258, "loss": 2.3394, "step": 27168 }, { "epoch": 0.34, "learning_rate": 0.0001547446939627389, "loss": 2.3433, "step": 27176 }, { "epoch": 0.34, "learning_rate": 0.00015471996145321272, "loss": 2.3401, "step": 27184 }, { "epoch": 0.34, "learning_rate": 0.00015469522445852782, "loss": 2.3359, "step": 27192 }, { "epoch": 0.34, "learning_rate": 0.00015467048298116516, "loss": 2.3478, "step": 27200 }, { "epoch": 0.34, "learning_rate": 0.00015464573702360617, "loss": 2.3498, "step": 27208 }, { "epoch": 0.34, "learning_rate": 0.00015462098658833274, "loss": 2.3467, "step": 27216 }, { "epoch": 0.34, "learning_rate": 0.00015459623167782719, "loss": 2.3392, "step": 27224 }, { "epoch": 0.34, "learning_rate": 0.0001545714722945723, "loss": 2.3436, "step": 27232 }, { "epoch": 0.34, "learning_rate": 0.00015454670844105125, "loss": 2.3436, "step": 27240 }, { "epoch": 0.34, "learning_rate": 0.0001545219401197478, "loss": 2.3522, "step": 27248 }, { "epoch": 0.34, "learning_rate": 0.00015449716733314606, "loss": 2.3591, "step": 27256 }, { "epoch": 0.34, "learning_rate": 0.00015447239008373052, "loss": 2.3432, "step": 27264 }, { "epoch": 0.34, "learning_rate": 0.00015444760837398627, "loss": 2.3186, "step": 27272 }, { "epoch": 0.34, "learning_rate": 0.00015442282220639876, "loss": 2.3482, "step": 27280 }, { "epoch": 0.34, "learning_rate": 0.0001543980315834539, "loss": 2.3542, "step": 27288 }, { "epoch": 0.34, "learning_rate": 0.000154373236507638, "loss": 2.3371, "step": 27296 }, { "epoch": 0.34, "learning_rate": 0.00015434843698143797, "loss": 2.3645, "step": 27304 }, { "epoch": 0.34, "learning_rate": 0.00015432363300734095, "loss": 2.3462, "step": 27312 }, { "epoch": 0.34, "learning_rate": 0.00015429882458783473, "loss": 2.335, "step": 27320 }, { "epoch": 0.34, "learning_rate": 0.0001542740117254074, "loss": 2.35, "step": 27328 }, { "epoch": 0.34, "learning_rate": 0.00015424919442254758, "loss": 2.3501, "step": 27336 }, { "epoch": 0.34, "learning_rate": 0.00015422437268174425, "loss": 2.3226, "step": 27344 }, { "epoch": 0.34, "learning_rate": 0.000154199546505487, "loss": 2.3499, "step": 27352 }, { "epoch": 0.34, "learning_rate": 0.00015417471589626564, "loss": 2.3527, "step": 27360 }, { "epoch": 0.34, "learning_rate": 0.0001541498808565706, "loss": 2.3363, "step": 27368 }, { "epoch": 0.34, "learning_rate": 0.00015412504138889263, "loss": 2.338, "step": 27376 }, { "epoch": 0.34, "learning_rate": 0.00015410019749572307, "loss": 2.3607, "step": 27384 }, { "epoch": 0.34, "learning_rate": 0.00015407534917955356, "loss": 2.3495, "step": 27392 }, { "epoch": 0.34, "learning_rate": 0.00015405049644287631, "loss": 2.3433, "step": 27400 }, { "epoch": 0.34, "learning_rate": 0.00015402563928818385, "loss": 2.3516, "step": 27408 }, { "epoch": 0.34, "learning_rate": 0.00015400077771796926, "loss": 2.3483, "step": 27416 }, { "epoch": 0.34, "learning_rate": 0.00015397591173472595, "loss": 2.331, "step": 27424 }, { "epoch": 0.34, "learning_rate": 0.00015395104134094788, "loss": 2.3395, "step": 27432 }, { "epoch": 0.34, "learning_rate": 0.00015392616653912941, "loss": 2.3596, "step": 27440 }, { "epoch": 0.34, "learning_rate": 0.00015390128733176536, "loss": 2.3341, "step": 27448 }, { "epoch": 0.34, "learning_rate": 0.00015387640372135092, "loss": 2.3516, "step": 27456 }, { "epoch": 0.34, "learning_rate": 0.0001538515157103818, "loss": 2.352, "step": 27464 }, { "epoch": 0.34, "learning_rate": 0.00015382662330135413, "loss": 2.3459, "step": 27472 }, { "epoch": 0.34, "learning_rate": 0.0001538017264967645, "loss": 2.3475, "step": 27480 }, { "epoch": 0.34, "learning_rate": 0.0001537768252991099, "loss": 2.3473, "step": 27488 }, { "epoch": 0.34, "learning_rate": 0.00015375191971088778, "loss": 2.337, "step": 27496 }, { "epoch": 0.34, "learning_rate": 0.00015372700973459598, "loss": 2.3546, "step": 27504 }, { "epoch": 0.34, "learning_rate": 0.0001537020953727329, "loss": 2.3639, "step": 27512 }, { "epoch": 0.34, "learning_rate": 0.0001536771766277973, "loss": 2.3299, "step": 27520 }, { "epoch": 0.34, "learning_rate": 0.00015365225350228836, "loss": 2.3784, "step": 27528 }, { "epoch": 0.34, "learning_rate": 0.00015362732599870572, "loss": 2.3445, "step": 27536 }, { "epoch": 0.34, "learning_rate": 0.00015360239411954952, "loss": 2.3425, "step": 27544 }, { "epoch": 0.34, "learning_rate": 0.00015357745786732024, "loss": 2.3485, "step": 27552 }, { "epoch": 0.34, "learning_rate": 0.00015355251724451886, "loss": 2.3412, "step": 27560 }, { "epoch": 0.34, "learning_rate": 0.0001535275722536468, "loss": 2.335, "step": 27568 }, { "epoch": 0.34, "learning_rate": 0.00015350262289720587, "loss": 2.3613, "step": 27576 }, { "epoch": 0.34, "learning_rate": 0.00015347766917769834, "loss": 2.336, "step": 27584 }, { "epoch": 0.34, "learning_rate": 0.000153452711097627, "loss": 2.34, "step": 27592 }, { "epoch": 0.34, "learning_rate": 0.00015342774865949492, "loss": 2.3729, "step": 27600 }, { "epoch": 0.35, "learning_rate": 0.0001534027818658057, "loss": 2.332, "step": 27608 }, { "epoch": 0.35, "learning_rate": 0.00015337781071906342, "loss": 2.3427, "step": 27616 }, { "epoch": 0.35, "learning_rate": 0.00015335283522177254, "loss": 2.331, "step": 27624 }, { "epoch": 0.35, "learning_rate": 0.00015332785537643792, "loss": 2.3674, "step": 27632 }, { "epoch": 0.35, "learning_rate": 0.0001533028711855649, "loss": 2.3552, "step": 27640 }, { "epoch": 0.35, "learning_rate": 0.00015327788265165928, "loss": 2.3365, "step": 27648 }, { "epoch": 0.35, "learning_rate": 0.00015325288977722728, "loss": 2.3378, "step": 27656 }, { "epoch": 0.35, "learning_rate": 0.0001532278925647755, "loss": 2.3511, "step": 27664 }, { "epoch": 0.35, "learning_rate": 0.000153202891016811, "loss": 2.3587, "step": 27672 }, { "epoch": 0.35, "learning_rate": 0.00015317788513584136, "loss": 2.3446, "step": 27680 }, { "epoch": 0.35, "learning_rate": 0.0001531528749243745, "loss": 2.3359, "step": 27688 }, { "epoch": 0.35, "learning_rate": 0.00015312786038491885, "loss": 2.3245, "step": 27696 }, { "epoch": 0.35, "learning_rate": 0.0001531028415199831, "loss": 2.3622, "step": 27704 }, { "epoch": 0.35, "learning_rate": 0.00015307781833207663, "loss": 2.3527, "step": 27712 }, { "epoch": 0.35, "learning_rate": 0.00015305279082370907, "loss": 2.335, "step": 27720 }, { "epoch": 0.35, "learning_rate": 0.00015302775899739052, "loss": 2.3363, "step": 27728 }, { "epoch": 0.35, "learning_rate": 0.00015300272285563156, "loss": 2.3449, "step": 27736 }, { "epoch": 0.35, "learning_rate": 0.00015297768240094318, "loss": 2.3365, "step": 27744 }, { "epoch": 0.35, "learning_rate": 0.00015295263763583677, "loss": 2.3446, "step": 27752 }, { "epoch": 0.35, "learning_rate": 0.00015292758856282418, "loss": 2.3681, "step": 27760 }, { "epoch": 0.35, "learning_rate": 0.0001529025351844177, "loss": 2.3404, "step": 27768 }, { "epoch": 0.35, "learning_rate": 0.00015287747750313005, "loss": 2.3392, "step": 27776 }, { "epoch": 0.35, "learning_rate": 0.00015285241552147436, "loss": 2.3452, "step": 27784 }, { "epoch": 0.35, "learning_rate": 0.0001528273492419642, "loss": 2.3503, "step": 27792 }, { "epoch": 0.35, "learning_rate": 0.00015280227866711364, "loss": 2.3446, "step": 27800 }, { "epoch": 0.35, "learning_rate": 0.00015277720379943698, "loss": 2.357, "step": 27808 }, { "epoch": 0.35, "learning_rate": 0.00015275212464144918, "loss": 2.3229, "step": 27816 }, { "epoch": 0.35, "learning_rate": 0.00015272704119566558, "loss": 2.3273, "step": 27824 }, { "epoch": 0.35, "learning_rate": 0.0001527019534646018, "loss": 2.3513, "step": 27832 }, { "epoch": 0.35, "learning_rate": 0.00015267686145077408, "loss": 2.3468, "step": 27840 }, { "epoch": 0.35, "learning_rate": 0.00015265176515669897, "loss": 2.3324, "step": 27848 }, { "epoch": 0.35, "learning_rate": 0.00015262666458489346, "loss": 2.3574, "step": 27856 }, { "epoch": 0.35, "learning_rate": 0.00015260155973787507, "loss": 2.3569, "step": 27864 }, { "epoch": 0.35, "learning_rate": 0.00015257645061816162, "loss": 2.3308, "step": 27872 }, { "epoch": 0.35, "learning_rate": 0.0001525513372282714, "loss": 2.3383, "step": 27880 }, { "epoch": 0.35, "learning_rate": 0.00015252621957072323, "loss": 2.3512, "step": 27888 }, { "epoch": 0.35, "learning_rate": 0.00015250109764803612, "loss": 2.3349, "step": 27896 }, { "epoch": 0.35, "learning_rate": 0.0001524759714627298, "loss": 2.3295, "step": 27904 }, { "epoch": 0.35, "learning_rate": 0.0001524508410173242, "loss": 2.3294, "step": 27912 }, { "epoch": 0.35, "learning_rate": 0.00015242570631433978, "loss": 2.3564, "step": 27920 }, { "epoch": 0.35, "learning_rate": 0.00015240056735629746, "loss": 2.3491, "step": 27928 }, { "epoch": 0.35, "learning_rate": 0.00015237542414571844, "loss": 2.3508, "step": 27936 }, { "epoch": 0.35, "learning_rate": 0.00015235027668512448, "loss": 2.3542, "step": 27944 }, { "epoch": 0.35, "learning_rate": 0.00015232512497703778, "loss": 2.3519, "step": 27952 }, { "epoch": 0.35, "learning_rate": 0.00015229996902398085, "loss": 2.3242, "step": 27960 }, { "epoch": 0.35, "learning_rate": 0.00015227480882847673, "loss": 2.3295, "step": 27968 }, { "epoch": 0.35, "learning_rate": 0.0001522496443930488, "loss": 2.3675, "step": 27976 }, { "epoch": 0.35, "learning_rate": 0.00015222447572022096, "loss": 2.3498, "step": 27984 }, { "epoch": 0.35, "learning_rate": 0.00015219930281251746, "loss": 2.3399, "step": 27992 }, { "epoch": 0.35, "learning_rate": 0.00015217412567246298, "loss": 2.3291, "step": 28000 }, { "epoch": 0.35, "learning_rate": 0.0001521489443025827, "loss": 2.3343, "step": 28008 }, { "epoch": 0.35, "learning_rate": 0.00015212375870540213, "loss": 2.3622, "step": 28016 }, { "epoch": 0.35, "learning_rate": 0.00015209856888344722, "loss": 2.3427, "step": 28024 }, { "epoch": 0.35, "learning_rate": 0.0001520733748392444, "loss": 2.3513, "step": 28032 }, { "epoch": 0.35, "learning_rate": 0.0001520481765753205, "loss": 2.3327, "step": 28040 }, { "epoch": 0.35, "learning_rate": 0.00015202297409420274, "loss": 2.3453, "step": 28048 }, { "epoch": 0.35, "learning_rate": 0.0001519977673984188, "loss": 2.3351, "step": 28056 }, { "epoch": 0.35, "learning_rate": 0.0001519725564904968, "loss": 2.3244, "step": 28064 }, { "epoch": 0.35, "learning_rate": 0.00015194734137296515, "loss": 2.3351, "step": 28072 }, { "epoch": 0.35, "learning_rate": 0.00015192212204835287, "loss": 2.3457, "step": 28080 }, { "epoch": 0.35, "learning_rate": 0.00015189689851918928, "loss": 2.3522, "step": 28088 }, { "epoch": 0.35, "learning_rate": 0.0001518716707880042, "loss": 2.3318, "step": 28096 }, { "epoch": 0.35, "learning_rate": 0.00015184643885732778, "loss": 2.3137, "step": 28104 }, { "epoch": 0.35, "learning_rate": 0.00015182120272969066, "loss": 2.3415, "step": 28112 }, { "epoch": 0.35, "learning_rate": 0.00015179596240762387, "loss": 2.3595, "step": 28120 }, { "epoch": 0.35, "learning_rate": 0.0001517707178936589, "loss": 2.3465, "step": 28128 }, { "epoch": 0.35, "learning_rate": 0.00015174546919032757, "loss": 2.338, "step": 28136 }, { "epoch": 0.35, "learning_rate": 0.00015172021630016226, "loss": 2.3299, "step": 28144 }, { "epoch": 0.35, "learning_rate": 0.00015169495922569566, "loss": 2.3421, "step": 28152 }, { "epoch": 0.35, "learning_rate": 0.00015166969796946087, "loss": 2.3332, "step": 28160 }, { "epoch": 0.35, "learning_rate": 0.00015164443253399152, "loss": 2.3336, "step": 28168 }, { "epoch": 0.35, "learning_rate": 0.00015161916292182154, "loss": 2.3521, "step": 28176 }, { "epoch": 0.35, "learning_rate": 0.00015159388913548537, "loss": 2.3402, "step": 28184 }, { "epoch": 0.35, "learning_rate": 0.00015156861117751778, "loss": 2.3478, "step": 28192 }, { "epoch": 0.35, "learning_rate": 0.00015154332905045403, "loss": 2.3329, "step": 28200 }, { "epoch": 0.35, "learning_rate": 0.00015151804275682977, "loss": 2.3357, "step": 28208 }, { "epoch": 0.35, "learning_rate": 0.00015149275229918107, "loss": 2.3491, "step": 28216 }, { "epoch": 0.35, "learning_rate": 0.00015146745768004444, "loss": 2.3523, "step": 28224 }, { "epoch": 0.35, "learning_rate": 0.00015144215890195678, "loss": 2.3362, "step": 28232 }, { "epoch": 0.35, "learning_rate": 0.00015141685596745542, "loss": 2.3381, "step": 28240 }, { "epoch": 0.35, "learning_rate": 0.00015139154887907805, "loss": 2.3543, "step": 28248 }, { "epoch": 0.35, "learning_rate": 0.0001513662376393629, "loss": 2.3439, "step": 28256 }, { "epoch": 0.35, "learning_rate": 0.00015134092225084847, "loss": 2.345, "step": 28264 }, { "epoch": 0.35, "learning_rate": 0.0001513156027160738, "loss": 2.3319, "step": 28272 }, { "epoch": 0.35, "learning_rate": 0.0001512902790375783, "loss": 2.332, "step": 28280 }, { "epoch": 0.35, "learning_rate": 0.00015126495121790178, "loss": 2.3283, "step": 28288 }, { "epoch": 0.35, "learning_rate": 0.00015123961925958445, "loss": 2.3364, "step": 28296 }, { "epoch": 0.35, "learning_rate": 0.00015121428316516698, "loss": 2.3491, "step": 28304 }, { "epoch": 0.35, "learning_rate": 0.00015118894293719045, "loss": 2.3717, "step": 28312 }, { "epoch": 0.35, "learning_rate": 0.00015116359857819634, "loss": 2.3313, "step": 28320 }, { "epoch": 0.35, "learning_rate": 0.00015113825009072657, "loss": 2.3385, "step": 28328 }, { "epoch": 0.35, "learning_rate": 0.0001511128974773234, "loss": 2.3365, "step": 28336 }, { "epoch": 0.35, "learning_rate": 0.00015108754074052955, "loss": 2.3404, "step": 28344 }, { "epoch": 0.35, "learning_rate": 0.00015106217988288816, "loss": 2.331, "step": 28352 }, { "epoch": 0.35, "learning_rate": 0.00015103681490694282, "loss": 2.3407, "step": 28360 }, { "epoch": 0.35, "learning_rate": 0.0001510114458152375, "loss": 2.3581, "step": 28368 }, { "epoch": 0.35, "learning_rate": 0.00015098607261031653, "loss": 2.3557, "step": 28376 }, { "epoch": 0.35, "learning_rate": 0.0001509606952947247, "loss": 2.3406, "step": 28384 }, { "epoch": 0.35, "learning_rate": 0.00015093531387100725, "loss": 2.3517, "step": 28392 }, { "epoch": 0.35, "learning_rate": 0.00015090992834170975, "loss": 2.3336, "step": 28400 }, { "epoch": 0.36, "learning_rate": 0.0001508845387093783, "loss": 2.3263, "step": 28408 }, { "epoch": 0.36, "learning_rate": 0.00015085914497655923, "loss": 2.3366, "step": 28416 }, { "epoch": 0.36, "learning_rate": 0.00015083374714579942, "loss": 2.3341, "step": 28424 }, { "epoch": 0.36, "learning_rate": 0.0001508083452196462, "loss": 2.3656, "step": 28432 }, { "epoch": 0.36, "learning_rate": 0.00015078293920064718, "loss": 2.3516, "step": 28440 }, { "epoch": 0.36, "learning_rate": 0.00015075752909135038, "loss": 2.3374, "step": 28448 }, { "epoch": 0.36, "learning_rate": 0.00015073211489430446, "loss": 2.3196, "step": 28456 }, { "epoch": 0.36, "learning_rate": 0.00015070669661205817, "loss": 2.3555, "step": 28464 }, { "epoch": 0.36, "learning_rate": 0.00015068127424716085, "loss": 2.3525, "step": 28472 }, { "epoch": 0.36, "learning_rate": 0.00015065584780216224, "loss": 2.35, "step": 28480 }, { "epoch": 0.36, "learning_rate": 0.00015063041727961246, "loss": 2.3504, "step": 28488 }, { "epoch": 0.36, "learning_rate": 0.00015060498268206206, "loss": 2.3407, "step": 28496 }, { "epoch": 0.36, "learning_rate": 0.000150579544012062, "loss": 2.3414, "step": 28504 }, { "epoch": 0.36, "learning_rate": 0.00015055410127216357, "loss": 2.3395, "step": 28512 }, { "epoch": 0.36, "learning_rate": 0.00015052865446491863, "loss": 2.3395, "step": 28520 }, { "epoch": 0.36, "learning_rate": 0.00015050320359287926, "loss": 2.3479, "step": 28528 }, { "epoch": 0.36, "learning_rate": 0.0001504777486585981, "loss": 2.3378, "step": 28536 }, { "epoch": 0.36, "learning_rate": 0.0001504522896646281, "loss": 2.3331, "step": 28544 }, { "epoch": 0.36, "learning_rate": 0.0001504268266135226, "loss": 2.3431, "step": 28552 }, { "epoch": 0.36, "learning_rate": 0.00015040135950783554, "loss": 2.3502, "step": 28560 }, { "epoch": 0.36, "learning_rate": 0.00015037588835012099, "loss": 2.3253, "step": 28568 }, { "epoch": 0.36, "learning_rate": 0.00015035041314293365, "loss": 2.3419, "step": 28576 }, { "epoch": 0.36, "learning_rate": 0.0001503249338888285, "loss": 2.3567, "step": 28584 }, { "epoch": 0.36, "learning_rate": 0.000150299450590361, "loss": 2.3198, "step": 28592 }, { "epoch": 0.36, "learning_rate": 0.00015027396325008696, "loss": 2.3482, "step": 28600 }, { "epoch": 0.36, "learning_rate": 0.00015024847187056258, "loss": 2.3629, "step": 28608 }, { "epoch": 0.36, "learning_rate": 0.00015022297645434453, "loss": 2.3581, "step": 28616 }, { "epoch": 0.36, "learning_rate": 0.00015019747700398988, "loss": 2.3516, "step": 28624 }, { "epoch": 0.36, "learning_rate": 0.00015017197352205604, "loss": 2.329, "step": 28632 }, { "epoch": 0.36, "learning_rate": 0.00015014646601110092, "loss": 2.3226, "step": 28640 }, { "epoch": 0.36, "learning_rate": 0.0001501209544736827, "loss": 2.3293, "step": 28648 }, { "epoch": 0.36, "learning_rate": 0.0001500954389123601, "loss": 2.3383, "step": 28656 }, { "epoch": 0.36, "learning_rate": 0.00015006991932969214, "loss": 2.3345, "step": 28664 }, { "epoch": 0.36, "learning_rate": 0.00015004439572823835, "loss": 2.347, "step": 28672 }, { "epoch": 0.36, "learning_rate": 0.0001500188681105586, "loss": 2.3363, "step": 28680 }, { "epoch": 0.36, "learning_rate": 0.00014999333647921308, "loss": 2.3535, "step": 28688 }, { "epoch": 0.36, "learning_rate": 0.00014996780083676256, "loss": 2.3487, "step": 28696 }, { "epoch": 0.36, "learning_rate": 0.00014994226118576808, "loss": 2.3424, "step": 28704 }, { "epoch": 0.36, "learning_rate": 0.0001499167175287911, "loss": 2.3354, "step": 28712 }, { "epoch": 0.36, "learning_rate": 0.00014989116986839358, "loss": 2.3441, "step": 28720 }, { "epoch": 0.36, "learning_rate": 0.00014986561820713775, "loss": 2.332, "step": 28728 }, { "epoch": 0.36, "learning_rate": 0.0001498400625475863, "loss": 2.3381, "step": 28736 }, { "epoch": 0.36, "learning_rate": 0.00014981450289230228, "loss": 2.3243, "step": 28744 }, { "epoch": 0.36, "learning_rate": 0.00014978893924384924, "loss": 2.3433, "step": 28752 }, { "epoch": 0.36, "learning_rate": 0.00014976337160479107, "loss": 2.3453, "step": 28760 }, { "epoch": 0.36, "learning_rate": 0.00014973779997769207, "loss": 2.334, "step": 28768 }, { "epoch": 0.36, "learning_rate": 0.00014971222436511688, "loss": 2.3379, "step": 28776 }, { "epoch": 0.36, "learning_rate": 0.00014968664476963054, "loss": 2.3375, "step": 28784 }, { "epoch": 0.36, "learning_rate": 0.0001496610611937987, "loss": 2.3479, "step": 28792 }, { "epoch": 0.36, "learning_rate": 0.00014963547364018712, "loss": 2.3551, "step": 28800 }, { "epoch": 0.36, "learning_rate": 0.00014960988211136207, "loss": 2.3474, "step": 28808 }, { "epoch": 0.36, "learning_rate": 0.00014958428660989036, "loss": 2.3363, "step": 28816 }, { "epoch": 0.36, "learning_rate": 0.00014955868713833895, "loss": 2.3387, "step": 28824 }, { "epoch": 0.36, "learning_rate": 0.0001495330836992754, "loss": 2.327, "step": 28832 }, { "epoch": 0.36, "learning_rate": 0.00014950747629526755, "loss": 2.3386, "step": 28840 }, { "epoch": 0.36, "learning_rate": 0.0001494818649288837, "loss": 2.3362, "step": 28848 }, { "epoch": 0.36, "learning_rate": 0.0001494562496026925, "loss": 2.3549, "step": 28856 }, { "epoch": 0.36, "learning_rate": 0.00014943063031926308, "loss": 2.3443, "step": 28864 }, { "epoch": 0.36, "learning_rate": 0.00014940500708116483, "loss": 2.3407, "step": 28872 }, { "epoch": 0.36, "learning_rate": 0.00014937937989096764, "loss": 2.3372, "step": 28880 }, { "epoch": 0.36, "learning_rate": 0.00014935374875124177, "loss": 2.3329, "step": 28888 }, { "epoch": 0.36, "learning_rate": 0.0001493281136645579, "loss": 2.3524, "step": 28896 }, { "epoch": 0.36, "learning_rate": 0.0001493024746334871, "loss": 2.3366, "step": 28904 }, { "epoch": 0.36, "learning_rate": 0.0001492768316606008, "loss": 2.3344, "step": 28912 }, { "epoch": 0.36, "learning_rate": 0.00014925118474847082, "loss": 2.3587, "step": 28920 }, { "epoch": 0.36, "learning_rate": 0.0001492255338996694, "loss": 2.3319, "step": 28928 }, { "epoch": 0.36, "learning_rate": 0.00014919987911676921, "loss": 2.3376, "step": 28936 }, { "epoch": 0.36, "learning_rate": 0.0001491742204023433, "loss": 2.3359, "step": 28944 }, { "epoch": 0.36, "learning_rate": 0.000149148557758965, "loss": 2.3534, "step": 28952 }, { "epoch": 0.36, "learning_rate": 0.00014912289118920822, "loss": 2.3306, "step": 28960 }, { "epoch": 0.36, "learning_rate": 0.00014909722069564714, "loss": 2.3442, "step": 28968 }, { "epoch": 0.36, "learning_rate": 0.00014907154628085632, "loss": 2.3387, "step": 28976 }, { "epoch": 0.36, "learning_rate": 0.00014904586794741088, "loss": 2.3303, "step": 28984 }, { "epoch": 0.36, "learning_rate": 0.00014902018569788608, "loss": 2.3572, "step": 28992 }, { "epoch": 0.36, "learning_rate": 0.00014899449953485774, "loss": 2.3339, "step": 29000 }, { "epoch": 0.36, "learning_rate": 0.00014896880946090204, "loss": 2.3472, "step": 29008 }, { "epoch": 0.36, "learning_rate": 0.0001489431154785956, "loss": 2.3409, "step": 29016 }, { "epoch": 0.36, "learning_rate": 0.00014891741759051532, "loss": 2.3505, "step": 29024 }, { "epoch": 0.36, "learning_rate": 0.0001488917157992386, "loss": 2.3222, "step": 29032 }, { "epoch": 0.36, "learning_rate": 0.00014886601010734312, "loss": 2.3337, "step": 29040 }, { "epoch": 0.36, "learning_rate": 0.0001488403005174071, "loss": 2.3479, "step": 29048 }, { "epoch": 0.36, "learning_rate": 0.00014881458703200896, "loss": 2.3243, "step": 29056 }, { "epoch": 0.36, "learning_rate": 0.0001487888696537277, "loss": 2.3342, "step": 29064 }, { "epoch": 0.36, "learning_rate": 0.00014876314838514266, "loss": 2.3166, "step": 29072 }, { "epoch": 0.36, "learning_rate": 0.0001487374232288334, "loss": 2.3249, "step": 29080 }, { "epoch": 0.36, "learning_rate": 0.00014871169418738013, "loss": 2.3302, "step": 29088 }, { "epoch": 0.36, "learning_rate": 0.00014868596126336328, "loss": 2.3495, "step": 29096 }, { "epoch": 0.36, "learning_rate": 0.00014866022445936372, "loss": 2.3304, "step": 29104 }, { "epoch": 0.36, "learning_rate": 0.0001486344837779627, "loss": 2.3214, "step": 29112 }, { "epoch": 0.36, "learning_rate": 0.00014860873922174187, "loss": 2.3299, "step": 29120 }, { "epoch": 0.36, "learning_rate": 0.0001485829907932833, "loss": 2.3484, "step": 29128 }, { "epoch": 0.36, "learning_rate": 0.00014855723849516934, "loss": 2.3348, "step": 29136 }, { "epoch": 0.36, "learning_rate": 0.00014853148232998284, "loss": 2.3215, "step": 29144 }, { "epoch": 0.36, "learning_rate": 0.00014850572230030702, "loss": 2.3235, "step": 29152 }, { "epoch": 0.36, "learning_rate": 0.0001484799584087254, "loss": 2.3429, "step": 29160 }, { "epoch": 0.36, "learning_rate": 0.00014845419065782203, "loss": 2.35, "step": 29168 }, { "epoch": 0.36, "learning_rate": 0.0001484284190501812, "loss": 2.3447, "step": 29176 }, { "epoch": 0.36, "learning_rate": 0.0001484026435883877, "loss": 2.3307, "step": 29184 }, { "epoch": 0.36, "learning_rate": 0.0001483768642750266, "loss": 2.3297, "step": 29192 }, { "epoch": 0.36, "learning_rate": 0.00014835108111268354, "loss": 2.3107, "step": 29200 }, { "epoch": 0.37, "learning_rate": 0.00014832529410394436, "loss": 2.3137, "step": 29208 }, { "epoch": 0.37, "learning_rate": 0.0001482995032513953, "loss": 2.3262, "step": 29216 }, { "epoch": 0.37, "learning_rate": 0.0001482737085576231, "loss": 2.3533, "step": 29224 }, { "epoch": 0.37, "learning_rate": 0.00014824791002521478, "loss": 2.3325, "step": 29232 }, { "epoch": 0.37, "learning_rate": 0.00014822210765675785, "loss": 2.3406, "step": 29240 }, { "epoch": 0.37, "learning_rate": 0.00014819630145484008, "loss": 2.3257, "step": 29248 }, { "epoch": 0.37, "learning_rate": 0.00014817049142204969, "loss": 2.3314, "step": 29256 }, { "epoch": 0.37, "learning_rate": 0.0001481446775609753, "loss": 2.3156, "step": 29264 }, { "epoch": 0.37, "learning_rate": 0.00014811885987420592, "loss": 2.3407, "step": 29272 }, { "epoch": 0.37, "learning_rate": 0.00014809303836433086, "loss": 2.3236, "step": 29280 }, { "epoch": 0.37, "learning_rate": 0.0001480672130339399, "loss": 2.3444, "step": 29288 }, { "epoch": 0.37, "learning_rate": 0.00014804138388562317, "loss": 2.3287, "step": 29296 }, { "epoch": 0.37, "learning_rate": 0.00014801555092197122, "loss": 2.3245, "step": 29304 }, { "epoch": 0.37, "learning_rate": 0.00014798971414557488, "loss": 2.3374, "step": 29312 }, { "epoch": 0.37, "learning_rate": 0.00014796387355902547, "loss": 2.3293, "step": 29320 }, { "epoch": 0.37, "learning_rate": 0.0001479380291649147, "loss": 2.3382, "step": 29328 }, { "epoch": 0.37, "learning_rate": 0.00014791218096583456, "loss": 2.3235, "step": 29336 }, { "epoch": 0.37, "learning_rate": 0.0001478863289643775, "loss": 2.3306, "step": 29344 }, { "epoch": 0.37, "learning_rate": 0.0001478604731631363, "loss": 2.3396, "step": 29352 }, { "epoch": 0.37, "learning_rate": 0.00014783461356470415, "loss": 2.3325, "step": 29360 }, { "epoch": 0.37, "learning_rate": 0.00014780875017167468, "loss": 2.3407, "step": 29368 }, { "epoch": 0.37, "learning_rate": 0.00014778288298664181, "loss": 2.3434, "step": 29376 }, { "epoch": 0.37, "learning_rate": 0.00014775701201219982, "loss": 2.3369, "step": 29384 }, { "epoch": 0.37, "learning_rate": 0.0001477311372509435, "loss": 2.3491, "step": 29392 }, { "epoch": 0.37, "learning_rate": 0.00014770525870546792, "loss": 2.3242, "step": 29400 }, { "epoch": 0.37, "learning_rate": 0.00014767937637836853, "loss": 2.3186, "step": 29408 }, { "epoch": 0.37, "learning_rate": 0.0001476534902722412, "loss": 2.3348, "step": 29416 }, { "epoch": 0.37, "learning_rate": 0.00014762760038968214, "loss": 2.3589, "step": 29424 }, { "epoch": 0.37, "learning_rate": 0.000147601706733288, "loss": 2.3274, "step": 29432 }, { "epoch": 0.37, "learning_rate": 0.0001475758093056557, "loss": 2.3279, "step": 29440 }, { "epoch": 0.37, "learning_rate": 0.00014754990810938266, "loss": 2.3216, "step": 29448 }, { "epoch": 0.37, "learning_rate": 0.00014752400314706657, "loss": 2.3277, "step": 29456 }, { "epoch": 0.37, "learning_rate": 0.00014749809442130566, "loss": 2.325, "step": 29464 }, { "epoch": 0.37, "learning_rate": 0.0001474721819346983, "loss": 2.318, "step": 29472 }, { "epoch": 0.37, "learning_rate": 0.00014744626568984344, "loss": 2.3395, "step": 29480 }, { "epoch": 0.37, "learning_rate": 0.0001474203456893403, "loss": 2.3437, "step": 29488 }, { "epoch": 0.37, "learning_rate": 0.00014739442193578852, "loss": 2.3328, "step": 29496 }, { "epoch": 0.37, "learning_rate": 0.00014736849443178812, "loss": 2.339, "step": 29504 }, { "epoch": 0.37, "learning_rate": 0.0001473425631799395, "loss": 2.3505, "step": 29512 }, { "epoch": 0.37, "learning_rate": 0.00014731662818284332, "loss": 2.3389, "step": 29520 }, { "epoch": 0.37, "learning_rate": 0.00014729068944310082, "loss": 2.3392, "step": 29528 }, { "epoch": 0.37, "learning_rate": 0.00014726474696331347, "loss": 2.3339, "step": 29536 }, { "epoch": 0.37, "learning_rate": 0.00014723880074608316, "loss": 2.3296, "step": 29544 }, { "epoch": 0.37, "learning_rate": 0.00014721285079401212, "loss": 2.3506, "step": 29552 }, { "epoch": 0.37, "learning_rate": 0.000147186897109703, "loss": 2.3408, "step": 29560 }, { "epoch": 0.37, "learning_rate": 0.00014716093969575886, "loss": 2.3333, "step": 29568 }, { "epoch": 0.37, "learning_rate": 0.00014713497855478299, "loss": 2.3327, "step": 29576 }, { "epoch": 0.37, "learning_rate": 0.00014710901368937922, "loss": 2.3382, "step": 29584 }, { "epoch": 0.37, "learning_rate": 0.00014708304510215162, "loss": 2.3124, "step": 29592 }, { "epoch": 0.37, "learning_rate": 0.00014705707279570477, "loss": 2.3373, "step": 29600 }, { "epoch": 0.37, "learning_rate": 0.00014703109677264344, "loss": 2.338, "step": 29608 }, { "epoch": 0.37, "learning_rate": 0.00014700511703557293, "loss": 2.3312, "step": 29616 }, { "epoch": 0.37, "learning_rate": 0.00014697913358709887, "loss": 2.3422, "step": 29624 }, { "epoch": 0.37, "learning_rate": 0.00014695314642982726, "loss": 2.3347, "step": 29632 }, { "epoch": 0.37, "learning_rate": 0.00014692715556636446, "loss": 2.3351, "step": 29640 }, { "epoch": 0.37, "learning_rate": 0.00014690116099931724, "loss": 2.3259, "step": 29648 }, { "epoch": 0.37, "learning_rate": 0.00014687516273129259, "loss": 2.334, "step": 29656 }, { "epoch": 0.37, "learning_rate": 0.0001468491607648981, "loss": 2.3336, "step": 29664 }, { "epoch": 0.37, "learning_rate": 0.00014682315510274155, "loss": 2.3478, "step": 29672 }, { "epoch": 0.37, "learning_rate": 0.0001467971457474312, "loss": 2.3421, "step": 29680 }, { "epoch": 0.37, "learning_rate": 0.0001467711327015757, "loss": 2.3377, "step": 29688 }, { "epoch": 0.37, "learning_rate": 0.0001467451159677839, "loss": 2.3256, "step": 29696 }, { "epoch": 0.37, "learning_rate": 0.00014671909554866516, "loss": 2.34, "step": 29704 }, { "epoch": 0.37, "learning_rate": 0.00014669307144682923, "loss": 2.3314, "step": 29712 }, { "epoch": 0.37, "learning_rate": 0.00014666704366488612, "loss": 2.3404, "step": 29720 }, { "epoch": 0.37, "learning_rate": 0.0001466410122054463, "loss": 2.3467, "step": 29728 }, { "epoch": 0.37, "learning_rate": 0.00014661497707112062, "loss": 2.3349, "step": 29736 }, { "epoch": 0.37, "learning_rate": 0.00014658893826452018, "loss": 2.3457, "step": 29744 }, { "epoch": 0.37, "learning_rate": 0.00014656289578825654, "loss": 2.3265, "step": 29752 }, { "epoch": 0.37, "learning_rate": 0.00014653684964494162, "loss": 2.3338, "step": 29760 }, { "epoch": 0.37, "learning_rate": 0.00014651079983718775, "loss": 2.3222, "step": 29768 }, { "epoch": 0.37, "learning_rate": 0.00014648474636760753, "loss": 2.3273, "step": 29776 }, { "epoch": 0.37, "learning_rate": 0.00014645868923881397, "loss": 2.3521, "step": 29784 }, { "epoch": 0.37, "learning_rate": 0.00014643262845342049, "loss": 2.3332, "step": 29792 }, { "epoch": 0.37, "learning_rate": 0.0001464065640140408, "loss": 2.3301, "step": 29800 }, { "epoch": 0.37, "learning_rate": 0.000146380495923289, "loss": 2.3247, "step": 29808 }, { "epoch": 0.37, "learning_rate": 0.00014635442418377964, "loss": 2.3303, "step": 29816 }, { "epoch": 0.37, "learning_rate": 0.00014632834879812755, "loss": 2.3413, "step": 29824 }, { "epoch": 0.37, "learning_rate": 0.00014630226976894789, "loss": 2.3486, "step": 29832 }, { "epoch": 0.37, "learning_rate": 0.00014627618709885627, "loss": 2.3395, "step": 29840 }, { "epoch": 0.37, "learning_rate": 0.00014625010079046864, "loss": 2.325, "step": 29848 }, { "epoch": 0.37, "learning_rate": 0.0001462240108464013, "loss": 2.3321, "step": 29856 }, { "epoch": 0.37, "learning_rate": 0.0001461979172692709, "loss": 2.3157, "step": 29864 }, { "epoch": 0.37, "learning_rate": 0.00014617182006169456, "loss": 2.3328, "step": 29872 }, { "epoch": 0.37, "learning_rate": 0.00014614571922628964, "loss": 2.3355, "step": 29880 }, { "epoch": 0.37, "learning_rate": 0.00014611961476567383, "loss": 2.3394, "step": 29888 }, { "epoch": 0.37, "learning_rate": 0.00014609350668246535, "loss": 2.3394, "step": 29896 }, { "epoch": 0.37, "learning_rate": 0.00014606739497928268, "loss": 2.3201, "step": 29904 }, { "epoch": 0.37, "learning_rate": 0.00014604127965874467, "loss": 2.3392, "step": 29912 }, { "epoch": 0.37, "learning_rate": 0.00014601516072347052, "loss": 2.3644, "step": 29920 }, { "epoch": 0.37, "learning_rate": 0.00014598903817607982, "loss": 2.344, "step": 29928 }, { "epoch": 0.37, "learning_rate": 0.00014596291201919253, "loss": 2.335, "step": 29936 }, { "epoch": 0.37, "learning_rate": 0.00014593678225542894, "loss": 2.3298, "step": 29944 }, { "epoch": 0.37, "learning_rate": 0.0001459106488874097, "loss": 2.3384, "step": 29952 }, { "epoch": 0.37, "learning_rate": 0.00014588451191775587, "loss": 2.3236, "step": 29960 }, { "epoch": 0.37, "learning_rate": 0.0001458583713490888, "loss": 2.3433, "step": 29968 }, { "epoch": 0.37, "learning_rate": 0.0001458322271840303, "loss": 2.3322, "step": 29976 }, { "epoch": 0.37, "learning_rate": 0.00014580607942520242, "loss": 2.3439, "step": 29984 }, { "epoch": 0.37, "learning_rate": 0.0001457799280752277, "loss": 2.3376, "step": 29992 }, { "epoch": 0.38, "learning_rate": 0.00014575377313672894, "loss": 2.334, "step": 30000 }, { "epoch": 0.38, "learning_rate": 0.0001457276146123293, "loss": 2.346, "step": 30008 }, { "epoch": 0.38, "learning_rate": 0.00014570145250465238, "loss": 2.3478, "step": 30016 }, { "epoch": 0.38, "learning_rate": 0.00014567528681632203, "loss": 2.3316, "step": 30024 }, { "epoch": 0.38, "learning_rate": 0.00014564911754996258, "loss": 2.3405, "step": 30032 }, { "epoch": 0.38, "learning_rate": 0.00014562294470819864, "loss": 2.348, "step": 30040 }, { "epoch": 0.38, "learning_rate": 0.0001455967682936552, "loss": 2.335, "step": 30048 }, { "epoch": 0.38, "learning_rate": 0.0001455705883089576, "loss": 2.35, "step": 30056 }, { "epoch": 0.38, "learning_rate": 0.00014554440475673155, "loss": 2.3286, "step": 30064 }, { "epoch": 0.38, "learning_rate": 0.0001455182176396031, "loss": 2.3412, "step": 30072 }, { "epoch": 0.38, "learning_rate": 0.0001454920269601987, "loss": 2.3289, "step": 30080 }, { "epoch": 0.38, "learning_rate": 0.00014546583272114508, "loss": 2.3202, "step": 30088 }, { "epoch": 0.38, "learning_rate": 0.0001454396349250694, "loss": 2.3399, "step": 30096 }, { "epoch": 0.38, "learning_rate": 0.00014541343357459915, "loss": 2.3324, "step": 30104 }, { "epoch": 0.38, "learning_rate": 0.00014538722867236218, "loss": 2.3385, "step": 30112 }, { "epoch": 0.38, "learning_rate": 0.0001453610202209867, "loss": 2.3492, "step": 30120 }, { "epoch": 0.38, "learning_rate": 0.00014533480822310124, "loss": 2.3365, "step": 30128 }, { "epoch": 0.38, "learning_rate": 0.00014530859268133475, "loss": 2.3304, "step": 30136 }, { "epoch": 0.38, "learning_rate": 0.00014528237359831648, "loss": 2.3142, "step": 30144 }, { "epoch": 0.38, "learning_rate": 0.00014525615097667603, "loss": 2.3339, "step": 30152 }, { "epoch": 0.38, "learning_rate": 0.00014522992481904345, "loss": 2.3159, "step": 30160 }, { "epoch": 0.38, "learning_rate": 0.000145203695128049, "loss": 2.3171, "step": 30168 }, { "epoch": 0.38, "learning_rate": 0.00014517746190632343, "loss": 2.3399, "step": 30176 }, { "epoch": 0.38, "learning_rate": 0.00014515122515649777, "loss": 2.3326, "step": 30184 }, { "epoch": 0.38, "learning_rate": 0.00014512498488120337, "loss": 2.3464, "step": 30192 }, { "epoch": 0.38, "learning_rate": 0.00014509874108307205, "loss": 2.3256, "step": 30200 }, { "epoch": 0.38, "learning_rate": 0.00014507249376473585, "loss": 2.342, "step": 30208 }, { "epoch": 0.38, "learning_rate": 0.00014504624292882728, "loss": 2.3033, "step": 30216 }, { "epoch": 0.38, "learning_rate": 0.00014501998857797908, "loss": 2.3319, "step": 30224 }, { "epoch": 0.38, "learning_rate": 0.0001449937307148245, "loss": 2.322, "step": 30232 }, { "epoch": 0.38, "learning_rate": 0.000144967469341997, "loss": 2.3478, "step": 30240 }, { "epoch": 0.38, "learning_rate": 0.0001449412044621305, "loss": 2.3316, "step": 30248 }, { "epoch": 0.38, "learning_rate": 0.00014491493607785916, "loss": 2.3201, "step": 30256 }, { "epoch": 0.38, "learning_rate": 0.00014488866419181754, "loss": 2.3326, "step": 30264 }, { "epoch": 0.38, "learning_rate": 0.00014486238880664063, "loss": 2.3317, "step": 30272 }, { "epoch": 0.38, "learning_rate": 0.00014483610992496363, "loss": 2.3521, "step": 30280 }, { "epoch": 0.38, "learning_rate": 0.00014480982754942222, "loss": 2.353, "step": 30288 }, { "epoch": 0.38, "learning_rate": 0.00014478354168265235, "loss": 2.3476, "step": 30296 }, { "epoch": 0.38, "learning_rate": 0.00014475725232729032, "loss": 2.3191, "step": 30304 }, { "epoch": 0.38, "learning_rate": 0.00014473095948597286, "loss": 2.315, "step": 30312 }, { "epoch": 0.38, "learning_rate": 0.00014470466316133696, "loss": 2.3267, "step": 30320 }, { "epoch": 0.38, "learning_rate": 0.00014467836335601994, "loss": 2.3145, "step": 30328 }, { "epoch": 0.38, "learning_rate": 0.00014465206007265963, "loss": 2.3269, "step": 30336 }, { "epoch": 0.38, "learning_rate": 0.00014462575331389402, "loss": 2.3471, "step": 30344 }, { "epoch": 0.38, "learning_rate": 0.00014459944308236157, "loss": 2.3319, "step": 30352 }, { "epoch": 0.38, "learning_rate": 0.000144573129380701, "loss": 2.3414, "step": 30360 }, { "epoch": 0.38, "learning_rate": 0.0001445468122115515, "loss": 2.3323, "step": 30368 }, { "epoch": 0.38, "learning_rate": 0.00014452049157755243, "loss": 2.3348, "step": 30376 }, { "epoch": 0.38, "learning_rate": 0.0001444941674813437, "loss": 2.3375, "step": 30384 }, { "epoch": 0.38, "learning_rate": 0.00014446783992556542, "loss": 2.3368, "step": 30392 }, { "epoch": 0.38, "learning_rate": 0.00014444150891285807, "loss": 2.3473, "step": 30400 }, { "epoch": 0.38, "learning_rate": 0.0001444151744458626, "loss": 2.3309, "step": 30408 }, { "epoch": 0.38, "learning_rate": 0.0001443888365272201, "loss": 2.3415, "step": 30416 }, { "epoch": 0.38, "learning_rate": 0.00014436249515957213, "loss": 2.3244, "step": 30424 }, { "epoch": 0.38, "learning_rate": 0.0001443361503455606, "loss": 2.3226, "step": 30432 }, { "epoch": 0.38, "learning_rate": 0.00014430980208782781, "loss": 2.3234, "step": 30440 }, { "epoch": 0.38, "learning_rate": 0.00014428345038901627, "loss": 2.3263, "step": 30448 }, { "epoch": 0.38, "learning_rate": 0.00014425709525176889, "loss": 2.3313, "step": 30456 }, { "epoch": 0.38, "learning_rate": 0.00014423073667872892, "loss": 2.3595, "step": 30464 }, { "epoch": 0.38, "learning_rate": 0.00014420437467254008, "loss": 2.3352, "step": 30472 }, { "epoch": 0.38, "learning_rate": 0.0001441780092358463, "loss": 2.3284, "step": 30480 }, { "epoch": 0.38, "learning_rate": 0.00014415164037129182, "loss": 2.3267, "step": 30488 }, { "epoch": 0.38, "learning_rate": 0.00014412526808152133, "loss": 2.3277, "step": 30496 }, { "epoch": 0.38, "learning_rate": 0.00014409889236917983, "loss": 2.3253, "step": 30504 }, { "epoch": 0.38, "learning_rate": 0.0001440725132369126, "loss": 2.3273, "step": 30512 }, { "epoch": 0.38, "learning_rate": 0.00014404613068736539, "loss": 2.3413, "step": 30520 }, { "epoch": 0.38, "learning_rate": 0.00014401974472318417, "loss": 2.3401, "step": 30528 }, { "epoch": 0.38, "learning_rate": 0.00014399335534701535, "loss": 2.3177, "step": 30536 }, { "epoch": 0.38, "learning_rate": 0.0001439669625615056, "loss": 2.3336, "step": 30544 }, { "epoch": 0.38, "learning_rate": 0.00014394056636930194, "loss": 2.2879, "step": 30552 }, { "epoch": 0.38, "learning_rate": 0.00014391416677305183, "loss": 2.3249, "step": 30560 }, { "epoch": 0.38, "learning_rate": 0.00014388776377540294, "loss": 2.3318, "step": 30568 }, { "epoch": 0.38, "learning_rate": 0.00014386135737900338, "loss": 2.3436, "step": 30576 }, { "epoch": 0.38, "learning_rate": 0.0001438349475865015, "loss": 2.3322, "step": 30584 }, { "epoch": 0.38, "learning_rate": 0.00014380853440054616, "loss": 2.3301, "step": 30592 }, { "epoch": 0.38, "learning_rate": 0.00014378211782378633, "loss": 2.3403, "step": 30600 }, { "epoch": 0.38, "learning_rate": 0.00014375569785887154, "loss": 2.3475, "step": 30608 }, { "epoch": 0.38, "learning_rate": 0.00014372927450845153, "loss": 2.323, "step": 30616 }, { "epoch": 0.38, "learning_rate": 0.00014370284777517637, "loss": 2.3429, "step": 30624 }, { "epoch": 0.38, "learning_rate": 0.00014367641766169654, "loss": 2.3332, "step": 30632 }, { "epoch": 0.38, "learning_rate": 0.0001436499841706629, "loss": 2.3243, "step": 30640 }, { "epoch": 0.38, "learning_rate": 0.00014362354730472647, "loss": 2.3246, "step": 30648 }, { "epoch": 0.38, "learning_rate": 0.00014359710706653882, "loss": 2.3242, "step": 30656 }, { "epoch": 0.38, "learning_rate": 0.00014357066345875165, "loss": 2.3182, "step": 30664 }, { "epoch": 0.38, "learning_rate": 0.00014354421648401716, "loss": 2.3333, "step": 30672 }, { "epoch": 0.38, "learning_rate": 0.00014351776614498785, "loss": 2.3454, "step": 30680 }, { "epoch": 0.38, "learning_rate": 0.0001434913124443165, "loss": 2.3311, "step": 30688 }, { "epoch": 0.38, "learning_rate": 0.00014346485538465633, "loss": 2.34, "step": 30696 }, { "epoch": 0.38, "learning_rate": 0.00014343839496866074, "loss": 2.3112, "step": 30704 }, { "epoch": 0.38, "learning_rate": 0.0001434119311989836, "loss": 2.3262, "step": 30712 }, { "epoch": 0.38, "learning_rate": 0.0001433854640782791, "loss": 2.3146, "step": 30720 }, { "epoch": 0.38, "learning_rate": 0.00014335899360920176, "loss": 2.335, "step": 30728 }, { "epoch": 0.38, "learning_rate": 0.0001433325197944063, "loss": 2.3279, "step": 30736 }, { "epoch": 0.38, "learning_rate": 0.00014330604263654807, "loss": 2.3299, "step": 30744 }, { "epoch": 0.38, "learning_rate": 0.00014327956213828244, "loss": 2.3252, "step": 30752 }, { "epoch": 0.38, "learning_rate": 0.0001432530783022653, "loss": 2.3326, "step": 30760 }, { "epoch": 0.38, "learning_rate": 0.00014322659113115283, "loss": 2.3351, "step": 30768 }, { "epoch": 0.38, "learning_rate": 0.00014320010062760153, "loss": 2.3142, "step": 30776 }, { "epoch": 0.38, "learning_rate": 0.00014317360679426828, "loss": 2.3354, "step": 30784 }, { "epoch": 0.38, "learning_rate": 0.00014314710963381024, "loss": 2.3315, "step": 30792 }, { "epoch": 0.39, "learning_rate": 0.00014312060914888492, "loss": 2.3304, "step": 30800 }, { "epoch": 0.39, "learning_rate": 0.00014309410534215017, "loss": 2.3285, "step": 30808 }, { "epoch": 0.39, "learning_rate": 0.00014306759821626415, "loss": 2.3338, "step": 30816 }, { "epoch": 0.39, "learning_rate": 0.00014304108777388546, "loss": 2.3328, "step": 30824 }, { "epoch": 0.39, "learning_rate": 0.00014301457401767287, "loss": 2.3262, "step": 30832 }, { "epoch": 0.39, "learning_rate": 0.00014298805695028556, "loss": 2.3694, "step": 30840 }, { "epoch": 0.39, "learning_rate": 0.00014296153657438306, "loss": 2.3391, "step": 30848 }, { "epoch": 0.39, "learning_rate": 0.0001429350128926252, "loss": 2.3307, "step": 30856 }, { "epoch": 0.39, "learning_rate": 0.00014290848590767222, "loss": 2.3472, "step": 30864 }, { "epoch": 0.39, "learning_rate": 0.0001428819556221845, "loss": 2.3372, "step": 30872 }, { "epoch": 0.39, "learning_rate": 0.000142855422038823, "loss": 2.3245, "step": 30880 }, { "epoch": 0.39, "learning_rate": 0.00014282888516024882, "loss": 2.3338, "step": 30888 }, { "epoch": 0.39, "learning_rate": 0.0001428023449891235, "loss": 2.3499, "step": 30896 }, { "epoch": 0.39, "learning_rate": 0.0001427758015281088, "loss": 2.3538, "step": 30904 }, { "epoch": 0.39, "learning_rate": 0.00014274925477986695, "loss": 2.3487, "step": 30912 }, { "epoch": 0.39, "learning_rate": 0.00014272270474706045, "loss": 2.3325, "step": 30920 }, { "epoch": 0.39, "learning_rate": 0.00014269615143235205, "loss": 2.3428, "step": 30928 }, { "epoch": 0.39, "learning_rate": 0.0001426695948384049, "loss": 2.336, "step": 30936 }, { "epoch": 0.39, "learning_rate": 0.0001426430349678825, "loss": 2.3348, "step": 30944 }, { "epoch": 0.39, "learning_rate": 0.0001426164718234487, "loss": 2.3212, "step": 30952 }, { "epoch": 0.39, "learning_rate": 0.0001425899054077676, "loss": 2.3392, "step": 30960 }, { "epoch": 0.39, "learning_rate": 0.00014256333572350361, "loss": 2.3245, "step": 30968 }, { "epoch": 0.39, "learning_rate": 0.0001425367627733216, "loss": 2.3066, "step": 30976 }, { "epoch": 0.39, "learning_rate": 0.00014251018655988661, "loss": 2.336, "step": 30984 }, { "epoch": 0.39, "learning_rate": 0.00014248360708586413, "loss": 2.3472, "step": 30992 }, { "epoch": 0.39, "learning_rate": 0.00014245702435391992, "loss": 2.3399, "step": 31000 }, { "epoch": 0.39, "learning_rate": 0.00014243043836672012, "loss": 2.3288, "step": 31008 }, { "epoch": 0.39, "learning_rate": 0.00014240384912693105, "loss": 2.3253, "step": 31016 }, { "epoch": 0.39, "learning_rate": 0.00014237725663721957, "loss": 2.3653, "step": 31024 }, { "epoch": 0.39, "learning_rate": 0.00014235066090025267, "loss": 2.3518, "step": 31032 }, { "epoch": 0.39, "learning_rate": 0.00014232406191869783, "loss": 2.3105, "step": 31040 }, { "epoch": 0.39, "learning_rate": 0.00014229745969522272, "loss": 2.3407, "step": 31048 }, { "epoch": 0.39, "learning_rate": 0.00014227085423249545, "loss": 2.3451, "step": 31056 }, { "epoch": 0.39, "learning_rate": 0.00014224424553318428, "loss": 2.337, "step": 31064 }, { "epoch": 0.39, "learning_rate": 0.00014221763359995805, "loss": 2.3458, "step": 31072 }, { "epoch": 0.39, "learning_rate": 0.00014219101843548568, "loss": 2.3316, "step": 31080 }, { "epoch": 0.39, "learning_rate": 0.0001421644000424366, "loss": 2.3445, "step": 31088 }, { "epoch": 0.39, "learning_rate": 0.00014213777842348043, "loss": 2.3446, "step": 31096 }, { "epoch": 0.39, "learning_rate": 0.00014211115358128722, "loss": 2.3419, "step": 31104 }, { "epoch": 0.39, "learning_rate": 0.00014208452551852722, "loss": 2.3441, "step": 31112 }, { "epoch": 0.39, "learning_rate": 0.00014205789423787113, "loss": 2.3363, "step": 31120 }, { "epoch": 0.39, "learning_rate": 0.0001420312597419899, "loss": 2.3372, "step": 31128 }, { "epoch": 0.39, "learning_rate": 0.00014200462203355478, "loss": 2.3237, "step": 31136 }, { "epoch": 0.39, "learning_rate": 0.00014197798111523747, "loss": 2.3379, "step": 31144 }, { "epoch": 0.39, "learning_rate": 0.00014195133698970984, "loss": 2.3358, "step": 31152 }, { "epoch": 0.39, "learning_rate": 0.00014192468965964412, "loss": 2.3271, "step": 31160 }, { "epoch": 0.39, "learning_rate": 0.00014189803912771293, "loss": 2.3326, "step": 31168 }, { "epoch": 0.39, "learning_rate": 0.0001418713853965892, "loss": 2.3544, "step": 31176 }, { "epoch": 0.39, "learning_rate": 0.0001418447284689461, "loss": 2.3409, "step": 31184 }, { "epoch": 0.39, "learning_rate": 0.00014181806834745713, "loss": 2.3238, "step": 31192 }, { "epoch": 0.39, "learning_rate": 0.00014179140503479623, "loss": 2.3243, "step": 31200 }, { "epoch": 0.39, "learning_rate": 0.00014176473853363755, "loss": 2.3351, "step": 31208 }, { "epoch": 0.39, "learning_rate": 0.00014173806884665557, "loss": 2.334, "step": 31216 }, { "epoch": 0.39, "learning_rate": 0.00014171139597652513, "loss": 2.3482, "step": 31224 }, { "epoch": 0.39, "learning_rate": 0.00014168471992592136, "loss": 2.3243, "step": 31232 }, { "epoch": 0.39, "learning_rate": 0.00014165804069751973, "loss": 2.3527, "step": 31240 }, { "epoch": 0.39, "learning_rate": 0.00014163135829399598, "loss": 2.3315, "step": 31248 }, { "epoch": 0.39, "learning_rate": 0.00014160467271802623, "loss": 2.3231, "step": 31256 }, { "epoch": 0.39, "learning_rate": 0.00014157798397228689, "loss": 2.3578, "step": 31264 }, { "epoch": 0.39, "learning_rate": 0.0001415512920594547, "loss": 2.3275, "step": 31272 }, { "epoch": 0.39, "learning_rate": 0.0001415245969822067, "loss": 2.3344, "step": 31280 }, { "epoch": 0.39, "learning_rate": 0.00014149789874322023, "loss": 2.3109, "step": 31288 }, { "epoch": 0.39, "learning_rate": 0.000141471197345173, "loss": 2.3177, "step": 31296 }, { "epoch": 0.39, "learning_rate": 0.00014144449279074298, "loss": 2.332, "step": 31304 }, { "epoch": 0.39, "learning_rate": 0.00014141778508260853, "loss": 2.3502, "step": 31312 }, { "epoch": 0.39, "learning_rate": 0.00014139107422344829, "loss": 2.3215, "step": 31320 }, { "epoch": 0.39, "learning_rate": 0.00014136436021594114, "loss": 2.3411, "step": 31328 }, { "epoch": 0.39, "learning_rate": 0.00014133764306276637, "loss": 2.3346, "step": 31336 }, { "epoch": 0.39, "learning_rate": 0.0001413109227666036, "loss": 2.3291, "step": 31344 }, { "epoch": 0.39, "learning_rate": 0.00014128419933013268, "loss": 2.325, "step": 31352 }, { "epoch": 0.39, "learning_rate": 0.00014125747275603386, "loss": 2.3407, "step": 31360 }, { "epoch": 0.39, "learning_rate": 0.00014123074304698757, "loss": 2.3422, "step": 31368 }, { "epoch": 0.39, "learning_rate": 0.00014120401020567476, "loss": 2.319, "step": 31376 }, { "epoch": 0.39, "learning_rate": 0.00014117727423477652, "loss": 2.3368, "step": 31384 }, { "epoch": 0.39, "learning_rate": 0.00014115053513697438, "loss": 2.3233, "step": 31392 }, { "epoch": 0.39, "learning_rate": 0.00014112379291495003, "loss": 2.3315, "step": 31400 }, { "epoch": 0.39, "learning_rate": 0.00014109704757138565, "loss": 2.3328, "step": 31408 }, { "epoch": 0.39, "learning_rate": 0.00014107029910896354, "loss": 2.3139, "step": 31416 }, { "epoch": 0.39, "learning_rate": 0.00014104354753036654, "loss": 2.3181, "step": 31424 }, { "epoch": 0.39, "learning_rate": 0.0001410167928382776, "loss": 2.3383, "step": 31432 }, { "epoch": 0.39, "learning_rate": 0.00014099003503538008, "loss": 2.3449, "step": 31440 }, { "epoch": 0.39, "learning_rate": 0.00014096327412435765, "loss": 2.3204, "step": 31448 }, { "epoch": 0.39, "learning_rate": 0.00014093651010789433, "loss": 2.3385, "step": 31456 }, { "epoch": 0.39, "learning_rate": 0.00014090974298867426, "loss": 2.3069, "step": 31464 }, { "epoch": 0.39, "learning_rate": 0.00014088297276938213, "loss": 2.3453, "step": 31472 }, { "epoch": 0.39, "learning_rate": 0.00014085619945270288, "loss": 2.3164, "step": 31480 }, { "epoch": 0.39, "learning_rate": 0.0001408294230413216, "loss": 2.3504, "step": 31488 }, { "epoch": 0.39, "learning_rate": 0.00014080264353792392, "loss": 2.3526, "step": 31496 }, { "epoch": 0.39, "learning_rate": 0.00014077586094519558, "loss": 2.3364, "step": 31504 }, { "epoch": 0.39, "learning_rate": 0.0001407490752658228, "loss": 2.3284, "step": 31512 }, { "epoch": 0.39, "learning_rate": 0.00014072228650249203, "loss": 2.3399, "step": 31520 }, { "epoch": 0.39, "learning_rate": 0.00014069549465789001, "loss": 2.3218, "step": 31528 }, { "epoch": 0.39, "learning_rate": 0.0001406686997347038, "loss": 2.3116, "step": 31536 }, { "epoch": 0.39, "learning_rate": 0.00014064190173562074, "loss": 2.3341, "step": 31544 }, { "epoch": 0.39, "learning_rate": 0.0001406151006633286, "loss": 2.3373, "step": 31552 }, { "epoch": 0.39, "learning_rate": 0.00014058829652051534, "loss": 2.3532, "step": 31560 }, { "epoch": 0.39, "learning_rate": 0.00014056148930986922, "loss": 2.3232, "step": 31568 }, { "epoch": 0.39, "learning_rate": 0.00014053467903407893, "loss": 2.3351, "step": 31576 }, { "epoch": 0.39, "learning_rate": 0.00014050786569583335, "loss": 2.359, "step": 31584 }, { "epoch": 0.39, "learning_rate": 0.0001404810492978217, "loss": 2.3445, "step": 31592 }, { "epoch": 0.4, "learning_rate": 0.00014045422984273353, "loss": 2.3469, "step": 31600 }, { "epoch": 0.4, "learning_rate": 0.00014042740733325866, "loss": 2.3274, "step": 31608 }, { "epoch": 0.4, "learning_rate": 0.00014040058177208726, "loss": 2.345, "step": 31616 }, { "epoch": 0.4, "learning_rate": 0.00014037375316190974, "loss": 2.3238, "step": 31624 }, { "epoch": 0.4, "learning_rate": 0.00014034692150541696, "loss": 2.3124, "step": 31632 }, { "epoch": 0.4, "learning_rate": 0.0001403200868052998, "loss": 2.3365, "step": 31640 }, { "epoch": 0.4, "learning_rate": 0.00014029324906424982, "loss": 2.3329, "step": 31648 }, { "epoch": 0.4, "learning_rate": 0.00014026640828495855, "loss": 2.317, "step": 31656 }, { "epoch": 0.4, "learning_rate": 0.0001402395644701181, "loss": 2.3134, "step": 31664 }, { "epoch": 0.4, "learning_rate": 0.0001402127176224206, "loss": 2.3412, "step": 31672 }, { "epoch": 0.4, "learning_rate": 0.00014018586774455874, "loss": 2.3381, "step": 31680 }, { "epoch": 0.4, "learning_rate": 0.00014015901483922539, "loss": 2.3443, "step": 31688 }, { "epoch": 0.4, "learning_rate": 0.00014013215890911377, "loss": 2.3181, "step": 31696 }, { "epoch": 0.4, "learning_rate": 0.0001401052999569173, "loss": 2.3193, "step": 31704 }, { "epoch": 0.4, "learning_rate": 0.00014007843798532989, "loss": 2.3436, "step": 31712 }, { "epoch": 0.4, "learning_rate": 0.00014005157299704557, "loss": 2.3367, "step": 31720 }, { "epoch": 0.4, "learning_rate": 0.00014002470499475874, "loss": 2.3267, "step": 31728 }, { "epoch": 0.4, "learning_rate": 0.00013999783398116415, "loss": 2.3431, "step": 31736 }, { "epoch": 0.4, "learning_rate": 0.00013997095995895676, "loss": 2.3532, "step": 31744 }, { "epoch": 0.4, "learning_rate": 0.00013994408293083193, "loss": 2.3009, "step": 31752 }, { "epoch": 0.4, "learning_rate": 0.00013991720289948525, "loss": 2.334, "step": 31760 }, { "epoch": 0.4, "learning_rate": 0.00013989031986761264, "loss": 2.3417, "step": 31768 }, { "epoch": 0.4, "learning_rate": 0.00013986343383791028, "loss": 2.336, "step": 31776 }, { "epoch": 0.4, "learning_rate": 0.0001398365448130748, "loss": 2.3165, "step": 31784 }, { "epoch": 0.4, "learning_rate": 0.00013980965279580286, "loss": 2.3326, "step": 31792 }, { "epoch": 0.4, "learning_rate": 0.0001397827577887917, "loss": 2.3231, "step": 31800 }, { "epoch": 0.4, "learning_rate": 0.00013975585979473872, "loss": 2.3396, "step": 31808 }, { "epoch": 0.4, "learning_rate": 0.00013972895881634155, "loss": 2.3193, "step": 31816 }, { "epoch": 0.4, "learning_rate": 0.00013970205485629825, "loss": 2.3241, "step": 31824 }, { "epoch": 0.4, "learning_rate": 0.0001396751479173072, "loss": 2.3285, "step": 31832 }, { "epoch": 0.4, "learning_rate": 0.00013964823800206698, "loss": 2.3439, "step": 31840 }, { "epoch": 0.4, "learning_rate": 0.00013962132511327643, "loss": 2.3081, "step": 31848 }, { "epoch": 0.4, "learning_rate": 0.00013959440925363482, "loss": 2.3452, "step": 31856 }, { "epoch": 0.4, "learning_rate": 0.00013956749042584167, "loss": 2.3261, "step": 31864 }, { "epoch": 0.4, "learning_rate": 0.00013954056863259677, "loss": 2.323, "step": 31872 }, { "epoch": 0.4, "learning_rate": 0.00013951364387660022, "loss": 2.3443, "step": 31880 }, { "epoch": 0.4, "learning_rate": 0.0001394867161605524, "loss": 2.3251, "step": 31888 }, { "epoch": 0.4, "learning_rate": 0.0001394597854871541, "loss": 2.3408, "step": 31896 }, { "epoch": 0.4, "learning_rate": 0.0001394328518591062, "loss": 2.3175, "step": 31904 }, { "epoch": 0.4, "learning_rate": 0.00013940591527911, "loss": 2.3375, "step": 31912 }, { "epoch": 0.4, "learning_rate": 0.00013937897574986714, "loss": 2.3308, "step": 31920 }, { "epoch": 0.4, "learning_rate": 0.0001393520332740795, "loss": 2.3262, "step": 31928 }, { "epoch": 0.4, "learning_rate": 0.00013932508785444926, "loss": 2.3275, "step": 31936 }, { "epoch": 0.4, "learning_rate": 0.00013929813949367884, "loss": 2.3295, "step": 31944 }, { "epoch": 0.4, "learning_rate": 0.00013927118819447105, "loss": 2.3114, "step": 31952 }, { "epoch": 0.4, "learning_rate": 0.00013924423395952893, "loss": 2.3261, "step": 31960 }, { "epoch": 0.4, "learning_rate": 0.00013921727679155584, "loss": 2.3264, "step": 31968 }, { "epoch": 0.4, "learning_rate": 0.00013919031669325547, "loss": 2.3457, "step": 31976 }, { "epoch": 0.4, "learning_rate": 0.00013916335366733176, "loss": 2.3238, "step": 31984 }, { "epoch": 0.4, "learning_rate": 0.00013913638771648892, "loss": 2.3341, "step": 31992 }, { "epoch": 0.4, "learning_rate": 0.00013910941884343143, "loss": 2.3246, "step": 32000 }, { "epoch": 0.4, "learning_rate": 0.00013908244705086422, "loss": 2.3329, "step": 32008 }, { "epoch": 0.4, "learning_rate": 0.00013905547234149235, "loss": 2.3328, "step": 32016 }, { "epoch": 0.4, "learning_rate": 0.00013902849471802127, "loss": 2.3505, "step": 32024 }, { "epoch": 0.4, "learning_rate": 0.00013900151418315662, "loss": 2.3239, "step": 32032 }, { "epoch": 0.4, "learning_rate": 0.0001389745307396044, "loss": 2.325, "step": 32040 }, { "epoch": 0.4, "learning_rate": 0.000138947544390071, "loss": 2.3463, "step": 32048 }, { "epoch": 0.4, "learning_rate": 0.00013892055513726285, "loss": 2.3161, "step": 32056 }, { "epoch": 0.4, "learning_rate": 0.00013889356298388693, "loss": 2.3579, "step": 32064 }, { "epoch": 0.4, "learning_rate": 0.00013886656793265037, "loss": 2.3374, "step": 32072 }, { "epoch": 0.4, "learning_rate": 0.00013883956998626059, "loss": 2.3137, "step": 32080 }, { "epoch": 0.4, "learning_rate": 0.00013881256914742538, "loss": 2.3509, "step": 32088 }, { "epoch": 0.4, "learning_rate": 0.00013878556541885274, "loss": 2.3303, "step": 32096 }, { "epoch": 0.4, "learning_rate": 0.000138758558803251, "loss": 2.3307, "step": 32104 }, { "epoch": 0.4, "learning_rate": 0.00013873154930332872, "loss": 2.3458, "step": 32112 }, { "epoch": 0.4, "learning_rate": 0.0001387045369217949, "loss": 2.3421, "step": 32120 }, { "epoch": 0.4, "learning_rate": 0.00013867752166135867, "loss": 2.3328, "step": 32128 }, { "epoch": 0.4, "learning_rate": 0.0001386505035247295, "loss": 2.334, "step": 32136 }, { "epoch": 0.4, "learning_rate": 0.00013862348251461715, "loss": 2.3206, "step": 32144 }, { "epoch": 0.4, "learning_rate": 0.00013859645863373169, "loss": 2.3406, "step": 32152 }, { "epoch": 0.4, "learning_rate": 0.00013856943188478353, "loss": 2.3326, "step": 32160 }, { "epoch": 0.4, "learning_rate": 0.0001385424022704832, "loss": 2.3113, "step": 32168 }, { "epoch": 0.4, "learning_rate": 0.00013851536979354162, "loss": 2.3309, "step": 32176 }, { "epoch": 0.4, "learning_rate": 0.00013848833445667007, "loss": 2.3261, "step": 32184 }, { "epoch": 0.4, "learning_rate": 0.00013846129626257997, "loss": 2.3318, "step": 32192 }, { "epoch": 0.4, "learning_rate": 0.00013843425521398316, "loss": 2.3548, "step": 32200 }, { "epoch": 0.4, "learning_rate": 0.00013840721131359166, "loss": 2.3158, "step": 32208 }, { "epoch": 0.4, "learning_rate": 0.0001383801645641178, "loss": 2.3342, "step": 32216 }, { "epoch": 0.4, "learning_rate": 0.00013835311496827423, "loss": 2.3466, "step": 32224 }, { "epoch": 0.4, "learning_rate": 0.00013832606252877394, "loss": 2.3309, "step": 32232 }, { "epoch": 0.4, "learning_rate": 0.00013829900724833007, "loss": 2.3539, "step": 32240 }, { "epoch": 0.4, "learning_rate": 0.0001382719491296561, "loss": 2.3271, "step": 32248 }, { "epoch": 0.4, "learning_rate": 0.00013824488817546583, "loss": 2.3247, "step": 32256 }, { "epoch": 0.4, "learning_rate": 0.00013821782438847336, "loss": 2.3313, "step": 32264 }, { "epoch": 0.4, "learning_rate": 0.00013819075777139297, "loss": 2.3321, "step": 32272 }, { "epoch": 0.4, "learning_rate": 0.00013816368832693932, "loss": 2.3606, "step": 32280 }, { "epoch": 0.4, "learning_rate": 0.0001381366160578273, "loss": 2.3352, "step": 32288 }, { "epoch": 0.4, "learning_rate": 0.0001381095409667721, "loss": 2.3224, "step": 32296 }, { "epoch": 0.4, "learning_rate": 0.0001380824630564893, "loss": 2.3289, "step": 32304 }, { "epoch": 0.4, "learning_rate": 0.00013805538232969448, "loss": 2.3364, "step": 32312 }, { "epoch": 0.4, "learning_rate": 0.00013802829878910384, "loss": 2.3251, "step": 32320 }, { "epoch": 0.4, "learning_rate": 0.00013800121243743365, "loss": 2.3284, "step": 32328 }, { "epoch": 0.4, "learning_rate": 0.0001379741232774005, "loss": 2.3512, "step": 32336 }, { "epoch": 0.4, "learning_rate": 0.00013794703131172128, "loss": 2.326, "step": 32344 }, { "epoch": 0.4, "learning_rate": 0.00013791993654311318, "loss": 2.3519, "step": 32352 }, { "epoch": 0.4, "learning_rate": 0.0001378928389742937, "loss": 2.3033, "step": 32360 }, { "epoch": 0.4, "learning_rate": 0.00013786573860798048, "loss": 2.3303, "step": 32368 }, { "epoch": 0.4, "learning_rate": 0.00013783863544689158, "loss": 2.3365, "step": 32376 }, { "epoch": 0.4, "learning_rate": 0.00013781152949374526, "loss": 2.306, "step": 32384 }, { "epoch": 0.4, "learning_rate": 0.00013778442075126018, "loss": 2.3207, "step": 32392 }, { "epoch": 0.41, "learning_rate": 0.00013775730922215509, "loss": 2.3471, "step": 32400 }, { "epoch": 0.41, "learning_rate": 0.00013773019490914918, "loss": 2.3217, "step": 32408 }, { "epoch": 0.41, "learning_rate": 0.0001377030778149618, "loss": 2.3427, "step": 32416 }, { "epoch": 0.41, "learning_rate": 0.00013767595794231277, "loss": 2.3208, "step": 32424 }, { "epoch": 0.41, "learning_rate": 0.00013764883529392193, "loss": 2.3332, "step": 32432 }, { "epoch": 0.41, "learning_rate": 0.00013762170987250959, "loss": 2.3168, "step": 32440 }, { "epoch": 0.41, "learning_rate": 0.00013759458168079627, "loss": 2.3292, "step": 32448 }, { "epoch": 0.41, "learning_rate": 0.00013756745072150274, "loss": 2.3347, "step": 32456 }, { "epoch": 0.41, "learning_rate": 0.00013754031699735015, "loss": 2.3264, "step": 32464 }, { "epoch": 0.41, "learning_rate": 0.0001375131805110598, "loss": 2.3475, "step": 32472 }, { "epoch": 0.41, "learning_rate": 0.0001374860412653533, "loss": 2.3212, "step": 32480 }, { "epoch": 0.41, "learning_rate": 0.00013745889926295265, "loss": 2.3351, "step": 32488 }, { "epoch": 0.41, "learning_rate": 0.00013743175450658, "loss": 2.3362, "step": 32496 }, { "epoch": 0.41, "learning_rate": 0.00013740460699895779, "loss": 2.3455, "step": 32504 }, { "epoch": 0.41, "learning_rate": 0.0001373774567428088, "loss": 2.3302, "step": 32512 }, { "epoch": 0.41, "learning_rate": 0.000137350303740856, "loss": 2.3088, "step": 32520 }, { "epoch": 0.41, "learning_rate": 0.00013732314799582275, "loss": 2.3471, "step": 32528 }, { "epoch": 0.41, "learning_rate": 0.00013729598951043256, "loss": 2.3461, "step": 32536 }, { "epoch": 0.41, "learning_rate": 0.00013726882828740927, "loss": 2.3278, "step": 32544 }, { "epoch": 0.41, "learning_rate": 0.00013724166432947706, "loss": 2.3329, "step": 32552 }, { "epoch": 0.41, "learning_rate": 0.00013721449763936023, "loss": 2.342, "step": 32560 }, { "epoch": 0.41, "learning_rate": 0.0001371873282197835, "loss": 2.3192, "step": 32568 }, { "epoch": 0.41, "learning_rate": 0.00013716015607347182, "loss": 2.3524, "step": 32576 }, { "epoch": 0.41, "learning_rate": 0.00013713298120315037, "loss": 2.3314, "step": 32584 }, { "epoch": 0.41, "learning_rate": 0.00013710580361154463, "loss": 2.3047, "step": 32592 }, { "epoch": 0.41, "learning_rate": 0.00013707862330138046, "loss": 2.3408, "step": 32600 }, { "epoch": 0.41, "learning_rate": 0.00013705144027538374, "loss": 2.3439, "step": 32608 }, { "epoch": 0.41, "learning_rate": 0.00013702425453628085, "loss": 2.3183, "step": 32616 }, { "epoch": 0.41, "learning_rate": 0.00013699706608679834, "loss": 2.3365, "step": 32624 }, { "epoch": 0.41, "learning_rate": 0.0001369698749296631, "loss": 2.3345, "step": 32632 }, { "epoch": 0.41, "learning_rate": 0.00013694268106760225, "loss": 2.317, "step": 32640 }, { "epoch": 0.41, "learning_rate": 0.0001369154845033431, "loss": 2.3474, "step": 32648 }, { "epoch": 0.41, "learning_rate": 0.0001368882852396134, "loss": 2.3258, "step": 32656 }, { "epoch": 0.41, "learning_rate": 0.00013686108327914102, "loss": 2.305, "step": 32664 }, { "epoch": 0.41, "learning_rate": 0.00013683387862465423, "loss": 2.3404, "step": 32672 }, { "epoch": 0.41, "learning_rate": 0.00013680667127888144, "loss": 2.3367, "step": 32680 }, { "epoch": 0.41, "learning_rate": 0.0001367794612445514, "loss": 2.3033, "step": 32688 }, { "epoch": 0.41, "learning_rate": 0.0001367522485243932, "loss": 2.3386, "step": 32696 }, { "epoch": 0.41, "learning_rate": 0.000136725033121136, "loss": 2.3398, "step": 32704 }, { "epoch": 0.41, "learning_rate": 0.00013669781503750943, "loss": 2.3317, "step": 32712 }, { "epoch": 0.41, "learning_rate": 0.00013667059427624326, "loss": 2.3333, "step": 32720 }, { "epoch": 0.41, "learning_rate": 0.00013664337084006765, "loss": 2.3498, "step": 32728 }, { "epoch": 0.41, "learning_rate": 0.0001366161447317129, "loss": 2.3159, "step": 32736 }, { "epoch": 0.41, "learning_rate": 0.00013658891595390966, "loss": 2.3382, "step": 32744 }, { "epoch": 0.41, "learning_rate": 0.00013656168450938878, "loss": 2.3327, "step": 32752 }, { "epoch": 0.41, "learning_rate": 0.00013653445040088147, "loss": 2.3289, "step": 32760 }, { "epoch": 0.41, "learning_rate": 0.00013650721363111913, "loss": 2.3335, "step": 32768 }, { "epoch": 0.41, "learning_rate": 0.00013647997420283348, "loss": 2.335, "step": 32776 }, { "epoch": 0.41, "learning_rate": 0.00013645273211875645, "loss": 2.3143, "step": 32784 }, { "epoch": 0.41, "learning_rate": 0.00013642548738162027, "loss": 2.3518, "step": 32792 }, { "epoch": 0.41, "learning_rate": 0.00013639823999415745, "loss": 2.3477, "step": 32800 }, { "epoch": 0.41, "learning_rate": 0.00013637098995910075, "loss": 2.3158, "step": 32808 }, { "epoch": 0.41, "learning_rate": 0.00013634373727918316, "loss": 2.3237, "step": 32816 }, { "epoch": 0.41, "learning_rate": 0.000136316481957138, "loss": 2.3383, "step": 32824 }, { "epoch": 0.41, "learning_rate": 0.0001362892239956988, "loss": 2.335, "step": 32832 }, { "epoch": 0.41, "learning_rate": 0.00013626196339759945, "loss": 2.336, "step": 32840 }, { "epoch": 0.41, "learning_rate": 0.00013623470016557393, "loss": 2.3121, "step": 32848 }, { "epoch": 0.41, "learning_rate": 0.00013620743430235664, "loss": 2.3398, "step": 32856 }, { "epoch": 0.41, "learning_rate": 0.00013618016581068223, "loss": 2.3294, "step": 32864 }, { "epoch": 0.41, "learning_rate": 0.0001361528946932855, "loss": 2.3147, "step": 32872 }, { "epoch": 0.41, "learning_rate": 0.0001361256209529016, "loss": 2.3243, "step": 32880 }, { "epoch": 0.41, "learning_rate": 0.00013609834459226601, "loss": 2.3484, "step": 32888 }, { "epoch": 0.41, "learning_rate": 0.0001360710656141143, "loss": 2.3221, "step": 32896 }, { "epoch": 0.41, "learning_rate": 0.00013604378402118247, "loss": 2.3189, "step": 32904 }, { "epoch": 0.41, "learning_rate": 0.00013601649981620663, "loss": 2.3377, "step": 32912 }, { "epoch": 0.41, "learning_rate": 0.0001359892130019233, "loss": 2.3243, "step": 32920 }, { "epoch": 0.41, "learning_rate": 0.0001359619235810692, "loss": 2.3366, "step": 32928 }, { "epoch": 0.41, "learning_rate": 0.0001359346315563812, "loss": 2.3385, "step": 32936 }, { "epoch": 0.41, "learning_rate": 0.00013590733693059668, "loss": 2.3185, "step": 32944 }, { "epoch": 0.41, "learning_rate": 0.00013588003970645303, "loss": 2.3202, "step": 32952 }, { "epoch": 0.41, "learning_rate": 0.00013585273988668802, "loss": 2.3385, "step": 32960 }, { "epoch": 0.41, "learning_rate": 0.00013582543747403972, "loss": 2.3334, "step": 32968 }, { "epoch": 0.41, "learning_rate": 0.00013579813247124636, "loss": 2.3069, "step": 32976 }, { "epoch": 0.41, "learning_rate": 0.0001357708248810465, "loss": 2.3268, "step": 32984 }, { "epoch": 0.41, "learning_rate": 0.00013574351470617895, "loss": 2.3412, "step": 32992 }, { "epoch": 0.41, "learning_rate": 0.00013571620194938275, "loss": 2.3255, "step": 33000 }, { "epoch": 0.41, "learning_rate": 0.0001356888866133972, "loss": 2.3275, "step": 33008 }, { "epoch": 0.41, "learning_rate": 0.00013566156870096184, "loss": 2.3415, "step": 33016 }, { "epoch": 0.41, "learning_rate": 0.00013563424821481658, "loss": 2.316, "step": 33024 }, { "epoch": 0.41, "learning_rate": 0.0001356069251577015, "loss": 2.3338, "step": 33032 }, { "epoch": 0.41, "learning_rate": 0.0001355795995323569, "loss": 2.3173, "step": 33040 }, { "epoch": 0.41, "learning_rate": 0.0001355522713415234, "loss": 2.3389, "step": 33048 }, { "epoch": 0.41, "learning_rate": 0.00013552494058794188, "loss": 2.3337, "step": 33056 }, { "epoch": 0.41, "learning_rate": 0.00013549760727435346, "loss": 2.3549, "step": 33064 }, { "epoch": 0.41, "learning_rate": 0.0001354702714034995, "loss": 2.3263, "step": 33072 }, { "epoch": 0.41, "learning_rate": 0.00013544293297812165, "loss": 2.3393, "step": 33080 }, { "epoch": 0.41, "learning_rate": 0.00013541559200096176, "loss": 2.3174, "step": 33088 }, { "epoch": 0.41, "learning_rate": 0.00013538824847476205, "loss": 2.3373, "step": 33096 }, { "epoch": 0.41, "learning_rate": 0.00013536090240226484, "loss": 2.3121, "step": 33104 }, { "epoch": 0.41, "learning_rate": 0.0001353335537862128, "loss": 2.329, "step": 33112 }, { "epoch": 0.41, "learning_rate": 0.00013530620262934892, "loss": 2.3358, "step": 33120 }, { "epoch": 0.41, "learning_rate": 0.00013527884893441632, "loss": 2.3492, "step": 33128 }, { "epoch": 0.41, "learning_rate": 0.00013525149270415837, "loss": 2.3306, "step": 33136 }, { "epoch": 0.41, "learning_rate": 0.0001352241339413188, "loss": 2.3263, "step": 33144 }, { "epoch": 0.41, "learning_rate": 0.0001351967726486415, "loss": 2.3263, "step": 33152 }, { "epoch": 0.41, "learning_rate": 0.00013516940882887067, "loss": 2.3302, "step": 33160 }, { "epoch": 0.41, "learning_rate": 0.00013514204248475079, "loss": 2.3144, "step": 33168 }, { "epoch": 0.41, "learning_rate": 0.0001351146736190265, "loss": 2.3273, "step": 33176 }, { "epoch": 0.41, "learning_rate": 0.00013508730223444273, "loss": 2.3389, "step": 33184 }, { "epoch": 0.41, "learning_rate": 0.0001350599283337447, "loss": 2.3215, "step": 33192 }, { "epoch": 0.41, "learning_rate": 0.0001350325519196779, "loss": 2.3227, "step": 33200 }, { "epoch": 0.42, "learning_rate": 0.0001350051729949879, "loss": 2.3158, "step": 33208 }, { "epoch": 0.42, "learning_rate": 0.0001349777915624208, "loss": 2.3082, "step": 33216 }, { "epoch": 0.42, "learning_rate": 0.00013495040762472277, "loss": 2.3326, "step": 33224 }, { "epoch": 0.42, "learning_rate": 0.00013492302118464018, "loss": 2.3257, "step": 33232 }, { "epoch": 0.42, "learning_rate": 0.0001348956322449198, "loss": 2.3187, "step": 33240 }, { "epoch": 0.42, "learning_rate": 0.00013486824080830855, "loss": 2.3479, "step": 33248 }, { "epoch": 0.42, "learning_rate": 0.00013484084687755368, "loss": 2.3246, "step": 33256 }, { "epoch": 0.42, "learning_rate": 0.00013481345045540265, "loss": 2.2993, "step": 33264 }, { "epoch": 0.42, "learning_rate": 0.0001347860515446031, "loss": 2.3429, "step": 33272 }, { "epoch": 0.42, "learning_rate": 0.00013475865014790306, "loss": 2.3235, "step": 33280 }, { "epoch": 0.42, "learning_rate": 0.00013473124626805065, "loss": 2.3162, "step": 33288 }, { "epoch": 0.42, "learning_rate": 0.0001347038399077944, "loss": 2.3467, "step": 33296 }, { "epoch": 0.42, "learning_rate": 0.00013467643106988302, "loss": 2.346, "step": 33304 }, { "epoch": 0.42, "learning_rate": 0.0001346490197570654, "loss": 2.3182, "step": 33312 }, { "epoch": 0.42, "learning_rate": 0.00013462160597209075, "loss": 2.3337, "step": 33320 }, { "epoch": 0.42, "learning_rate": 0.00013459418971770854, "loss": 2.3292, "step": 33328 }, { "epoch": 0.42, "learning_rate": 0.00013456677099666844, "loss": 2.3165, "step": 33336 }, { "epoch": 0.42, "learning_rate": 0.0001345393498117205, "loss": 2.3189, "step": 33344 }, { "epoch": 0.42, "learning_rate": 0.00013451192616561471, "loss": 2.3316, "step": 33352 }, { "epoch": 0.42, "learning_rate": 0.0001344845000611017, "loss": 2.3297, "step": 33360 }, { "epoch": 0.42, "learning_rate": 0.00013445707150093206, "loss": 2.3286, "step": 33368 }, { "epoch": 0.42, "learning_rate": 0.0001344296404878567, "loss": 2.3315, "step": 33376 }, { "epoch": 0.42, "learning_rate": 0.00013440220702462684, "loss": 2.3369, "step": 33384 }, { "epoch": 0.42, "learning_rate": 0.00013437477111399388, "loss": 2.3528, "step": 33392 }, { "epoch": 0.42, "learning_rate": 0.0001343473327587095, "loss": 2.3434, "step": 33400 }, { "epoch": 0.42, "learning_rate": 0.0001343198919615256, "loss": 2.312, "step": 33408 }, { "epoch": 0.42, "learning_rate": 0.00013429244872519434, "loss": 2.3376, "step": 33416 }, { "epoch": 0.42, "learning_rate": 0.00013426500305246808, "loss": 2.3139, "step": 33424 }, { "epoch": 0.42, "learning_rate": 0.0001342375549460996, "loss": 2.3187, "step": 33432 }, { "epoch": 0.42, "learning_rate": 0.00013421010440884163, "loss": 2.3292, "step": 33440 }, { "epoch": 0.42, "learning_rate": 0.00013418265144344736, "loss": 2.3267, "step": 33448 }, { "epoch": 0.42, "learning_rate": 0.0001341551960526702, "loss": 2.315, "step": 33456 }, { "epoch": 0.42, "learning_rate": 0.00013412773823926375, "loss": 2.3303, "step": 33464 }, { "epoch": 0.42, "learning_rate": 0.00013410027800598185, "loss": 2.3138, "step": 33472 }, { "epoch": 0.42, "learning_rate": 0.0001340728153555787, "loss": 2.3246, "step": 33480 }, { "epoch": 0.42, "learning_rate": 0.0001340453502908085, "loss": 2.3218, "step": 33488 }, { "epoch": 0.42, "learning_rate": 0.00013401788281442592, "loss": 2.3378, "step": 33496 }, { "epoch": 0.42, "learning_rate": 0.00013399041292918578, "loss": 2.3445, "step": 33504 }, { "epoch": 0.42, "learning_rate": 0.00013396294063784317, "loss": 2.3175, "step": 33512 }, { "epoch": 0.42, "learning_rate": 0.00013393546594315343, "loss": 2.3263, "step": 33520 }, { "epoch": 0.42, "learning_rate": 0.00013390798884787205, "loss": 2.3311, "step": 33528 }, { "epoch": 0.42, "learning_rate": 0.00013388050935475487, "loss": 2.2972, "step": 33536 }, { "epoch": 0.42, "learning_rate": 0.0001338530274665579, "loss": 2.3509, "step": 33544 }, { "epoch": 0.42, "learning_rate": 0.00013382554318603745, "loss": 2.3398, "step": 33552 }, { "epoch": 0.42, "learning_rate": 0.00013379805651594998, "loss": 2.3255, "step": 33560 }, { "epoch": 0.42, "learning_rate": 0.00013377056745905236, "loss": 2.3228, "step": 33568 }, { "epoch": 0.42, "learning_rate": 0.0001337430760181015, "loss": 2.337, "step": 33576 }, { "epoch": 0.42, "learning_rate": 0.00013371558219585464, "loss": 2.3389, "step": 33584 }, { "epoch": 0.42, "learning_rate": 0.00013368808599506922, "loss": 2.32, "step": 33592 }, { "epoch": 0.42, "learning_rate": 0.00013366058741850302, "loss": 2.3347, "step": 33600 }, { "epoch": 0.42, "learning_rate": 0.000133633086468914, "loss": 2.3055, "step": 33608 }, { "epoch": 0.42, "learning_rate": 0.00013360558314906034, "loss": 2.3301, "step": 33616 }, { "epoch": 0.42, "learning_rate": 0.00013357807746170036, "loss": 2.3413, "step": 33624 }, { "epoch": 0.42, "learning_rate": 0.0001335505694095929, "loss": 2.315, "step": 33632 }, { "epoch": 0.42, "learning_rate": 0.00013352305899549672, "loss": 2.3321, "step": 33640 }, { "epoch": 0.42, "learning_rate": 0.00013349554622217103, "loss": 2.3298, "step": 33648 }, { "epoch": 0.42, "learning_rate": 0.00013346803109237518, "loss": 2.3372, "step": 33656 }, { "epoch": 0.42, "learning_rate": 0.0001334405136088688, "loss": 2.3442, "step": 33664 }, { "epoch": 0.42, "learning_rate": 0.0001334129937744117, "loss": 2.3291, "step": 33672 }, { "epoch": 0.42, "learning_rate": 0.000133385471591764, "loss": 2.2941, "step": 33680 }, { "epoch": 0.42, "learning_rate": 0.00013335794706368606, "loss": 2.325, "step": 33688 }, { "epoch": 0.42, "learning_rate": 0.00013333042019293833, "loss": 2.3194, "step": 33696 }, { "epoch": 0.42, "learning_rate": 0.00013330289098228165, "loss": 2.3252, "step": 33704 }, { "epoch": 0.42, "learning_rate": 0.00013327535943447706, "loss": 2.3262, "step": 33712 }, { "epoch": 0.42, "learning_rate": 0.00013324782555228581, "loss": 2.3263, "step": 33720 }, { "epoch": 0.42, "learning_rate": 0.00013322028933846936, "loss": 2.319, "step": 33728 }, { "epoch": 0.42, "learning_rate": 0.0001331927507957895, "loss": 2.3209, "step": 33736 }, { "epoch": 0.42, "learning_rate": 0.00013316520992700813, "loss": 2.3131, "step": 33744 }, { "epoch": 0.42, "learning_rate": 0.00013313766673488748, "loss": 2.335, "step": 33752 }, { "epoch": 0.42, "learning_rate": 0.00013311012122218995, "loss": 2.3272, "step": 33760 }, { "epoch": 0.42, "learning_rate": 0.0001330825733916782, "loss": 2.3284, "step": 33768 }, { "epoch": 0.42, "learning_rate": 0.00013305502324611516, "loss": 2.3199, "step": 33776 }, { "epoch": 0.42, "learning_rate": 0.00013302747078826395, "loss": 2.3329, "step": 33784 }, { "epoch": 0.42, "learning_rate": 0.00013299991602088782, "loss": 2.3292, "step": 33792 }, { "epoch": 0.42, "learning_rate": 0.0001329723589467505, "loss": 2.3425, "step": 33800 }, { "epoch": 0.42, "learning_rate": 0.0001329447995686157, "loss": 2.3359, "step": 33808 }, { "epoch": 0.42, "learning_rate": 0.00013291723788924758, "loss": 2.3153, "step": 33816 }, { "epoch": 0.42, "learning_rate": 0.00013288967391141029, "loss": 2.3149, "step": 33824 }, { "epoch": 0.42, "learning_rate": 0.00013286210763786843, "loss": 2.3068, "step": 33832 }, { "epoch": 0.42, "learning_rate": 0.00013283453907138673, "loss": 2.3255, "step": 33840 }, { "epoch": 0.42, "learning_rate": 0.00013280696821473014, "loss": 2.3269, "step": 33848 }, { "epoch": 0.42, "learning_rate": 0.00013277939507066387, "loss": 2.2989, "step": 33856 }, { "epoch": 0.42, "learning_rate": 0.0001327518196419533, "loss": 2.3182, "step": 33864 }, { "epoch": 0.42, "learning_rate": 0.00013272424193136424, "loss": 2.3271, "step": 33872 }, { "epoch": 0.42, "learning_rate": 0.00013269666194166242, "loss": 2.3189, "step": 33880 }, { "epoch": 0.42, "learning_rate": 0.000132669079675614, "loss": 2.3362, "step": 33888 }, { "epoch": 0.42, "learning_rate": 0.00013264149513598537, "loss": 2.3303, "step": 33896 }, { "epoch": 0.42, "learning_rate": 0.00013261390832554305, "loss": 2.3359, "step": 33904 }, { "epoch": 0.42, "learning_rate": 0.0001325863192470539, "loss": 2.3111, "step": 33912 }, { "epoch": 0.42, "learning_rate": 0.00013255872790328486, "loss": 2.3387, "step": 33920 }, { "epoch": 0.42, "learning_rate": 0.00013253113429700326, "loss": 2.3154, "step": 33928 }, { "epoch": 0.42, "learning_rate": 0.00013250353843097655, "loss": 2.3182, "step": 33936 }, { "epoch": 0.42, "learning_rate": 0.00013247594030797244, "loss": 2.328, "step": 33944 }, { "epoch": 0.42, "learning_rate": 0.0001324483399307589, "loss": 2.3183, "step": 33952 }, { "epoch": 0.42, "learning_rate": 0.00013242073730210404, "loss": 2.3307, "step": 33960 }, { "epoch": 0.42, "learning_rate": 0.00013239313242477632, "loss": 2.3219, "step": 33968 }, { "epoch": 0.42, "learning_rate": 0.00013236552530154424, "loss": 2.3249, "step": 33976 }, { "epoch": 0.42, "learning_rate": 0.00013233791593517675, "loss": 2.3335, "step": 33984 }, { "epoch": 0.42, "learning_rate": 0.0001323103043284428, "loss": 2.3166, "step": 33992 }, { "epoch": 0.42, "learning_rate": 0.0001322826904841118, "loss": 2.3181, "step": 34000 }, { "epoch": 0.43, "learning_rate": 0.00013225507440495321, "loss": 2.3349, "step": 34008 }, { "epoch": 0.43, "learning_rate": 0.00013222745609373676, "loss": 2.3305, "step": 34016 }, { "epoch": 0.43, "learning_rate": 0.00013219983555323237, "loss": 2.3511, "step": 34024 }, { "epoch": 0.43, "learning_rate": 0.0001321722127862103, "loss": 2.3142, "step": 34032 }, { "epoch": 0.43, "learning_rate": 0.00013214458779544093, "loss": 2.3216, "step": 34040 }, { "epoch": 0.43, "learning_rate": 0.00013211696058369486, "loss": 2.3294, "step": 34048 }, { "epoch": 0.43, "learning_rate": 0.00013208933115374297, "loss": 2.3095, "step": 34056 }, { "epoch": 0.43, "learning_rate": 0.0001320616995083563, "loss": 2.3049, "step": 34064 }, { "epoch": 0.43, "learning_rate": 0.00013203406565030624, "loss": 2.3436, "step": 34072 }, { "epoch": 0.43, "learning_rate": 0.0001320064295823642, "loss": 2.3446, "step": 34080 }, { "epoch": 0.43, "learning_rate": 0.000131978791307302, "loss": 2.309, "step": 34088 }, { "epoch": 0.43, "learning_rate": 0.00013195115082789154, "loss": 2.3312, "step": 34096 }, { "epoch": 0.43, "learning_rate": 0.00013192350814690505, "loss": 2.3356, "step": 34104 }, { "epoch": 0.43, "learning_rate": 0.00013189586326711492, "loss": 2.3002, "step": 34112 }, { "epoch": 0.43, "learning_rate": 0.00013186821619129378, "loss": 2.3259, "step": 34120 }, { "epoch": 0.43, "learning_rate": 0.00013184056692221443, "loss": 2.3184, "step": 34128 }, { "epoch": 0.43, "learning_rate": 0.00013181291546265003, "loss": 2.321, "step": 34136 }, { "epoch": 0.43, "learning_rate": 0.00013178526181537376, "loss": 2.332, "step": 34144 }, { "epoch": 0.43, "learning_rate": 0.0001317576059831592, "loss": 2.3391, "step": 34152 }, { "epoch": 0.43, "learning_rate": 0.00013172994796878002, "loss": 2.3083, "step": 34160 }, { "epoch": 0.43, "learning_rate": 0.00013170228777501018, "loss": 2.3083, "step": 34168 }, { "epoch": 0.43, "learning_rate": 0.0001316746254046239, "loss": 2.3349, "step": 34176 }, { "epoch": 0.43, "learning_rate": 0.0001316469608603955, "loss": 2.323, "step": 34184 }, { "epoch": 0.43, "learning_rate": 0.00013161929414509955, "loss": 2.3084, "step": 34192 }, { "epoch": 0.43, "learning_rate": 0.0001315916252615109, "loss": 2.3286, "step": 34200 }, { "epoch": 0.43, "learning_rate": 0.00013156395421240458, "loss": 2.3202, "step": 34208 }, { "epoch": 0.43, "learning_rate": 0.00013153628100055585, "loss": 2.3184, "step": 34216 }, { "epoch": 0.43, "learning_rate": 0.00013150860562874018, "loss": 2.3427, "step": 34224 }, { "epoch": 0.43, "learning_rate": 0.00013148092809973325, "loss": 2.3231, "step": 34232 }, { "epoch": 0.43, "learning_rate": 0.00013145324841631092, "loss": 2.3042, "step": 34240 }, { "epoch": 0.43, "learning_rate": 0.00013142556658124935, "loss": 2.3215, "step": 34248 }, { "epoch": 0.43, "learning_rate": 0.00013139788259732484, "loss": 2.3244, "step": 34256 }, { "epoch": 0.43, "learning_rate": 0.00013137019646731395, "loss": 2.3211, "step": 34264 }, { "epoch": 0.43, "learning_rate": 0.00013134250819399348, "loss": 2.3224, "step": 34272 }, { "epoch": 0.43, "learning_rate": 0.00013131481778014037, "loss": 2.3353, "step": 34280 }, { "epoch": 0.43, "learning_rate": 0.00013128712522853176, "loss": 2.3068, "step": 34288 }, { "epoch": 0.43, "learning_rate": 0.00013125943054194514, "loss": 2.3377, "step": 34296 }, { "epoch": 0.43, "learning_rate": 0.0001312317337231581, "loss": 2.3393, "step": 34304 }, { "epoch": 0.43, "learning_rate": 0.0001312040347749485, "loss": 2.3399, "step": 34312 }, { "epoch": 0.43, "learning_rate": 0.00013117633370009432, "loss": 2.3153, "step": 34320 }, { "epoch": 0.43, "learning_rate": 0.00013114863050137386, "loss": 2.3328, "step": 34328 }, { "epoch": 0.43, "learning_rate": 0.00013112092518156561, "loss": 2.3037, "step": 34336 }, { "epoch": 0.43, "learning_rate": 0.00013109321774344826, "loss": 2.352, "step": 34344 }, { "epoch": 0.43, "learning_rate": 0.00013106550818980066, "loss": 2.3285, "step": 34352 }, { "epoch": 0.43, "learning_rate": 0.00013103779652340198, "loss": 2.3373, "step": 34360 }, { "epoch": 0.43, "learning_rate": 0.0001310100827470315, "loss": 2.3117, "step": 34368 }, { "epoch": 0.43, "learning_rate": 0.00013098236686346878, "loss": 2.3458, "step": 34376 }, { "epoch": 0.43, "learning_rate": 0.00013095464887549353, "loss": 2.3368, "step": 34384 }, { "epoch": 0.43, "learning_rate": 0.00013092692878588578, "loss": 2.3383, "step": 34392 }, { "epoch": 0.43, "learning_rate": 0.0001308992065974256, "loss": 2.3247, "step": 34400 }, { "epoch": 0.43, "learning_rate": 0.00013087148231289347, "loss": 2.3282, "step": 34408 }, { "epoch": 0.43, "learning_rate": 0.00013084375593506986, "loss": 2.3085, "step": 34416 }, { "epoch": 0.43, "learning_rate": 0.00013081602746673572, "loss": 2.3116, "step": 34424 }, { "epoch": 0.43, "learning_rate": 0.0001307882969106719, "loss": 2.3122, "step": 34432 }, { "epoch": 0.43, "learning_rate": 0.00013076056426965973, "loss": 2.3413, "step": 34440 }, { "epoch": 0.43, "learning_rate": 0.0001307328295464806, "loss": 2.3342, "step": 34448 }, { "epoch": 0.43, "learning_rate": 0.00013070509274391615, "loss": 2.3329, "step": 34456 }, { "epoch": 0.43, "learning_rate": 0.0001306773538647482, "loss": 2.3173, "step": 34464 }, { "epoch": 0.43, "learning_rate": 0.00013064961291175882, "loss": 2.336, "step": 34472 }, { "epoch": 0.43, "learning_rate": 0.0001306218698877303, "loss": 2.3235, "step": 34480 }, { "epoch": 0.43, "learning_rate": 0.00013059412479544507, "loss": 2.2992, "step": 34488 }, { "epoch": 0.43, "learning_rate": 0.0001305663776376858, "loss": 2.3191, "step": 34496 }, { "epoch": 0.43, "learning_rate": 0.00013053862841723538, "loss": 2.3185, "step": 34504 }, { "epoch": 0.43, "learning_rate": 0.00013051087713687696, "loss": 2.3143, "step": 34512 }, { "epoch": 0.43, "learning_rate": 0.00013048312379939373, "loss": 2.3187, "step": 34520 }, { "epoch": 0.43, "learning_rate": 0.00013045536840756926, "loss": 2.3176, "step": 34528 }, { "epoch": 0.43, "learning_rate": 0.00013042761096418727, "loss": 2.3311, "step": 34536 }, { "epoch": 0.43, "learning_rate": 0.00013039985147203165, "loss": 2.3234, "step": 34544 }, { "epoch": 0.43, "learning_rate": 0.0001303720899338865, "loss": 2.344, "step": 34552 }, { "epoch": 0.43, "learning_rate": 0.00013034432635253615, "loss": 2.3544, "step": 34560 }, { "epoch": 0.43, "learning_rate": 0.00013031656073076516, "loss": 2.3232, "step": 34568 }, { "epoch": 0.43, "learning_rate": 0.00013028879307135823, "loss": 2.306, "step": 34576 }, { "epoch": 0.43, "learning_rate": 0.00013026102337710036, "loss": 2.3266, "step": 34584 }, { "epoch": 0.43, "learning_rate": 0.00013023325165077663, "loss": 2.3034, "step": 34592 }, { "epoch": 0.43, "learning_rate": 0.0001302054778951724, "loss": 2.3197, "step": 34600 }, { "epoch": 0.43, "learning_rate": 0.0001301777021130732, "loss": 2.3139, "step": 34608 }, { "epoch": 0.43, "learning_rate": 0.00013014992430726485, "loss": 2.334, "step": 34616 }, { "epoch": 0.43, "learning_rate": 0.0001301221444805333, "loss": 2.3284, "step": 34624 }, { "epoch": 0.43, "learning_rate": 0.0001300943626356646, "loss": 2.3146, "step": 34632 }, { "epoch": 0.43, "learning_rate": 0.00013006657877544524, "loss": 2.3201, "step": 34640 }, { "epoch": 0.43, "learning_rate": 0.00013003879290266173, "loss": 2.3053, "step": 34648 }, { "epoch": 0.43, "learning_rate": 0.00013001100502010082, "loss": 2.3236, "step": 34656 }, { "epoch": 0.43, "learning_rate": 0.0001299832151305495, "loss": 2.3267, "step": 34664 }, { "epoch": 0.43, "learning_rate": 0.00012995542323679493, "loss": 2.3376, "step": 34672 }, { "epoch": 0.43, "learning_rate": 0.00012992762934162447, "loss": 2.3303, "step": 34680 }, { "epoch": 0.43, "learning_rate": 0.00012989983344782575, "loss": 2.3228, "step": 34688 }, { "epoch": 0.43, "learning_rate": 0.00012987203555818645, "loss": 2.3266, "step": 34696 }, { "epoch": 0.43, "learning_rate": 0.0001298442356754946, "loss": 2.3292, "step": 34704 }, { "epoch": 0.43, "learning_rate": 0.0001298164338025384, "loss": 2.3109, "step": 34712 }, { "epoch": 0.43, "learning_rate": 0.00012978862994210609, "loss": 2.3226, "step": 34720 }, { "epoch": 0.43, "learning_rate": 0.00012976082409698635, "loss": 2.3199, "step": 34728 }, { "epoch": 0.43, "learning_rate": 0.00012973301626996797, "loss": 2.3239, "step": 34736 }, { "epoch": 0.43, "learning_rate": 0.00012970520646383985, "loss": 2.3247, "step": 34744 }, { "epoch": 0.43, "learning_rate": 0.00012967739468139116, "loss": 2.3299, "step": 34752 }, { "epoch": 0.43, "learning_rate": 0.00012964958092541128, "loss": 2.3095, "step": 34760 }, { "epoch": 0.43, "learning_rate": 0.00012962176519868977, "loss": 2.3212, "step": 34768 }, { "epoch": 0.43, "learning_rate": 0.00012959394750401644, "loss": 2.3029, "step": 34776 }, { "epoch": 0.43, "learning_rate": 0.00012956612784418114, "loss": 2.3238, "step": 34784 }, { "epoch": 0.43, "learning_rate": 0.0001295383062219741, "loss": 2.3168, "step": 34792 }, { "epoch": 0.43, "learning_rate": 0.0001295104826401857, "loss": 2.3121, "step": 34800 }, { "epoch": 0.44, "learning_rate": 0.00012948265710160644, "loss": 2.3227, "step": 34808 }, { "epoch": 0.44, "learning_rate": 0.00012945482960902705, "loss": 2.343, "step": 34816 }, { "epoch": 0.44, "learning_rate": 0.00012942700016523842, "loss": 2.3074, "step": 34824 }, { "epoch": 0.44, "learning_rate": 0.00012939916877303183, "loss": 2.3166, "step": 34832 }, { "epoch": 0.44, "learning_rate": 0.00012937133543519853, "loss": 2.3095, "step": 34840 }, { "epoch": 0.44, "learning_rate": 0.00012934350015453004, "loss": 2.309, "step": 34848 }, { "epoch": 0.44, "learning_rate": 0.0001293156629338181, "loss": 2.3113, "step": 34856 }, { "epoch": 0.44, "learning_rate": 0.0001292878237758546, "loss": 2.3229, "step": 34864 }, { "epoch": 0.44, "learning_rate": 0.00012925998268343165, "loss": 2.3305, "step": 34872 }, { "epoch": 0.44, "learning_rate": 0.00012923213965934159, "loss": 2.315, "step": 34880 }, { "epoch": 0.44, "learning_rate": 0.0001292042947063769, "loss": 2.3205, "step": 34888 }, { "epoch": 0.44, "learning_rate": 0.00012917644782733026, "loss": 2.33, "step": 34896 }, { "epoch": 0.44, "learning_rate": 0.00012914859902499456, "loss": 2.3137, "step": 34904 }, { "epoch": 0.44, "learning_rate": 0.00012912074830216287, "loss": 2.3306, "step": 34912 }, { "epoch": 0.44, "learning_rate": 0.0001290928956616285, "loss": 2.3163, "step": 34920 }, { "epoch": 0.44, "learning_rate": 0.00012906504110618487, "loss": 2.317, "step": 34928 }, { "epoch": 0.44, "learning_rate": 0.00012903718463862563, "loss": 2.3251, "step": 34936 }, { "epoch": 0.44, "learning_rate": 0.00012900932626174467, "loss": 2.3335, "step": 34944 }, { "epoch": 0.44, "learning_rate": 0.00012898146597833599, "loss": 2.3228, "step": 34952 }, { "epoch": 0.44, "learning_rate": 0.00012895360379119384, "loss": 2.3115, "step": 34960 }, { "epoch": 0.44, "learning_rate": 0.00012892573970311257, "loss": 2.3396, "step": 34968 }, { "epoch": 0.44, "learning_rate": 0.0001288978737168869, "loss": 2.3162, "step": 34976 }, { "epoch": 0.44, "learning_rate": 0.00012887000583531157, "loss": 2.3303, "step": 34984 }, { "epoch": 0.44, "learning_rate": 0.00012884213606118155, "loss": 2.3148, "step": 34992 }, { "epoch": 0.44, "learning_rate": 0.00012881426439729208, "loss": 2.3229, "step": 35000 }, { "epoch": 0.44, "learning_rate": 0.00012878639084643848, "loss": 2.3267, "step": 35008 }, { "epoch": 0.44, "learning_rate": 0.00012875851541141635, "loss": 2.3249, "step": 35016 }, { "epoch": 0.44, "learning_rate": 0.00012873063809502142, "loss": 2.3268, "step": 35024 }, { "epoch": 0.44, "learning_rate": 0.00012870275890004956, "loss": 2.3257, "step": 35032 }, { "epoch": 0.44, "learning_rate": 0.00012867487782929703, "loss": 2.3137, "step": 35040 }, { "epoch": 0.44, "learning_rate": 0.00012864699488556003, "loss": 2.3177, "step": 35048 }, { "epoch": 0.44, "learning_rate": 0.00012861911007163508, "loss": 2.3147, "step": 35056 }, { "epoch": 0.44, "learning_rate": 0.00012859122339031894, "loss": 2.3161, "step": 35064 }, { "epoch": 0.44, "learning_rate": 0.00012856333484440846, "loss": 2.3207, "step": 35072 }, { "epoch": 0.44, "learning_rate": 0.00012853544443670062, "loss": 2.3339, "step": 35080 }, { "epoch": 0.44, "learning_rate": 0.00012850755216999276, "loss": 2.3327, "step": 35088 }, { "epoch": 0.44, "learning_rate": 0.00012847965804708232, "loss": 2.3168, "step": 35096 }, { "epoch": 0.44, "learning_rate": 0.00012845176207076684, "loss": 2.3467, "step": 35104 }, { "epoch": 0.44, "learning_rate": 0.00012842386424384417, "loss": 2.3303, "step": 35112 }, { "epoch": 0.44, "learning_rate": 0.00012839596456911236, "loss": 2.3164, "step": 35120 }, { "epoch": 0.44, "learning_rate": 0.0001283680630493695, "loss": 2.3109, "step": 35128 }, { "epoch": 0.44, "learning_rate": 0.00012834015968741396, "loss": 2.3139, "step": 35136 }, { "epoch": 0.44, "learning_rate": 0.0001283122544860444, "loss": 2.3147, "step": 35144 }, { "epoch": 0.44, "learning_rate": 0.00012828434744805947, "loss": 2.3319, "step": 35152 }, { "epoch": 0.44, "learning_rate": 0.0001282564385762581, "loss": 2.3231, "step": 35160 }, { "epoch": 0.44, "learning_rate": 0.0001282285278734393, "loss": 2.321, "step": 35168 }, { "epoch": 0.44, "learning_rate": 0.00012820061534240252, "loss": 2.3155, "step": 35176 }, { "epoch": 0.44, "learning_rate": 0.00012817270098594715, "loss": 2.3178, "step": 35184 }, { "epoch": 0.44, "learning_rate": 0.00012814478480687288, "loss": 2.3227, "step": 35192 }, { "epoch": 0.44, "learning_rate": 0.0001281168668079794, "loss": 2.3269, "step": 35200 }, { "epoch": 0.44, "learning_rate": 0.0001280889469920669, "loss": 2.3199, "step": 35208 }, { "epoch": 0.44, "learning_rate": 0.0001280610253619355, "loss": 2.3257, "step": 35216 }, { "epoch": 0.44, "learning_rate": 0.00012803310192038562, "loss": 2.3252, "step": 35224 }, { "epoch": 0.44, "learning_rate": 0.00012800517667021778, "loss": 2.3276, "step": 35232 }, { "epoch": 0.44, "learning_rate": 0.00012797724961423275, "loss": 2.3214, "step": 35240 }, { "epoch": 0.44, "learning_rate": 0.00012794932075523146, "loss": 2.3358, "step": 35248 }, { "epoch": 0.44, "learning_rate": 0.00012792139009601498, "loss": 2.3073, "step": 35256 }, { "epoch": 0.44, "learning_rate": 0.00012789345763938463, "loss": 2.3399, "step": 35264 }, { "epoch": 0.44, "learning_rate": 0.00012786552338814184, "loss": 2.3255, "step": 35272 }, { "epoch": 0.44, "learning_rate": 0.00012783758734508834, "loss": 2.3135, "step": 35280 }, { "epoch": 0.44, "learning_rate": 0.0001278096495130259, "loss": 2.3236, "step": 35288 }, { "epoch": 0.44, "learning_rate": 0.0001277817098947565, "loss": 2.3276, "step": 35296 }, { "epoch": 0.44, "learning_rate": 0.00012775376849308233, "loss": 2.3406, "step": 35304 }, { "epoch": 0.44, "learning_rate": 0.0001277258253108058, "loss": 2.3086, "step": 35312 }, { "epoch": 0.44, "learning_rate": 0.00012769788035072948, "loss": 2.3288, "step": 35320 }, { "epoch": 0.44, "learning_rate": 0.000127669933615656, "loss": 2.3275, "step": 35328 }, { "epoch": 0.44, "learning_rate": 0.0001276419851083883, "loss": 2.3064, "step": 35336 }, { "epoch": 0.44, "learning_rate": 0.00012761403483172945, "loss": 2.3304, "step": 35344 }, { "epoch": 0.44, "learning_rate": 0.00012758608278848273, "loss": 2.3202, "step": 35352 }, { "epoch": 0.44, "learning_rate": 0.00012755812898145155, "loss": 2.3175, "step": 35360 }, { "epoch": 0.44, "learning_rate": 0.00012753017341343953, "loss": 2.3092, "step": 35368 }, { "epoch": 0.44, "learning_rate": 0.00012750221608725046, "loss": 2.3127, "step": 35376 }, { "epoch": 0.44, "learning_rate": 0.00012747425700568828, "loss": 2.3398, "step": 35384 }, { "epoch": 0.44, "learning_rate": 0.0001274462961715571, "loss": 2.3146, "step": 35392 }, { "epoch": 0.44, "learning_rate": 0.0001274183335876613, "loss": 2.3411, "step": 35400 }, { "epoch": 0.44, "learning_rate": 0.00012739036925680532, "loss": 2.3546, "step": 35408 }, { "epoch": 0.44, "learning_rate": 0.0001273624031817939, "loss": 2.3257, "step": 35416 }, { "epoch": 0.44, "learning_rate": 0.00012733443536543177, "loss": 2.3158, "step": 35424 }, { "epoch": 0.44, "learning_rate": 0.00012730646581052401, "loss": 2.3337, "step": 35432 }, { "epoch": 0.44, "learning_rate": 0.00012727849451987577, "loss": 2.3402, "step": 35440 }, { "epoch": 0.44, "learning_rate": 0.00012725052149629247, "loss": 2.3223, "step": 35448 }, { "epoch": 0.44, "learning_rate": 0.00012722254674257956, "loss": 2.3288, "step": 35456 }, { "epoch": 0.44, "learning_rate": 0.0001271945702615429, "loss": 2.3428, "step": 35464 }, { "epoch": 0.44, "learning_rate": 0.00012716659205598817, "loss": 2.3239, "step": 35472 }, { "epoch": 0.44, "learning_rate": 0.00012713861212872155, "loss": 2.3195, "step": 35480 }, { "epoch": 0.44, "learning_rate": 0.00012711063048254927, "loss": 2.3424, "step": 35488 }, { "epoch": 0.44, "learning_rate": 0.0001270826471202777, "loss": 2.3361, "step": 35496 }, { "epoch": 0.44, "learning_rate": 0.00012705466204471344, "loss": 2.3074, "step": 35504 }, { "epoch": 0.44, "learning_rate": 0.0001270266752586632, "loss": 2.3243, "step": 35512 }, { "epoch": 0.44, "learning_rate": 0.0001269986867649339, "loss": 2.3278, "step": 35520 }, { "epoch": 0.44, "learning_rate": 0.00012697069656633265, "loss": 2.3328, "step": 35528 }, { "epoch": 0.44, "learning_rate": 0.00012694270466566664, "loss": 2.3323, "step": 35536 }, { "epoch": 0.44, "learning_rate": 0.0001269147110657434, "loss": 2.3209, "step": 35544 }, { "epoch": 0.44, "learning_rate": 0.0001268867157693705, "loss": 2.3379, "step": 35552 }, { "epoch": 0.44, "learning_rate": 0.00012685871877935568, "loss": 2.3276, "step": 35560 }, { "epoch": 0.44, "learning_rate": 0.0001268307200985069, "loss": 2.3087, "step": 35568 }, { "epoch": 0.44, "learning_rate": 0.00012680271972963225, "loss": 2.339, "step": 35576 }, { "epoch": 0.44, "learning_rate": 0.00012677471767554, "loss": 2.3296, "step": 35584 }, { "epoch": 0.44, "learning_rate": 0.0001267467139390387, "loss": 2.3006, "step": 35592 }, { "epoch": 0.45, "learning_rate": 0.0001267187085229368, "loss": 2.3167, "step": 35600 }, { "epoch": 0.45, "learning_rate": 0.00012669070143004317, "loss": 2.3297, "step": 35608 }, { "epoch": 0.45, "learning_rate": 0.00012666269266316683, "loss": 2.3163, "step": 35616 }, { "epoch": 0.45, "learning_rate": 0.00012663468222511677, "loss": 2.3302, "step": 35624 }, { "epoch": 0.45, "learning_rate": 0.00012660667011870236, "loss": 2.3274, "step": 35632 }, { "epoch": 0.45, "learning_rate": 0.00012657865634673303, "loss": 2.3218, "step": 35640 }, { "epoch": 0.45, "learning_rate": 0.0001265506409120184, "loss": 2.3262, "step": 35648 }, { "epoch": 0.45, "learning_rate": 0.0001265226238173683, "loss": 2.3393, "step": 35656 }, { "epoch": 0.45, "learning_rate": 0.00012649460506559263, "loss": 2.3246, "step": 35664 }, { "epoch": 0.45, "learning_rate": 0.00012646658465950152, "loss": 2.3288, "step": 35672 }, { "epoch": 0.45, "learning_rate": 0.00012643856260190531, "loss": 2.326, "step": 35680 }, { "epoch": 0.45, "learning_rate": 0.00012641053889561442, "loss": 2.3293, "step": 35688 }, { "epoch": 0.45, "learning_rate": 0.0001263825135434394, "loss": 2.3186, "step": 35696 }, { "epoch": 0.45, "learning_rate": 0.00012635448654819118, "loss": 2.331, "step": 35704 }, { "epoch": 0.45, "learning_rate": 0.00012632645791268058, "loss": 2.3387, "step": 35712 }, { "epoch": 0.45, "learning_rate": 0.00012629842763971878, "loss": 2.3084, "step": 35720 }, { "epoch": 0.45, "learning_rate": 0.00012627039573211705, "loss": 2.3067, "step": 35728 }, { "epoch": 0.45, "learning_rate": 0.0001262423621926868, "loss": 2.3111, "step": 35736 }, { "epoch": 0.45, "learning_rate": 0.00012621432702423965, "loss": 2.3362, "step": 35744 }, { "epoch": 0.45, "learning_rate": 0.00012618629022958738, "loss": 2.3327, "step": 35752 }, { "epoch": 0.45, "learning_rate": 0.00012615825181154196, "loss": 2.3232, "step": 35760 }, { "epoch": 0.45, "learning_rate": 0.00012613021177291538, "loss": 2.3142, "step": 35768 }, { "epoch": 0.45, "learning_rate": 0.00012610217011652, "loss": 2.3136, "step": 35776 }, { "epoch": 0.45, "learning_rate": 0.00012607412684516818, "loss": 2.3051, "step": 35784 }, { "epoch": 0.45, "learning_rate": 0.00012604608196167252, "loss": 2.3207, "step": 35792 }, { "epoch": 0.45, "learning_rate": 0.00012601803546884575, "loss": 2.3219, "step": 35800 }, { "epoch": 0.45, "learning_rate": 0.00012598998736950082, "loss": 2.3193, "step": 35808 }, { "epoch": 0.45, "learning_rate": 0.00012596193766645076, "loss": 2.3212, "step": 35816 }, { "epoch": 0.45, "learning_rate": 0.00012593388636250873, "loss": 2.3263, "step": 35824 }, { "epoch": 0.45, "learning_rate": 0.00012590583346048826, "loss": 2.3116, "step": 35832 }, { "epoch": 0.45, "learning_rate": 0.00012587777896320277, "loss": 2.2988, "step": 35840 }, { "epoch": 0.45, "learning_rate": 0.000125849722873466, "loss": 2.3228, "step": 35848 }, { "epoch": 0.45, "learning_rate": 0.00012582166519409192, "loss": 2.3214, "step": 35856 }, { "epoch": 0.45, "learning_rate": 0.00012579360592789441, "loss": 2.3232, "step": 35864 }, { "epoch": 0.45, "learning_rate": 0.00012576554507768775, "loss": 2.3058, "step": 35872 }, { "epoch": 0.45, "learning_rate": 0.00012573748264628622, "loss": 2.3431, "step": 35880 }, { "epoch": 0.45, "learning_rate": 0.0001257094186365044, "loss": 2.3248, "step": 35888 }, { "epoch": 0.45, "learning_rate": 0.00012568135305115685, "loss": 2.3134, "step": 35896 }, { "epoch": 0.45, "learning_rate": 0.00012565328589305848, "loss": 2.2908, "step": 35904 }, { "epoch": 0.45, "learning_rate": 0.00012562521716502422, "loss": 2.312, "step": 35912 }, { "epoch": 0.45, "learning_rate": 0.0001255971468698692, "loss": 2.2978, "step": 35920 }, { "epoch": 0.45, "learning_rate": 0.00012556907501040876, "loss": 2.3208, "step": 35928 }, { "epoch": 0.45, "learning_rate": 0.00012554100158945828, "loss": 2.3214, "step": 35936 }, { "epoch": 0.45, "learning_rate": 0.00012551292660983342, "loss": 2.2977, "step": 35944 }, { "epoch": 0.45, "learning_rate": 0.00012548485007434995, "loss": 2.3021, "step": 35952 }, { "epoch": 0.45, "learning_rate": 0.0001254567719858237, "loss": 2.3519, "step": 35960 }, { "epoch": 0.45, "learning_rate": 0.00012542869234707083, "loss": 2.33, "step": 35968 }, { "epoch": 0.45, "learning_rate": 0.00012540061116090754, "loss": 2.3284, "step": 35976 }, { "epoch": 0.45, "learning_rate": 0.00012537252843015023, "loss": 2.3012, "step": 35984 }, { "epoch": 0.45, "learning_rate": 0.00012534444415761544, "loss": 2.3089, "step": 35992 }, { "epoch": 0.45, "learning_rate": 0.0001253163583461198, "loss": 2.3059, "step": 36000 }, { "epoch": 0.45, "learning_rate": 0.0001252882709984802, "loss": 2.3114, "step": 36008 }, { "epoch": 0.45, "learning_rate": 0.0001252601821175137, "loss": 2.3095, "step": 36016 }, { "epoch": 0.45, "learning_rate": 0.00012523209170603737, "loss": 2.3257, "step": 36024 }, { "epoch": 0.45, "learning_rate": 0.00012520399976686858, "loss": 2.3157, "step": 36032 }, { "epoch": 0.45, "learning_rate": 0.00012517590630282472, "loss": 2.323, "step": 36040 }, { "epoch": 0.45, "learning_rate": 0.00012514781131672348, "loss": 2.3198, "step": 36048 }, { "epoch": 0.45, "learning_rate": 0.0001251197148113826, "loss": 2.3166, "step": 36056 }, { "epoch": 0.45, "learning_rate": 0.00012509161678961995, "loss": 2.2942, "step": 36064 }, { "epoch": 0.45, "learning_rate": 0.00012506351725425372, "loss": 2.2966, "step": 36072 }, { "epoch": 0.45, "learning_rate": 0.000125035416208102, "loss": 2.3076, "step": 36080 }, { "epoch": 0.45, "learning_rate": 0.00012500731365398327, "loss": 2.333, "step": 36088 }, { "epoch": 0.45, "learning_rate": 0.000124979209594716, "loss": 2.3147, "step": 36096 }, { "epoch": 0.45, "learning_rate": 0.00012495110403311892, "loss": 2.3291, "step": 36104 }, { "epoch": 0.45, "learning_rate": 0.00012492299697201077, "loss": 2.3327, "step": 36112 }, { "epoch": 0.45, "learning_rate": 0.00012489488841421062, "loss": 2.3247, "step": 36120 }, { "epoch": 0.45, "learning_rate": 0.00012486677836253752, "loss": 2.3318, "step": 36128 }, { "epoch": 0.45, "learning_rate": 0.00012483866681981085, "loss": 2.3198, "step": 36136 }, { "epoch": 0.45, "learning_rate": 0.00012481055378884992, "loss": 2.3276, "step": 36144 }, { "epoch": 0.45, "learning_rate": 0.0001247824392724744, "loss": 2.321, "step": 36152 }, { "epoch": 0.45, "learning_rate": 0.00012475432327350395, "loss": 2.3244, "step": 36160 }, { "epoch": 0.45, "learning_rate": 0.00012472620579475857, "loss": 2.3513, "step": 36168 }, { "epoch": 0.45, "learning_rate": 0.00012469808683905807, "loss": 2.3104, "step": 36176 }, { "epoch": 0.45, "learning_rate": 0.00012466996640922282, "loss": 2.3317, "step": 36184 }, { "epoch": 0.45, "learning_rate": 0.00012464184450807303, "loss": 2.3242, "step": 36192 }, { "epoch": 0.45, "learning_rate": 0.00012461372113842923, "loss": 2.3207, "step": 36200 }, { "epoch": 0.45, "learning_rate": 0.00012458559630311198, "loss": 2.33, "step": 36208 }, { "epoch": 0.45, "learning_rate": 0.00012455747000494208, "loss": 2.313, "step": 36216 }, { "epoch": 0.45, "learning_rate": 0.00012452934224674043, "loss": 2.3112, "step": 36224 }, { "epoch": 0.45, "learning_rate": 0.00012450121303132807, "loss": 2.3176, "step": 36232 }, { "epoch": 0.45, "learning_rate": 0.0001244730823615262, "loss": 2.3316, "step": 36240 }, { "epoch": 0.45, "learning_rate": 0.00012444495024015618, "loss": 2.3208, "step": 36248 }, { "epoch": 0.45, "learning_rate": 0.00012441681667003953, "loss": 2.3303, "step": 36256 }, { "epoch": 0.45, "learning_rate": 0.00012438868165399783, "loss": 2.2997, "step": 36264 }, { "epoch": 0.45, "learning_rate": 0.00012436054519485292, "loss": 2.2914, "step": 36272 }, { "epoch": 0.45, "learning_rate": 0.00012433240729542666, "loss": 2.3033, "step": 36280 }, { "epoch": 0.45, "learning_rate": 0.00012430426795854117, "loss": 2.3171, "step": 36288 }, { "epoch": 0.45, "learning_rate": 0.00012427612718701872, "loss": 2.3284, "step": 36296 }, { "epoch": 0.45, "learning_rate": 0.00012424798498368152, "loss": 2.327, "step": 36304 }, { "epoch": 0.45, "learning_rate": 0.00012421984135135218, "loss": 2.3266, "step": 36312 }, { "epoch": 0.45, "learning_rate": 0.00012419169629285335, "loss": 2.3162, "step": 36320 }, { "epoch": 0.45, "learning_rate": 0.0001241635498110078, "loss": 2.3251, "step": 36328 }, { "epoch": 0.45, "learning_rate": 0.00012413540190863844, "loss": 2.332, "step": 36336 }, { "epoch": 0.45, "learning_rate": 0.00012410725258856837, "loss": 2.317, "step": 36344 }, { "epoch": 0.45, "learning_rate": 0.00012407910185362078, "loss": 2.312, "step": 36352 }, { "epoch": 0.45, "learning_rate": 0.00012405094970661907, "loss": 2.3103, "step": 36360 }, { "epoch": 0.45, "learning_rate": 0.00012402279615038675, "loss": 2.328, "step": 36368 }, { "epoch": 0.45, "learning_rate": 0.0001239946411877474, "loss": 2.3279, "step": 36376 }, { "epoch": 0.45, "learning_rate": 0.00012396648482152484, "loss": 2.3065, "step": 36384 }, { "epoch": 0.45, "learning_rate": 0.000123938327054543, "loss": 2.3227, "step": 36392 }, { "epoch": 0.46, "learning_rate": 0.00012391016788962592, "loss": 2.3109, "step": 36400 }, { "epoch": 0.46, "learning_rate": 0.00012388200732959783, "loss": 2.3046, "step": 36408 }, { "epoch": 0.46, "learning_rate": 0.00012385384537728304, "loss": 2.3268, "step": 36416 }, { "epoch": 0.46, "learning_rate": 0.00012382568203550608, "loss": 2.3244, "step": 36424 }, { "epoch": 0.46, "learning_rate": 0.0001237975173070916, "loss": 2.3162, "step": 36432 }, { "epoch": 0.46, "learning_rate": 0.00012376935119486426, "loss": 2.3322, "step": 36440 }, { "epoch": 0.46, "learning_rate": 0.000123741183701649, "loss": 2.3115, "step": 36448 }, { "epoch": 0.46, "learning_rate": 0.00012371301483027092, "loss": 2.3171, "step": 36456 }, { "epoch": 0.46, "learning_rate": 0.00012368484458355513, "loss": 2.3138, "step": 36464 }, { "epoch": 0.46, "learning_rate": 0.00012365667296432702, "loss": 2.3149, "step": 36472 }, { "epoch": 0.46, "learning_rate": 0.0001236284999754119, "loss": 2.3253, "step": 36480 }, { "epoch": 0.46, "learning_rate": 0.0001236003256196355, "loss": 2.3028, "step": 36488 }, { "epoch": 0.46, "learning_rate": 0.00012357214989982355, "loss": 2.3456, "step": 36496 }, { "epoch": 0.46, "learning_rate": 0.00012354397281880183, "loss": 2.3143, "step": 36504 }, { "epoch": 0.46, "learning_rate": 0.00012351579437939634, "loss": 2.3296, "step": 36512 }, { "epoch": 0.46, "learning_rate": 0.00012348761458443334, "loss": 2.3229, "step": 36520 }, { "epoch": 0.46, "learning_rate": 0.00012345943343673895, "loss": 2.3292, "step": 36528 }, { "epoch": 0.46, "learning_rate": 0.0001234312509391397, "loss": 2.316, "step": 36536 }, { "epoch": 0.46, "learning_rate": 0.00012340306709446208, "loss": 2.2996, "step": 36544 }, { "epoch": 0.46, "learning_rate": 0.00012337488190553275, "loss": 2.3416, "step": 36552 }, { "epoch": 0.46, "learning_rate": 0.0001233466953751786, "loss": 2.3318, "step": 36560 }, { "epoch": 0.46, "learning_rate": 0.0001233185075062265, "loss": 2.3093, "step": 36568 }, { "epoch": 0.46, "learning_rate": 0.00012329031830150353, "loss": 2.3301, "step": 36576 }, { "epoch": 0.46, "learning_rate": 0.00012326212776383699, "loss": 2.3024, "step": 36584 }, { "epoch": 0.46, "learning_rate": 0.00012323393589605417, "loss": 2.3384, "step": 36592 }, { "epoch": 0.46, "learning_rate": 0.00012320574270098254, "loss": 2.3186, "step": 36600 }, { "epoch": 0.46, "learning_rate": 0.0001231775481814498, "loss": 2.3222, "step": 36608 }, { "epoch": 0.46, "learning_rate": 0.0001231493523402836, "loss": 2.3406, "step": 36616 }, { "epoch": 0.46, "learning_rate": 0.0001231211551803119, "loss": 2.3087, "step": 36624 }, { "epoch": 0.46, "learning_rate": 0.00012309295670436264, "loss": 2.3262, "step": 36632 }, { "epoch": 0.46, "learning_rate": 0.00012306475691526407, "loss": 2.3166, "step": 36640 }, { "epoch": 0.46, "learning_rate": 0.0001230365558158444, "loss": 2.3204, "step": 36648 }, { "epoch": 0.46, "learning_rate": 0.00012300835340893203, "loss": 2.3239, "step": 36656 }, { "epoch": 0.46, "learning_rate": 0.0001229801496973555, "loss": 2.3336, "step": 36664 }, { "epoch": 0.46, "learning_rate": 0.00012295194468394353, "loss": 2.3312, "step": 36672 }, { "epoch": 0.46, "learning_rate": 0.00012292373837152485, "loss": 2.3209, "step": 36680 }, { "epoch": 0.46, "learning_rate": 0.00012289553076292852, "loss": 2.3186, "step": 36688 }, { "epoch": 0.46, "learning_rate": 0.0001228673218609835, "loss": 2.311, "step": 36696 }, { "epoch": 0.46, "learning_rate": 0.00012283911166851902, "loss": 2.3076, "step": 36704 }, { "epoch": 0.46, "learning_rate": 0.00012281090018836433, "loss": 2.3019, "step": 36712 }, { "epoch": 0.46, "learning_rate": 0.000122782687423349, "loss": 2.3257, "step": 36720 }, { "epoch": 0.46, "learning_rate": 0.00012275447337630252, "loss": 2.347, "step": 36728 }, { "epoch": 0.46, "learning_rate": 0.00012272625805005466, "loss": 2.3258, "step": 36736 }, { "epoch": 0.46, "learning_rate": 0.0001226980414474352, "loss": 2.3135, "step": 36744 }, { "epoch": 0.46, "learning_rate": 0.00012266982357127414, "loss": 2.3088, "step": 36752 }, { "epoch": 0.46, "learning_rate": 0.0001226416044244016, "loss": 2.3362, "step": 36760 }, { "epoch": 0.46, "learning_rate": 0.00012261338400964774, "loss": 2.3336, "step": 36768 }, { "epoch": 0.46, "learning_rate": 0.0001225851623298429, "loss": 2.3109, "step": 36776 }, { "epoch": 0.46, "learning_rate": 0.00012255693938781768, "loss": 2.3124, "step": 36784 }, { "epoch": 0.46, "learning_rate": 0.0001225287151864025, "loss": 2.3143, "step": 36792 }, { "epoch": 0.46, "learning_rate": 0.00012250048972842822, "loss": 2.3266, "step": 36800 }, { "epoch": 0.46, "learning_rate": 0.00012247226301672566, "loss": 2.3098, "step": 36808 }, { "epoch": 0.46, "learning_rate": 0.00012244403505412576, "loss": 2.2957, "step": 36816 }, { "epoch": 0.46, "learning_rate": 0.0001224158058434597, "loss": 2.3267, "step": 36824 }, { "epoch": 0.46, "learning_rate": 0.00012238757538755862, "loss": 2.3403, "step": 36832 }, { "epoch": 0.46, "learning_rate": 0.00012235934368925395, "loss": 2.3172, "step": 36840 }, { "epoch": 0.46, "learning_rate": 0.00012233111075137714, "loss": 2.3234, "step": 36848 }, { "epoch": 0.46, "learning_rate": 0.00012230287657675977, "loss": 2.311, "step": 36856 }, { "epoch": 0.46, "learning_rate": 0.0001222746411682336, "loss": 2.3063, "step": 36864 }, { "epoch": 0.46, "learning_rate": 0.0001222464045286305, "loss": 2.3026, "step": 36872 }, { "epoch": 0.46, "learning_rate": 0.0001222181666607824, "loss": 2.3283, "step": 36880 }, { "epoch": 0.46, "learning_rate": 0.00012218992756752139, "loss": 2.3204, "step": 36888 }, { "epoch": 0.46, "learning_rate": 0.00012216168725167974, "loss": 2.3205, "step": 36896 }, { "epoch": 0.46, "learning_rate": 0.0001221334457160898, "loss": 2.304, "step": 36904 }, { "epoch": 0.46, "learning_rate": 0.00012210520296358394, "loss": 2.293, "step": 36912 }, { "epoch": 0.46, "learning_rate": 0.00012207695899699487, "loss": 2.3304, "step": 36920 }, { "epoch": 0.46, "learning_rate": 0.00012204871381915521, "loss": 2.3389, "step": 36928 }, { "epoch": 0.46, "learning_rate": 0.00012202046743289785, "loss": 2.3319, "step": 36936 }, { "epoch": 0.46, "learning_rate": 0.00012199221984105571, "loss": 2.311, "step": 36944 }, { "epoch": 0.46, "learning_rate": 0.00012196397104646187, "loss": 2.337, "step": 36952 }, { "epoch": 0.46, "learning_rate": 0.00012193572105194953, "loss": 2.3229, "step": 36960 }, { "epoch": 0.46, "learning_rate": 0.000121907469860352, "loss": 2.3131, "step": 36968 }, { "epoch": 0.46, "learning_rate": 0.00012187921747450271, "loss": 2.3223, "step": 36976 }, { "epoch": 0.46, "learning_rate": 0.0001218509638972352, "loss": 2.3264, "step": 36984 }, { "epoch": 0.46, "learning_rate": 0.00012182270913138319, "loss": 2.3202, "step": 36992 }, { "epoch": 0.46, "learning_rate": 0.00012179445317978044, "loss": 2.3259, "step": 37000 }, { "epoch": 0.46, "learning_rate": 0.00012176619604526088, "loss": 2.3078, "step": 37008 }, { "epoch": 0.46, "learning_rate": 0.0001217379377306585, "loss": 2.3269, "step": 37016 }, { "epoch": 0.46, "learning_rate": 0.0001217096782388075, "loss": 2.3322, "step": 37024 }, { "epoch": 0.46, "learning_rate": 0.0001216814175725421, "loss": 2.3154, "step": 37032 }, { "epoch": 0.46, "learning_rate": 0.00012165315573469671, "loss": 2.3052, "step": 37040 }, { "epoch": 0.46, "learning_rate": 0.00012162489272810586, "loss": 2.309, "step": 37048 }, { "epoch": 0.46, "learning_rate": 0.0001215966285556041, "loss": 2.3113, "step": 37056 }, { "epoch": 0.46, "learning_rate": 0.00012156836322002623, "loss": 2.3136, "step": 37064 }, { "epoch": 0.46, "learning_rate": 0.00012154009672420707, "loss": 2.3161, "step": 37072 }, { "epoch": 0.46, "learning_rate": 0.00012151182907098162, "loss": 2.3354, "step": 37080 }, { "epoch": 0.46, "learning_rate": 0.00012148356026318493, "loss": 2.3048, "step": 37088 }, { "epoch": 0.46, "learning_rate": 0.00012145529030365222, "loss": 2.3229, "step": 37096 }, { "epoch": 0.46, "learning_rate": 0.00012142701919521877, "loss": 2.3097, "step": 37104 }, { "epoch": 0.46, "learning_rate": 0.00012139874694072007, "loss": 2.3118, "step": 37112 }, { "epoch": 0.46, "learning_rate": 0.00012137047354299163, "loss": 2.3223, "step": 37120 }, { "epoch": 0.46, "learning_rate": 0.00012134219900486913, "loss": 2.3229, "step": 37128 }, { "epoch": 0.46, "learning_rate": 0.00012131392332918836, "loss": 2.3164, "step": 37136 }, { "epoch": 0.46, "learning_rate": 0.00012128564651878515, "loss": 2.323, "step": 37144 }, { "epoch": 0.46, "learning_rate": 0.00012125736857649554, "loss": 2.3151, "step": 37152 }, { "epoch": 0.46, "learning_rate": 0.00012122908950515568, "loss": 2.3147, "step": 37160 }, { "epoch": 0.46, "learning_rate": 0.00012120080930760179, "loss": 2.3124, "step": 37168 }, { "epoch": 0.46, "learning_rate": 0.00012117252798667016, "loss": 2.3009, "step": 37176 }, { "epoch": 0.46, "learning_rate": 0.00012114424554519726, "loss": 2.3105, "step": 37184 }, { "epoch": 0.46, "learning_rate": 0.00012111596198601971, "loss": 2.2959, "step": 37192 }, { "epoch": 0.47, "learning_rate": 0.00012108767731197414, "loss": 2.3256, "step": 37200 }, { "epoch": 0.47, "learning_rate": 0.00012105939152589738, "loss": 2.3349, "step": 37208 }, { "epoch": 0.47, "learning_rate": 0.00012103110463062631, "loss": 2.2895, "step": 37216 }, { "epoch": 0.47, "learning_rate": 0.00012100281662899795, "loss": 2.2992, "step": 37224 }, { "epoch": 0.47, "learning_rate": 0.00012097452752384942, "loss": 2.3281, "step": 37232 }, { "epoch": 0.47, "learning_rate": 0.00012094623731801797, "loss": 2.3133, "step": 37240 }, { "epoch": 0.47, "learning_rate": 0.00012091794601434094, "loss": 2.3121, "step": 37248 }, { "epoch": 0.47, "learning_rate": 0.00012088965361565578, "loss": 2.332, "step": 37256 }, { "epoch": 0.47, "learning_rate": 0.00012086136012480012, "loss": 2.3212, "step": 37264 }, { "epoch": 0.47, "learning_rate": 0.00012083306554461154, "loss": 2.3227, "step": 37272 }, { "epoch": 0.47, "learning_rate": 0.00012080476987792787, "loss": 2.2924, "step": 37280 }, { "epoch": 0.47, "learning_rate": 0.00012077647312758698, "loss": 2.3191, "step": 37288 }, { "epoch": 0.47, "learning_rate": 0.00012074817529642693, "loss": 2.3228, "step": 37296 }, { "epoch": 0.47, "learning_rate": 0.00012071987638728579, "loss": 2.3182, "step": 37304 }, { "epoch": 0.47, "learning_rate": 0.00012069157640300181, "loss": 2.3124, "step": 37312 }, { "epoch": 0.47, "learning_rate": 0.00012066327534641327, "loss": 2.322, "step": 37320 }, { "epoch": 0.47, "learning_rate": 0.00012063497322035864, "loss": 2.3227, "step": 37328 }, { "epoch": 0.47, "learning_rate": 0.00012060667002767649, "loss": 2.3065, "step": 37336 }, { "epoch": 0.47, "learning_rate": 0.00012057836577120541, "loss": 2.3055, "step": 37344 }, { "epoch": 0.47, "learning_rate": 0.00012055006045378417, "loss": 2.3391, "step": 37352 }, { "epoch": 0.47, "learning_rate": 0.00012052175407825166, "loss": 2.3318, "step": 37360 }, { "epoch": 0.47, "learning_rate": 0.00012049344664744684, "loss": 2.3272, "step": 37368 }, { "epoch": 0.47, "learning_rate": 0.00012046513816420879, "loss": 2.3359, "step": 37376 }, { "epoch": 0.47, "learning_rate": 0.00012043682863137665, "loss": 2.322, "step": 37384 }, { "epoch": 0.47, "learning_rate": 0.00012040851805178974, "loss": 2.328, "step": 37392 }, { "epoch": 0.47, "learning_rate": 0.00012038020642828749, "loss": 2.3279, "step": 37400 }, { "epoch": 0.47, "learning_rate": 0.00012035189376370932, "loss": 2.3141, "step": 37408 }, { "epoch": 0.47, "learning_rate": 0.00012032358006089486, "loss": 2.3221, "step": 37416 }, { "epoch": 0.47, "learning_rate": 0.00012029526532268383, "loss": 2.3143, "step": 37424 }, { "epoch": 0.47, "learning_rate": 0.00012026694955191602, "loss": 2.2934, "step": 37432 }, { "epoch": 0.47, "learning_rate": 0.00012023863275143137, "loss": 2.3392, "step": 37440 }, { "epoch": 0.47, "learning_rate": 0.0001202103149240698, "loss": 2.3168, "step": 37448 }, { "epoch": 0.47, "learning_rate": 0.00012018199607267155, "loss": 2.3223, "step": 37456 }, { "epoch": 0.47, "learning_rate": 0.00012015367620007678, "loss": 2.3083, "step": 37464 }, { "epoch": 0.47, "learning_rate": 0.00012012535530912584, "loss": 2.3219, "step": 37472 }, { "epoch": 0.47, "learning_rate": 0.0001200970334026591, "loss": 2.3158, "step": 37480 }, { "epoch": 0.47, "learning_rate": 0.00012006871048351716, "loss": 2.3126, "step": 37488 }, { "epoch": 0.47, "learning_rate": 0.0001200403865545406, "loss": 2.3439, "step": 37496 }, { "epoch": 0.47, "learning_rate": 0.00012001206161857013, "loss": 2.311, "step": 37504 }, { "epoch": 0.47, "learning_rate": 0.00011998373567844665, "loss": 2.3219, "step": 37512 }, { "epoch": 0.47, "learning_rate": 0.000119955408737011, "loss": 2.3139, "step": 37520 }, { "epoch": 0.47, "learning_rate": 0.00011992708079710435, "loss": 2.3104, "step": 37528 }, { "epoch": 0.47, "learning_rate": 0.0001198987518615677, "loss": 2.3077, "step": 37536 }, { "epoch": 0.47, "learning_rate": 0.00011987042193324232, "loss": 2.3353, "step": 37544 }, { "epoch": 0.47, "learning_rate": 0.00011984209101496952, "loss": 2.3075, "step": 37552 }, { "epoch": 0.47, "learning_rate": 0.00011981375910959078, "loss": 2.3164, "step": 37560 }, { "epoch": 0.47, "learning_rate": 0.00011978542621994763, "loss": 2.326, "step": 37568 }, { "epoch": 0.47, "learning_rate": 0.0001197570923488817, "loss": 2.3389, "step": 37576 }, { "epoch": 0.47, "learning_rate": 0.00011972875749923462, "loss": 2.3217, "step": 37584 }, { "epoch": 0.47, "learning_rate": 0.00011970042167384834, "loss": 2.323, "step": 37592 }, { "epoch": 0.47, "learning_rate": 0.00011967208487556474, "loss": 2.3195, "step": 37600 }, { "epoch": 0.47, "learning_rate": 0.00011964374710722581, "loss": 2.295, "step": 37608 }, { "epoch": 0.47, "learning_rate": 0.00011961540837167372, "loss": 2.3128, "step": 37616 }, { "epoch": 0.47, "learning_rate": 0.0001195870686717506, "loss": 2.3232, "step": 37624 }, { "epoch": 0.47, "learning_rate": 0.00011955872801029886, "loss": 2.3186, "step": 37632 }, { "epoch": 0.47, "learning_rate": 0.00011953038639016084, "loss": 2.3133, "step": 37640 }, { "epoch": 0.47, "learning_rate": 0.00011950204381417906, "loss": 2.3324, "step": 37648 }, { "epoch": 0.47, "learning_rate": 0.00011947370028519615, "loss": 2.3105, "step": 37656 }, { "epoch": 0.47, "learning_rate": 0.0001194453558060548, "loss": 2.3042, "step": 37664 }, { "epoch": 0.47, "learning_rate": 0.00011941701037959776, "loss": 2.3289, "step": 37672 }, { "epoch": 0.47, "learning_rate": 0.00011938866400866793, "loss": 2.3219, "step": 37680 }, { "epoch": 0.47, "learning_rate": 0.00011936031669610827, "loss": 2.2825, "step": 37688 }, { "epoch": 0.47, "learning_rate": 0.00011933196844476194, "loss": 2.3304, "step": 37696 }, { "epoch": 0.47, "learning_rate": 0.00011930361925747205, "loss": 2.3094, "step": 37704 }, { "epoch": 0.47, "learning_rate": 0.00011927526913708184, "loss": 2.3282, "step": 37712 }, { "epoch": 0.47, "learning_rate": 0.00011924691808643469, "loss": 2.3044, "step": 37720 }, { "epoch": 0.47, "learning_rate": 0.00011921856610837407, "loss": 2.328, "step": 37728 }, { "epoch": 0.47, "learning_rate": 0.00011919021320574348, "loss": 2.3204, "step": 37736 }, { "epoch": 0.47, "learning_rate": 0.0001191618593813866, "loss": 2.319, "step": 37744 }, { "epoch": 0.47, "learning_rate": 0.00011913350463814715, "loss": 2.3122, "step": 37752 }, { "epoch": 0.47, "learning_rate": 0.0001191051489788689, "loss": 2.3164, "step": 37760 }, { "epoch": 0.47, "learning_rate": 0.00011907679240639584, "loss": 2.3157, "step": 37768 }, { "epoch": 0.47, "learning_rate": 0.00011904843492357192, "loss": 2.314, "step": 37776 }, { "epoch": 0.47, "learning_rate": 0.00011902007653324123, "loss": 2.3011, "step": 37784 }, { "epoch": 0.47, "learning_rate": 0.000118991717238248, "loss": 2.3152, "step": 37792 }, { "epoch": 0.47, "learning_rate": 0.00011896335704143646, "loss": 2.3033, "step": 37800 }, { "epoch": 0.47, "learning_rate": 0.000118934995945651, "loss": 2.3245, "step": 37808 }, { "epoch": 0.47, "learning_rate": 0.00011890663395373611, "loss": 2.2987, "step": 37816 }, { "epoch": 0.47, "learning_rate": 0.00011887827106853624, "loss": 2.3125, "step": 37824 }, { "epoch": 0.47, "learning_rate": 0.00011884990729289611, "loss": 2.3229, "step": 37832 }, { "epoch": 0.47, "learning_rate": 0.0001188215426296605, "loss": 2.3146, "step": 37840 }, { "epoch": 0.47, "learning_rate": 0.00011879317708167406, "loss": 2.3037, "step": 37848 }, { "epoch": 0.47, "learning_rate": 0.00011876481065178182, "loss": 2.3309, "step": 37856 }, { "epoch": 0.47, "learning_rate": 0.00011873644334282871, "loss": 2.3224, "step": 37864 }, { "epoch": 0.47, "learning_rate": 0.00011870807515765984, "loss": 2.3274, "step": 37872 }, { "epoch": 0.47, "learning_rate": 0.00011867970609912042, "loss": 2.3, "step": 37880 }, { "epoch": 0.47, "learning_rate": 0.00011865133617005562, "loss": 2.3231, "step": 37888 }, { "epoch": 0.47, "learning_rate": 0.00011862296537331084, "loss": 2.3028, "step": 37896 }, { "epoch": 0.47, "learning_rate": 0.00011859459371173147, "loss": 2.3247, "step": 37904 }, { "epoch": 0.47, "learning_rate": 0.00011856622118816307, "loss": 2.328, "step": 37912 }, { "epoch": 0.47, "learning_rate": 0.00011853784780545123, "loss": 2.3142, "step": 37920 }, { "epoch": 0.47, "learning_rate": 0.00011850947356644162, "loss": 2.3235, "step": 37928 }, { "epoch": 0.47, "learning_rate": 0.00011848109847398003, "loss": 2.3164, "step": 37936 }, { "epoch": 0.47, "learning_rate": 0.00011845272253091234, "loss": 2.3243, "step": 37944 }, { "epoch": 0.47, "learning_rate": 0.00011842434574008445, "loss": 2.3184, "step": 37952 }, { "epoch": 0.47, "learning_rate": 0.00011839596810434239, "loss": 2.3332, "step": 37960 }, { "epoch": 0.47, "learning_rate": 0.00011836758962653236, "loss": 2.3311, "step": 37968 }, { "epoch": 0.47, "learning_rate": 0.00011833921030950048, "loss": 2.283, "step": 37976 }, { "epoch": 0.47, "learning_rate": 0.00011831083015609306, "loss": 2.305, "step": 37984 }, { "epoch": 0.47, "learning_rate": 0.00011828244916915645, "loss": 2.3127, "step": 37992 }, { "epoch": 0.47, "learning_rate": 0.00011825406735153712, "loss": 2.3114, "step": 38000 }, { "epoch": 0.48, "learning_rate": 0.00011822568470608164, "loss": 2.2898, "step": 38008 }, { "epoch": 0.48, "learning_rate": 0.0001181973012356366, "loss": 2.294, "step": 38016 }, { "epoch": 0.48, "learning_rate": 0.00011816891694304865, "loss": 2.3258, "step": 38024 }, { "epoch": 0.48, "learning_rate": 0.00011814053183116463, "loss": 2.3146, "step": 38032 }, { "epoch": 0.48, "learning_rate": 0.00011811214590283141, "loss": 2.3118, "step": 38040 }, { "epoch": 0.48, "learning_rate": 0.00011808375916089592, "loss": 2.319, "step": 38048 }, { "epoch": 0.48, "learning_rate": 0.00011805537160820517, "loss": 2.3343, "step": 38056 }, { "epoch": 0.48, "learning_rate": 0.0001180269832476063, "loss": 2.3238, "step": 38064 }, { "epoch": 0.48, "learning_rate": 0.00011799859408194651, "loss": 2.3064, "step": 38072 }, { "epoch": 0.48, "learning_rate": 0.00011797020411407305, "loss": 2.2943, "step": 38080 }, { "epoch": 0.48, "learning_rate": 0.00011794181334683327, "loss": 2.3138, "step": 38088 }, { "epoch": 0.48, "learning_rate": 0.0001179134217830746, "loss": 2.3178, "step": 38096 }, { "epoch": 0.48, "learning_rate": 0.0001178850294256446, "loss": 2.3185, "step": 38104 }, { "epoch": 0.48, "learning_rate": 0.0001178566362773908, "loss": 2.3068, "step": 38112 }, { "epoch": 0.48, "learning_rate": 0.00011782824234116092, "loss": 2.3225, "step": 38120 }, { "epoch": 0.48, "learning_rate": 0.00011779984761980268, "loss": 2.3259, "step": 38128 }, { "epoch": 0.48, "learning_rate": 0.00011777145211616392, "loss": 2.3123, "step": 38136 }, { "epoch": 0.48, "learning_rate": 0.00011774305583309257, "loss": 2.3154, "step": 38144 }, { "epoch": 0.48, "learning_rate": 0.00011771465877343658, "loss": 2.3124, "step": 38152 }, { "epoch": 0.48, "learning_rate": 0.000117686260940044, "loss": 2.3111, "step": 38160 }, { "epoch": 0.48, "learning_rate": 0.00011765786233576302, "loss": 2.2979, "step": 38168 }, { "epoch": 0.48, "learning_rate": 0.00011762946296344184, "loss": 2.3212, "step": 38176 }, { "epoch": 0.48, "learning_rate": 0.00011760106282592876, "loss": 2.333, "step": 38184 }, { "epoch": 0.48, "learning_rate": 0.00011757266192607212, "loss": 2.2995, "step": 38192 }, { "epoch": 0.48, "learning_rate": 0.00011754426026672045, "loss": 2.3076, "step": 38200 }, { "epoch": 0.48, "learning_rate": 0.00011751585785072218, "loss": 2.3159, "step": 38208 }, { "epoch": 0.48, "learning_rate": 0.00011748745468092599, "loss": 2.3275, "step": 38216 }, { "epoch": 0.48, "learning_rate": 0.00011745905076018048, "loss": 2.3247, "step": 38224 }, { "epoch": 0.48, "learning_rate": 0.00011743064609133448, "loss": 2.3027, "step": 38232 }, { "epoch": 0.48, "learning_rate": 0.00011740224067723678, "loss": 2.3414, "step": 38240 }, { "epoch": 0.48, "learning_rate": 0.00011737383452073628, "loss": 2.3372, "step": 38248 }, { "epoch": 0.48, "learning_rate": 0.00011734542762468193, "loss": 2.3117, "step": 38256 }, { "epoch": 0.48, "learning_rate": 0.00011731701999192282, "loss": 2.3179, "step": 38264 }, { "epoch": 0.48, "learning_rate": 0.00011728861162530809, "loss": 2.3148, "step": 38272 }, { "epoch": 0.48, "learning_rate": 0.00011726020252768691, "loss": 2.3098, "step": 38280 }, { "epoch": 0.48, "learning_rate": 0.00011723179270190857, "loss": 2.3142, "step": 38288 }, { "epoch": 0.48, "learning_rate": 0.00011720338215082234, "loss": 2.3194, "step": 38296 }, { "epoch": 0.48, "learning_rate": 0.00011717497087727773, "loss": 2.3348, "step": 38304 }, { "epoch": 0.48, "learning_rate": 0.00011714655888412421, "loss": 2.3006, "step": 38312 }, { "epoch": 0.48, "learning_rate": 0.00011711814617421132, "loss": 2.3151, "step": 38320 }, { "epoch": 0.48, "learning_rate": 0.0001170897327503887, "loss": 2.3295, "step": 38328 }, { "epoch": 0.48, "learning_rate": 0.00011706131861550607, "loss": 2.3098, "step": 38336 }, { "epoch": 0.48, "learning_rate": 0.00011703290377241318, "loss": 2.3393, "step": 38344 }, { "epoch": 0.48, "learning_rate": 0.00011700448822395988, "loss": 2.3019, "step": 38352 }, { "epoch": 0.48, "learning_rate": 0.00011697607197299611, "loss": 2.2937, "step": 38360 }, { "epoch": 0.48, "learning_rate": 0.00011694765502237188, "loss": 2.3271, "step": 38368 }, { "epoch": 0.48, "learning_rate": 0.0001169192373749372, "loss": 2.327, "step": 38376 }, { "epoch": 0.48, "learning_rate": 0.00011689081903354221, "loss": 2.3241, "step": 38384 }, { "epoch": 0.48, "learning_rate": 0.0001168624000010371, "loss": 2.3222, "step": 38392 }, { "epoch": 0.48, "learning_rate": 0.00011683398028027217, "loss": 2.323, "step": 38400 }, { "epoch": 0.48, "learning_rate": 0.00011680555987409776, "loss": 2.315, "step": 38408 }, { "epoch": 0.48, "learning_rate": 0.00011677713878536425, "loss": 2.3028, "step": 38416 }, { "epoch": 0.48, "learning_rate": 0.00011674871701692209, "loss": 2.3153, "step": 38424 }, { "epoch": 0.48, "learning_rate": 0.00011672029457162188, "loss": 2.3182, "step": 38432 }, { "epoch": 0.48, "learning_rate": 0.00011669187145231421, "loss": 2.3148, "step": 38440 }, { "epoch": 0.48, "learning_rate": 0.00011666344766184973, "loss": 2.303, "step": 38448 }, { "epoch": 0.48, "learning_rate": 0.00011663502320307923, "loss": 2.3174, "step": 38456 }, { "epoch": 0.48, "learning_rate": 0.00011660659807885348, "loss": 2.331, "step": 38464 }, { "epoch": 0.48, "learning_rate": 0.00011657817229202339, "loss": 2.3161, "step": 38472 }, { "epoch": 0.48, "learning_rate": 0.00011654974584543989, "loss": 2.3191, "step": 38480 }, { "epoch": 0.48, "learning_rate": 0.000116521318741954, "loss": 2.3164, "step": 38488 }, { "epoch": 0.48, "learning_rate": 0.00011649289098441678, "loss": 2.3036, "step": 38496 }, { "epoch": 0.48, "learning_rate": 0.0001164644625756794, "loss": 2.3209, "step": 38504 }, { "epoch": 0.48, "learning_rate": 0.00011643603351859302, "loss": 2.3136, "step": 38512 }, { "epoch": 0.48, "learning_rate": 0.00011640760381600899, "loss": 2.3291, "step": 38520 }, { "epoch": 0.48, "learning_rate": 0.00011637917347077856, "loss": 2.3013, "step": 38528 }, { "epoch": 0.48, "learning_rate": 0.0001163507424857532, "loss": 2.2992, "step": 38536 }, { "epoch": 0.48, "learning_rate": 0.00011632231086378438, "loss": 2.3215, "step": 38544 }, { "epoch": 0.48, "learning_rate": 0.00011629387860772358, "loss": 2.3334, "step": 38552 }, { "epoch": 0.48, "learning_rate": 0.00011626544572042239, "loss": 2.3236, "step": 38560 }, { "epoch": 0.48, "learning_rate": 0.00011623701220473255, "loss": 2.32, "step": 38568 }, { "epoch": 0.48, "learning_rate": 0.0001162085780635057, "loss": 2.3021, "step": 38576 }, { "epoch": 0.48, "learning_rate": 0.00011618014329959366, "loss": 2.3234, "step": 38584 }, { "epoch": 0.48, "learning_rate": 0.00011615170791584824, "loss": 2.2908, "step": 38592 }, { "epoch": 0.48, "learning_rate": 0.0001161232719151214, "loss": 2.3176, "step": 38600 }, { "epoch": 0.48, "learning_rate": 0.00011609483530026508, "loss": 2.3169, "step": 38608 }, { "epoch": 0.48, "learning_rate": 0.00011606639807413129, "loss": 2.3297, "step": 38616 }, { "epoch": 0.48, "learning_rate": 0.00011603796023957218, "loss": 2.3018, "step": 38624 }, { "epoch": 0.48, "learning_rate": 0.00011600952179943987, "loss": 2.2942, "step": 38632 }, { "epoch": 0.48, "learning_rate": 0.00011598108275658655, "loss": 2.3208, "step": 38640 }, { "epoch": 0.48, "learning_rate": 0.00011595264311386453, "loss": 2.3259, "step": 38648 }, { "epoch": 0.48, "learning_rate": 0.00011592420287412616, "loss": 2.3124, "step": 38656 }, { "epoch": 0.48, "learning_rate": 0.00011589576204022377, "loss": 2.3131, "step": 38664 }, { "epoch": 0.48, "learning_rate": 0.00011586732061500986, "loss": 2.325, "step": 38672 }, { "epoch": 0.48, "learning_rate": 0.00011583887860133697, "loss": 2.3, "step": 38680 }, { "epoch": 0.48, "learning_rate": 0.00011581043600205761, "loss": 2.295, "step": 38688 }, { "epoch": 0.48, "learning_rate": 0.00011578199282002447, "loss": 2.3361, "step": 38696 }, { "epoch": 0.48, "learning_rate": 0.00011575354905809017, "loss": 2.2889, "step": 38704 }, { "epoch": 0.48, "learning_rate": 0.00011572510471910755, "loss": 2.3189, "step": 38712 }, { "epoch": 0.48, "learning_rate": 0.00011569665980592936, "loss": 2.2983, "step": 38720 }, { "epoch": 0.48, "learning_rate": 0.00011566821432140844, "loss": 2.2947, "step": 38728 }, { "epoch": 0.48, "learning_rate": 0.00011563976826839775, "loss": 2.3158, "step": 38736 }, { "epoch": 0.48, "learning_rate": 0.00011561132164975028, "loss": 2.3284, "step": 38744 }, { "epoch": 0.48, "learning_rate": 0.00011558287446831901, "loss": 2.3124, "step": 38752 }, { "epoch": 0.48, "learning_rate": 0.00011555442672695711, "loss": 2.3056, "step": 38760 }, { "epoch": 0.48, "learning_rate": 0.00011552597842851767, "loss": 2.3164, "step": 38768 }, { "epoch": 0.48, "learning_rate": 0.00011549752957585387, "loss": 2.3147, "step": 38776 }, { "epoch": 0.48, "learning_rate": 0.00011546908017181906, "loss": 2.308, "step": 38784 }, { "epoch": 0.48, "learning_rate": 0.00011544063021926645, "loss": 2.3277, "step": 38792 }, { "epoch": 0.48, "learning_rate": 0.00011541217972104946, "loss": 2.3112, "step": 38800 }, { "epoch": 0.49, "learning_rate": 0.00011538372868002154, "loss": 2.2954, "step": 38808 }, { "epoch": 0.49, "learning_rate": 0.00011535527709903611, "loss": 2.3225, "step": 38816 }, { "epoch": 0.49, "learning_rate": 0.00011532682498094676, "loss": 2.315, "step": 38824 }, { "epoch": 0.49, "learning_rate": 0.00011529837232860701, "loss": 2.3046, "step": 38832 }, { "epoch": 0.49, "learning_rate": 0.00011526991914487058, "loss": 2.3362, "step": 38840 }, { "epoch": 0.49, "learning_rate": 0.00011524146543259111, "loss": 2.3121, "step": 38848 }, { "epoch": 0.49, "learning_rate": 0.00011521301119462236, "loss": 2.3073, "step": 38856 }, { "epoch": 0.49, "learning_rate": 0.00011518455643381809, "loss": 2.3177, "step": 38864 }, { "epoch": 0.49, "learning_rate": 0.00011515610115303222, "loss": 2.3036, "step": 38872 }, { "epoch": 0.49, "learning_rate": 0.00011512764535511861, "loss": 2.3274, "step": 38880 }, { "epoch": 0.49, "learning_rate": 0.00011509918904293122, "loss": 2.3093, "step": 38888 }, { "epoch": 0.49, "learning_rate": 0.00011507073221932407, "loss": 2.3014, "step": 38896 }, { "epoch": 0.49, "learning_rate": 0.00011504227488715122, "loss": 2.3243, "step": 38904 }, { "epoch": 0.49, "learning_rate": 0.00011501381704926678, "loss": 2.3211, "step": 38912 }, { "epoch": 0.49, "learning_rate": 0.00011498535870852485, "loss": 2.3233, "step": 38920 }, { "epoch": 0.49, "learning_rate": 0.00011495689986777973, "loss": 2.3115, "step": 38928 }, { "epoch": 0.49, "learning_rate": 0.00011492844052988565, "loss": 2.319, "step": 38936 }, { "epoch": 0.49, "learning_rate": 0.00011489998069769688, "loss": 2.3161, "step": 38944 }, { "epoch": 0.49, "learning_rate": 0.00011487152037406783, "loss": 2.3085, "step": 38952 }, { "epoch": 0.49, "learning_rate": 0.00011484305956185288, "loss": 2.3102, "step": 38960 }, { "epoch": 0.49, "learning_rate": 0.00011481459826390648, "loss": 2.3186, "step": 38968 }, { "epoch": 0.49, "learning_rate": 0.00011478613648308319, "loss": 2.3204, "step": 38976 }, { "epoch": 0.49, "learning_rate": 0.00011475767422223753, "loss": 2.3064, "step": 38984 }, { "epoch": 0.49, "learning_rate": 0.00011472921148422411, "loss": 2.3127, "step": 38992 }, { "epoch": 0.49, "learning_rate": 0.00011470074827189752, "loss": 2.3052, "step": 39000 }, { "epoch": 0.49, "learning_rate": 0.00011467228458811257, "loss": 2.3219, "step": 39008 }, { "epoch": 0.49, "learning_rate": 0.00011464382043572392, "loss": 2.3244, "step": 39016 }, { "epoch": 0.49, "learning_rate": 0.00011461535581758643, "loss": 2.3035, "step": 39024 }, { "epoch": 0.49, "learning_rate": 0.00011458689073655484, "loss": 2.3157, "step": 39032 }, { "epoch": 0.49, "learning_rate": 0.00011455842519548416, "loss": 2.3044, "step": 39040 }, { "epoch": 0.49, "learning_rate": 0.00011452995919722924, "loss": 2.3036, "step": 39048 }, { "epoch": 0.49, "learning_rate": 0.00011450149274464507, "loss": 2.3129, "step": 39056 }, { "epoch": 0.49, "learning_rate": 0.0001144730258405867, "loss": 2.3054, "step": 39064 }, { "epoch": 0.49, "learning_rate": 0.00011444455848790918, "loss": 2.3219, "step": 39072 }, { "epoch": 0.49, "learning_rate": 0.00011441609068946764, "loss": 2.3145, "step": 39080 }, { "epoch": 0.49, "learning_rate": 0.00011438762244811722, "loss": 2.3103, "step": 39088 }, { "epoch": 0.49, "learning_rate": 0.00011435915376671313, "loss": 2.3282, "step": 39096 }, { "epoch": 0.49, "learning_rate": 0.00011433068464811058, "loss": 2.3122, "step": 39104 }, { "epoch": 0.49, "learning_rate": 0.00011430221509516495, "loss": 2.344, "step": 39112 }, { "epoch": 0.49, "learning_rate": 0.00011427374511073152, "loss": 2.3051, "step": 39120 }, { "epoch": 0.49, "learning_rate": 0.00011424527469766566, "loss": 2.324, "step": 39128 }, { "epoch": 0.49, "learning_rate": 0.00011421680385882279, "loss": 2.3402, "step": 39136 }, { "epoch": 0.49, "learning_rate": 0.00011418833259705839, "loss": 2.3191, "step": 39144 }, { "epoch": 0.49, "learning_rate": 0.00011415986091522797, "loss": 2.29, "step": 39152 }, { "epoch": 0.49, "learning_rate": 0.00011413138881618707, "loss": 2.306, "step": 39160 }, { "epoch": 0.49, "learning_rate": 0.00011410291630279127, "loss": 2.3219, "step": 39168 }, { "epoch": 0.49, "learning_rate": 0.00011407444337789624, "loss": 2.3063, "step": 39176 }, { "epoch": 0.49, "learning_rate": 0.00011404597004435762, "loss": 2.3045, "step": 39184 }, { "epoch": 0.49, "learning_rate": 0.00011401749630503109, "loss": 2.2954, "step": 39192 }, { "epoch": 0.49, "learning_rate": 0.0001139890221627725, "loss": 2.3349, "step": 39200 }, { "epoch": 0.49, "learning_rate": 0.00011396054762043758, "loss": 2.3137, "step": 39208 }, { "epoch": 0.49, "learning_rate": 0.00011393207268088215, "loss": 2.3245, "step": 39216 }, { "epoch": 0.49, "learning_rate": 0.00011390359734696212, "loss": 2.2768, "step": 39224 }, { "epoch": 0.49, "learning_rate": 0.00011387512162153338, "loss": 2.3144, "step": 39232 }, { "epoch": 0.49, "learning_rate": 0.00011384664550745193, "loss": 2.318, "step": 39240 }, { "epoch": 0.49, "learning_rate": 0.00011381816900757371, "loss": 2.3161, "step": 39248 }, { "epoch": 0.49, "learning_rate": 0.00011378969212475481, "loss": 2.302, "step": 39256 }, { "epoch": 0.49, "learning_rate": 0.00011376121486185121, "loss": 2.3046, "step": 39264 }, { "epoch": 0.49, "learning_rate": 0.00011373273722171908, "loss": 2.3222, "step": 39272 }, { "epoch": 0.49, "learning_rate": 0.00011370425920721459, "loss": 2.3058, "step": 39280 }, { "epoch": 0.49, "learning_rate": 0.00011367578082119387, "loss": 2.3222, "step": 39288 }, { "epoch": 0.49, "learning_rate": 0.00011364730206651318, "loss": 2.315, "step": 39296 }, { "epoch": 0.49, "learning_rate": 0.00011361882294602873, "loss": 2.3385, "step": 39304 }, { "epoch": 0.49, "learning_rate": 0.00011359034346259687, "loss": 2.3115, "step": 39312 }, { "epoch": 0.49, "learning_rate": 0.00011356186361907388, "loss": 2.3016, "step": 39320 }, { "epoch": 0.49, "learning_rate": 0.00011353338341831619, "loss": 2.3079, "step": 39328 }, { "epoch": 0.49, "learning_rate": 0.00011350490286318014, "loss": 2.3184, "step": 39336 }, { "epoch": 0.49, "learning_rate": 0.0001134764219565222, "loss": 2.3163, "step": 39344 }, { "epoch": 0.49, "learning_rate": 0.00011344794070119882, "loss": 2.3195, "step": 39352 }, { "epoch": 0.49, "learning_rate": 0.00011341945910006655, "loss": 2.3059, "step": 39360 }, { "epoch": 0.49, "learning_rate": 0.00011339097715598186, "loss": 2.3092, "step": 39368 }, { "epoch": 0.49, "learning_rate": 0.00011336249487180145, "loss": 2.311, "step": 39376 }, { "epoch": 0.49, "learning_rate": 0.0001133340122503818, "loss": 2.293, "step": 39384 }, { "epoch": 0.49, "learning_rate": 0.00011330552929457966, "loss": 2.3154, "step": 39392 }, { "epoch": 0.49, "learning_rate": 0.00011327704600725158, "loss": 2.3334, "step": 39400 }, { "epoch": 0.49, "learning_rate": 0.00011324856239125441, "loss": 2.3094, "step": 39408 }, { "epoch": 0.49, "learning_rate": 0.00011322007844944485, "loss": 2.3285, "step": 39416 }, { "epoch": 0.49, "learning_rate": 0.00011319159418467966, "loss": 2.3027, "step": 39424 }, { "epoch": 0.49, "learning_rate": 0.00011316310959981562, "loss": 2.337, "step": 39432 }, { "epoch": 0.49, "learning_rate": 0.00011313462469770966, "loss": 2.3262, "step": 39440 }, { "epoch": 0.49, "learning_rate": 0.00011310613948121859, "loss": 2.3312, "step": 39448 }, { "epoch": 0.49, "learning_rate": 0.00011307765395319932, "loss": 2.2959, "step": 39456 }, { "epoch": 0.49, "learning_rate": 0.00011304916811650879, "loss": 2.3287, "step": 39464 }, { "epoch": 0.49, "learning_rate": 0.000113020681974004, "loss": 2.3087, "step": 39472 }, { "epoch": 0.49, "learning_rate": 0.00011299219552854192, "loss": 2.3186, "step": 39480 }, { "epoch": 0.49, "learning_rate": 0.00011296370878297957, "loss": 2.2957, "step": 39488 }, { "epoch": 0.49, "learning_rate": 0.00011293522174017404, "loss": 2.3167, "step": 39496 }, { "epoch": 0.49, "learning_rate": 0.00011290673440298236, "loss": 2.3186, "step": 39504 }, { "epoch": 0.49, "learning_rate": 0.00011287824677426175, "loss": 2.3165, "step": 39512 }, { "epoch": 0.49, "learning_rate": 0.00011284975885686926, "loss": 2.2917, "step": 39520 }, { "epoch": 0.49, "learning_rate": 0.0001128212706536621, "loss": 2.3281, "step": 39528 }, { "epoch": 0.49, "learning_rate": 0.00011279278216749749, "loss": 2.2977, "step": 39536 }, { "epoch": 0.49, "learning_rate": 0.00011276429340123265, "loss": 2.3101, "step": 39544 }, { "epoch": 0.49, "learning_rate": 0.00011273580435772486, "loss": 2.2923, "step": 39552 }, { "epoch": 0.49, "learning_rate": 0.00011270731503983141, "loss": 2.3002, "step": 39560 }, { "epoch": 0.49, "learning_rate": 0.00011267882545040953, "loss": 2.3354, "step": 39568 }, { "epoch": 0.49, "learning_rate": 0.0001126503355923167, "loss": 2.3142, "step": 39576 }, { "epoch": 0.49, "learning_rate": 0.0001126218454684102, "loss": 2.2916, "step": 39584 }, { "epoch": 0.49, "learning_rate": 0.00011259335508154747, "loss": 2.2948, "step": 39592 }, { "epoch": 0.49, "learning_rate": 0.00011256486443458591, "loss": 2.325, "step": 39600 }, { "epoch": 0.5, "learning_rate": 0.000112536373530383, "loss": 2.3238, "step": 39608 }, { "epoch": 0.5, "learning_rate": 0.00011250788237179617, "loss": 2.3006, "step": 39616 }, { "epoch": 0.5, "learning_rate": 0.00011247939096168297, "loss": 2.3277, "step": 39624 }, { "epoch": 0.5, "learning_rate": 0.00011245089930290089, "loss": 2.3121, "step": 39632 }, { "epoch": 0.5, "learning_rate": 0.00011242240739830749, "loss": 2.3125, "step": 39640 }, { "epoch": 0.5, "learning_rate": 0.0001123939152507604, "loss": 2.307, "step": 39648 }, { "epoch": 0.5, "learning_rate": 0.00011236542286311713, "loss": 2.283, "step": 39656 }, { "epoch": 0.5, "learning_rate": 0.00011233693023823539, "loss": 2.2993, "step": 39664 }, { "epoch": 0.5, "learning_rate": 0.00011230843737897274, "loss": 2.3332, "step": 39672 }, { "epoch": 0.5, "learning_rate": 0.00011227994428818691, "loss": 2.3127, "step": 39680 }, { "epoch": 0.5, "learning_rate": 0.00011225145096873561, "loss": 2.3107, "step": 39688 }, { "epoch": 0.5, "learning_rate": 0.00011222295742347653, "loss": 2.3024, "step": 39696 }, { "epoch": 0.5, "learning_rate": 0.00011219446365526742, "loss": 2.3242, "step": 39704 }, { "epoch": 0.5, "learning_rate": 0.00011216596966696602, "loss": 2.3285, "step": 39712 }, { "epoch": 0.5, "learning_rate": 0.00011213747546143014, "loss": 2.2696, "step": 39720 }, { "epoch": 0.5, "learning_rate": 0.00011210898104151761, "loss": 2.2993, "step": 39728 }, { "epoch": 0.5, "learning_rate": 0.00011208048641008621, "loss": 2.273, "step": 39736 }, { "epoch": 0.5, "learning_rate": 0.00011205199156999381, "loss": 2.3094, "step": 39744 }, { "epoch": 0.5, "learning_rate": 0.0001120234965240983, "loss": 2.316, "step": 39752 }, { "epoch": 0.5, "learning_rate": 0.00011199500127525753, "loss": 2.3134, "step": 39760 }, { "epoch": 0.5, "learning_rate": 0.00011196650582632946, "loss": 2.3003, "step": 39768 }, { "epoch": 0.5, "learning_rate": 0.00011193801018017198, "loss": 2.3021, "step": 39776 }, { "epoch": 0.5, "learning_rate": 0.00011190951433964305, "loss": 2.3161, "step": 39784 }, { "epoch": 0.5, "learning_rate": 0.00011188101830760067, "loss": 2.3021, "step": 39792 }, { "epoch": 0.5, "learning_rate": 0.00011185252208690282, "loss": 2.324, "step": 39800 }, { "epoch": 0.5, "learning_rate": 0.00011182402568040749, "loss": 2.3121, "step": 39808 }, { "epoch": 0.5, "learning_rate": 0.0001117955290909727, "loss": 2.302, "step": 39816 }, { "epoch": 0.5, "learning_rate": 0.00011176703232145655, "loss": 2.3075, "step": 39824 }, { "epoch": 0.5, "learning_rate": 0.00011173853537471709, "loss": 2.3194, "step": 39832 }, { "epoch": 0.5, "learning_rate": 0.00011171003825361233, "loss": 2.3229, "step": 39840 }, { "epoch": 0.5, "learning_rate": 0.00011168154096100046, "loss": 2.3115, "step": 39848 }, { "epoch": 0.5, "learning_rate": 0.0001116530434997395, "loss": 2.3026, "step": 39856 }, { "epoch": 0.5, "learning_rate": 0.00011162454587268774, "loss": 2.3199, "step": 39864 }, { "epoch": 0.5, "learning_rate": 0.00011159604808270314, "loss": 2.3086, "step": 39872 }, { "epoch": 0.5, "learning_rate": 0.00011156755013264401, "loss": 2.3299, "step": 39880 }, { "epoch": 0.5, "learning_rate": 0.0001115390520253685, "loss": 2.2996, "step": 39888 }, { "epoch": 0.5, "learning_rate": 0.00011151055376373476, "loss": 2.308, "step": 39896 }, { "epoch": 0.5, "learning_rate": 0.00011148205535060106, "loss": 2.324, "step": 39904 }, { "epoch": 0.5, "learning_rate": 0.00011145355678882558, "loss": 2.3061, "step": 39912 }, { "epoch": 0.5, "learning_rate": 0.0001114250580812666, "loss": 2.3108, "step": 39920 }, { "epoch": 0.5, "learning_rate": 0.00011139655923078238, "loss": 2.2693, "step": 39928 }, { "epoch": 0.5, "learning_rate": 0.00011136806024023119, "loss": 2.3138, "step": 39936 }, { "epoch": 0.5, "learning_rate": 0.00011133956111247126, "loss": 2.312, "step": 39944 }, { "epoch": 0.5, "learning_rate": 0.00011131106185036099, "loss": 2.3129, "step": 39952 }, { "epoch": 0.5, "learning_rate": 0.00011128256245675863, "loss": 2.3095, "step": 39960 }, { "epoch": 0.5, "learning_rate": 0.00011125406293452252, "loss": 2.2999, "step": 39968 }, { "epoch": 0.5, "learning_rate": 0.00011122556328651099, "loss": 2.3004, "step": 39976 }, { "epoch": 0.5, "learning_rate": 0.00011119706351558243, "loss": 2.3131, "step": 39984 }, { "epoch": 0.5, "learning_rate": 0.00011116856362459517, "loss": 2.3082, "step": 39992 }, { "epoch": 0.5, "learning_rate": 0.00011114006361640766, "loss": 2.3248, "step": 40000 }, { "epoch": 0.5, "learning_rate": 0.00011111156349387812, "loss": 2.3204, "step": 40008 }, { "epoch": 0.5, "learning_rate": 0.00011108306325986513, "loss": 2.3051, "step": 40016 }, { "epoch": 0.5, "learning_rate": 0.000111054562917227, "loss": 2.2978, "step": 40024 }, { "epoch": 0.5, "learning_rate": 0.0001110260624688222, "loss": 2.3146, "step": 40032 }, { "epoch": 0.5, "learning_rate": 0.00011099756191750917, "loss": 2.2796, "step": 40040 }, { "epoch": 0.5, "learning_rate": 0.00011096906126614632, "loss": 2.3304, "step": 40048 }, { "epoch": 0.5, "learning_rate": 0.00011094056051759212, "loss": 2.3289, "step": 40056 }, { "epoch": 0.5, "learning_rate": 0.00011091205967470502, "loss": 2.2966, "step": 40064 }, { "epoch": 0.5, "learning_rate": 0.00011088355874034346, "loss": 2.327, "step": 40072 }, { "epoch": 0.5, "learning_rate": 0.00011085505771736602, "loss": 2.3346, "step": 40080 }, { "epoch": 0.5, "learning_rate": 0.00011082655660863113, "loss": 2.3055, "step": 40088 }, { "epoch": 0.5, "learning_rate": 0.00011079805541699728, "loss": 2.3125, "step": 40096 }, { "epoch": 0.5, "learning_rate": 0.000110769554145323, "loss": 2.3026, "step": 40104 }, { "epoch": 0.5, "learning_rate": 0.0001107410527964668, "loss": 2.3164, "step": 40112 }, { "epoch": 0.5, "learning_rate": 0.0001107125513732872, "loss": 2.2912, "step": 40120 }, { "epoch": 0.5, "learning_rate": 0.00011068404987864276, "loss": 2.3167, "step": 40128 }, { "epoch": 0.5, "learning_rate": 0.00011065554831539195, "loss": 2.2963, "step": 40136 }, { "epoch": 0.5, "learning_rate": 0.00011062704668639338, "loss": 2.306, "step": 40144 }, { "epoch": 0.5, "learning_rate": 0.0001105985449945056, "loss": 2.2963, "step": 40152 }, { "epoch": 0.5, "learning_rate": 0.0001105700432425871, "loss": 2.3024, "step": 40160 }, { "epoch": 0.5, "learning_rate": 0.00011054154143349656, "loss": 2.2982, "step": 40168 }, { "epoch": 0.5, "learning_rate": 0.00011051303957009242, "loss": 2.3268, "step": 40176 }, { "epoch": 0.5, "learning_rate": 0.00011048453765523337, "loss": 2.2912, "step": 40184 }, { "epoch": 0.5, "learning_rate": 0.00011045603569177789, "loss": 2.3089, "step": 40192 }, { "epoch": 0.5, "learning_rate": 0.00011042753368258465, "loss": 2.2939, "step": 40200 }, { "epoch": 0.5, "learning_rate": 0.00011039903163051217, "loss": 2.3153, "step": 40208 }, { "epoch": 0.5, "learning_rate": 0.00011037052953841914, "loss": 2.3241, "step": 40216 }, { "epoch": 0.5, "learning_rate": 0.00011034202740916404, "loss": 2.326, "step": 40224 }, { "epoch": 0.5, "learning_rate": 0.00011031352524560554, "loss": 2.3158, "step": 40232 }, { "epoch": 0.5, "learning_rate": 0.00011028502305060222, "loss": 2.3167, "step": 40240 }, { "epoch": 0.5, "learning_rate": 0.00011025652082701273, "loss": 2.3003, "step": 40248 }, { "epoch": 0.5, "learning_rate": 0.00011022801857769565, "loss": 2.3132, "step": 40256 }, { "epoch": 0.5, "learning_rate": 0.00011019951630550962, "loss": 2.3101, "step": 40264 }, { "epoch": 0.5, "learning_rate": 0.00011017101401331317, "loss": 2.3139, "step": 40272 }, { "epoch": 0.5, "learning_rate": 0.00011014251170396504, "loss": 2.3024, "step": 40280 }, { "epoch": 0.5, "learning_rate": 0.00011011400938032377, "loss": 2.2991, "step": 40288 }, { "epoch": 0.5, "learning_rate": 0.000110085507045248, "loss": 2.3013, "step": 40296 }, { "epoch": 0.5, "learning_rate": 0.00011005700470159639, "loss": 2.3226, "step": 40304 }, { "epoch": 0.5, "learning_rate": 0.00011002850235222751, "loss": 2.308, "step": 40312 }, { "epoch": 0.5, "learning_rate": 0.00011000000000000002, "loss": 2.3367, "step": 40320 }, { "epoch": 0.5, "learning_rate": 0.0001099714976477725, "loss": 2.324, "step": 40328 }, { "epoch": 0.5, "learning_rate": 0.00010994299529840364, "loss": 2.3037, "step": 40336 }, { "epoch": 0.5, "learning_rate": 0.000109914492954752, "loss": 2.3332, "step": 40344 }, { "epoch": 0.5, "learning_rate": 0.00010988599061967626, "loss": 2.2995, "step": 40352 }, { "epoch": 0.5, "learning_rate": 0.000109857488296035, "loss": 2.3043, "step": 40360 }, { "epoch": 0.5, "learning_rate": 0.00010982898598668685, "loss": 2.3345, "step": 40368 }, { "epoch": 0.5, "learning_rate": 0.00010980048369449041, "loss": 2.3242, "step": 40376 }, { "epoch": 0.5, "learning_rate": 0.00010977198142230436, "loss": 2.3171, "step": 40384 }, { "epoch": 0.5, "learning_rate": 0.00010974347917298731, "loss": 2.3113, "step": 40392 }, { "epoch": 0.51, "learning_rate": 0.0001097149769493978, "loss": 2.3076, "step": 40400 }, { "epoch": 0.51, "learning_rate": 0.00010968647475439448, "loss": 2.2891, "step": 40408 }, { "epoch": 0.51, "learning_rate": 0.00010965797259083599, "loss": 2.316, "step": 40416 }, { "epoch": 0.51, "learning_rate": 0.00010962947046158092, "loss": 2.3197, "step": 40424 }, { "epoch": 0.51, "learning_rate": 0.00010960096836948784, "loss": 2.296, "step": 40432 }, { "epoch": 0.51, "learning_rate": 0.00010957246631741537, "loss": 2.2941, "step": 40440 }, { "epoch": 0.51, "learning_rate": 0.00010954396430822213, "loss": 2.3092, "step": 40448 }, { "epoch": 0.51, "learning_rate": 0.00010951546234476666, "loss": 2.3177, "step": 40456 }, { "epoch": 0.51, "learning_rate": 0.00010948696042990758, "loss": 2.3084, "step": 40464 }, { "epoch": 0.51, "learning_rate": 0.00010945845856650348, "loss": 2.335, "step": 40472 }, { "epoch": 0.51, "learning_rate": 0.0001094299567574129, "loss": 2.3034, "step": 40480 }, { "epoch": 0.51, "learning_rate": 0.00010940145500549444, "loss": 2.312, "step": 40488 }, { "epoch": 0.51, "learning_rate": 0.00010937295331360664, "loss": 2.3106, "step": 40496 }, { "epoch": 0.51, "learning_rate": 0.00010934445168460808, "loss": 2.3026, "step": 40504 }, { "epoch": 0.51, "learning_rate": 0.00010931595012135727, "loss": 2.2865, "step": 40512 }, { "epoch": 0.51, "learning_rate": 0.0001092874486267128, "loss": 2.3102, "step": 40520 }, { "epoch": 0.51, "learning_rate": 0.00010925894720353322, "loss": 2.3152, "step": 40528 }, { "epoch": 0.51, "learning_rate": 0.00010923044585467703, "loss": 2.293, "step": 40536 }, { "epoch": 0.51, "learning_rate": 0.00010920194458300273, "loss": 2.3052, "step": 40544 }, { "epoch": 0.51, "learning_rate": 0.0001091734433913689, "loss": 2.2823, "step": 40552 }, { "epoch": 0.51, "learning_rate": 0.00010914494228263398, "loss": 2.3042, "step": 40560 }, { "epoch": 0.51, "learning_rate": 0.00010911644125965657, "loss": 2.2974, "step": 40568 }, { "epoch": 0.51, "learning_rate": 0.00010908794032529501, "loss": 2.2982, "step": 40576 }, { "epoch": 0.51, "learning_rate": 0.00010905943948240793, "loss": 2.3155, "step": 40584 }, { "epoch": 0.51, "learning_rate": 0.00010903093873385373, "loss": 2.3153, "step": 40592 }, { "epoch": 0.51, "learning_rate": 0.00010900243808249087, "loss": 2.3206, "step": 40600 }, { "epoch": 0.51, "learning_rate": 0.00010897393753117782, "loss": 2.3006, "step": 40608 }, { "epoch": 0.51, "learning_rate": 0.000108945437082773, "loss": 2.2978, "step": 40616 }, { "epoch": 0.51, "learning_rate": 0.0001089169367401349, "loss": 2.3088, "step": 40624 }, { "epoch": 0.51, "learning_rate": 0.0001088884365061219, "loss": 2.3071, "step": 40632 }, { "epoch": 0.51, "learning_rate": 0.00010885993638359242, "loss": 2.3006, "step": 40640 }, { "epoch": 0.51, "learning_rate": 0.00010883143637540482, "loss": 2.2962, "step": 40648 }, { "epoch": 0.51, "learning_rate": 0.0001088029364844176, "loss": 2.283, "step": 40656 }, { "epoch": 0.51, "learning_rate": 0.00010877443671348903, "loss": 2.3001, "step": 40664 }, { "epoch": 0.51, "learning_rate": 0.00010874593706547753, "loss": 2.3058, "step": 40672 }, { "epoch": 0.51, "learning_rate": 0.0001087174375432414, "loss": 2.3164, "step": 40680 }, { "epoch": 0.51, "learning_rate": 0.00010868893814963903, "loss": 2.3095, "step": 40688 }, { "epoch": 0.51, "learning_rate": 0.00010866043888752874, "loss": 2.3285, "step": 40696 }, { "epoch": 0.51, "learning_rate": 0.00010863193975976889, "loss": 2.3068, "step": 40704 }, { "epoch": 0.51, "learning_rate": 0.00010860344076921765, "loss": 2.287, "step": 40712 }, { "epoch": 0.51, "learning_rate": 0.00010857494191873343, "loss": 2.3192, "step": 40720 }, { "epoch": 0.51, "learning_rate": 0.00010854644321117444, "loss": 2.3142, "step": 40728 }, { "epoch": 0.51, "learning_rate": 0.00010851794464939898, "loss": 2.313, "step": 40736 }, { "epoch": 0.51, "learning_rate": 0.00010848944623626526, "loss": 2.3191, "step": 40744 }, { "epoch": 0.51, "learning_rate": 0.00010846094797463156, "loss": 2.3046, "step": 40752 }, { "epoch": 0.51, "learning_rate": 0.00010843244986735601, "loss": 2.2815, "step": 40760 }, { "epoch": 0.51, "learning_rate": 0.00010840395191729686, "loss": 2.3175, "step": 40768 }, { "epoch": 0.51, "learning_rate": 0.00010837545412731231, "loss": 2.286, "step": 40776 }, { "epoch": 0.51, "learning_rate": 0.00010834695650026048, "loss": 2.2999, "step": 40784 }, { "epoch": 0.51, "learning_rate": 0.0001083184590389996, "loss": 2.3086, "step": 40792 }, { "epoch": 0.51, "learning_rate": 0.00010828996174638771, "loss": 2.3154, "step": 40800 }, { "epoch": 0.51, "learning_rate": 0.00010826146462528298, "loss": 2.3211, "step": 40808 }, { "epoch": 0.51, "learning_rate": 0.00010823296767854345, "loss": 2.3023, "step": 40816 }, { "epoch": 0.51, "learning_rate": 0.0001082044709090273, "loss": 2.3119, "step": 40824 }, { "epoch": 0.51, "learning_rate": 0.00010817597431959255, "loss": 2.3004, "step": 40832 }, { "epoch": 0.51, "learning_rate": 0.00010814747791309723, "loss": 2.2792, "step": 40840 }, { "epoch": 0.51, "learning_rate": 0.00010811898169239934, "loss": 2.3028, "step": 40848 }, { "epoch": 0.51, "learning_rate": 0.00010809048566035696, "loss": 2.3169, "step": 40856 }, { "epoch": 0.51, "learning_rate": 0.00010806198981982805, "loss": 2.2997, "step": 40864 }, { "epoch": 0.51, "learning_rate": 0.00010803349417367057, "loss": 2.3118, "step": 40872 }, { "epoch": 0.51, "learning_rate": 0.0001080049987247425, "loss": 2.3168, "step": 40880 }, { "epoch": 0.51, "learning_rate": 0.00010797650347590174, "loss": 2.2823, "step": 40888 }, { "epoch": 0.51, "learning_rate": 0.00010794800843000621, "loss": 2.2986, "step": 40896 }, { "epoch": 0.51, "learning_rate": 0.00010791951358991381, "loss": 2.3033, "step": 40904 }, { "epoch": 0.51, "learning_rate": 0.00010789101895848241, "loss": 2.2938, "step": 40912 }, { "epoch": 0.51, "learning_rate": 0.00010786252453856989, "loss": 2.3143, "step": 40920 }, { "epoch": 0.51, "learning_rate": 0.000107834030333034, "loss": 2.2907, "step": 40928 }, { "epoch": 0.51, "learning_rate": 0.0001078055363447326, "loss": 2.2963, "step": 40936 }, { "epoch": 0.51, "learning_rate": 0.0001077770425765235, "loss": 2.2969, "step": 40944 }, { "epoch": 0.51, "learning_rate": 0.0001077485490312644, "loss": 2.3158, "step": 40952 }, { "epoch": 0.51, "learning_rate": 0.0001077200557118131, "loss": 2.3117, "step": 40960 }, { "epoch": 0.51, "learning_rate": 0.00010769156262102729, "loss": 2.2931, "step": 40968 }, { "epoch": 0.51, "learning_rate": 0.00010766306976176467, "loss": 2.3069, "step": 40976 }, { "epoch": 0.51, "learning_rate": 0.00010763457713688287, "loss": 2.3004, "step": 40984 }, { "epoch": 0.51, "learning_rate": 0.00010760608474923964, "loss": 2.3145, "step": 40992 }, { "epoch": 0.51, "learning_rate": 0.0001075775926016925, "loss": 2.2891, "step": 41000 }, { "epoch": 0.51, "learning_rate": 0.00010754910069709913, "loss": 2.3175, "step": 41008 }, { "epoch": 0.51, "learning_rate": 0.00010752060903831707, "loss": 2.3085, "step": 41016 }, { "epoch": 0.51, "learning_rate": 0.00010749211762820384, "loss": 2.3009, "step": 41024 }, { "epoch": 0.51, "learning_rate": 0.00010746362646961702, "loss": 2.3174, "step": 41032 }, { "epoch": 0.51, "learning_rate": 0.00010743513556541411, "loss": 2.3065, "step": 41040 }, { "epoch": 0.51, "learning_rate": 0.00010740664491845254, "loss": 2.3182, "step": 41048 }, { "epoch": 0.51, "learning_rate": 0.00010737815453158981, "loss": 2.3174, "step": 41056 }, { "epoch": 0.51, "learning_rate": 0.00010734966440768335, "loss": 2.315, "step": 41064 }, { "epoch": 0.51, "learning_rate": 0.00010732117454959048, "loss": 2.2915, "step": 41072 }, { "epoch": 0.51, "learning_rate": 0.00010729268496016864, "loss": 2.3255, "step": 41080 }, { "epoch": 0.51, "learning_rate": 0.00010726419564227516, "loss": 2.2975, "step": 41088 }, { "epoch": 0.51, "learning_rate": 0.00010723570659876738, "loss": 2.3002, "step": 41096 }, { "epoch": 0.51, "learning_rate": 0.00010720721783250254, "loss": 2.2941, "step": 41104 }, { "epoch": 0.51, "learning_rate": 0.00010717872934633792, "loss": 2.3163, "step": 41112 }, { "epoch": 0.51, "learning_rate": 0.00010715024114313078, "loss": 2.3005, "step": 41120 }, { "epoch": 0.51, "learning_rate": 0.00010712175322573827, "loss": 2.3059, "step": 41128 }, { "epoch": 0.51, "learning_rate": 0.00010709326559701765, "loss": 2.3077, "step": 41136 }, { "epoch": 0.51, "learning_rate": 0.000107064778259826, "loss": 2.2911, "step": 41144 }, { "epoch": 0.51, "learning_rate": 0.00010703629121702045, "loss": 2.3138, "step": 41152 }, { "epoch": 0.51, "learning_rate": 0.0001070078044714581, "loss": 2.3275, "step": 41160 }, { "epoch": 0.51, "learning_rate": 0.00010697931802599603, "loss": 2.309, "step": 41168 }, { "epoch": 0.51, "learning_rate": 0.00010695083188349122, "loss": 2.2899, "step": 41176 }, { "epoch": 0.51, "learning_rate": 0.00010692234604680072, "loss": 2.2874, "step": 41184 }, { "epoch": 0.51, "learning_rate": 0.00010689386051878146, "loss": 2.2992, "step": 41192 }, { "epoch": 0.52, "learning_rate": 0.00010686537530229037, "loss": 2.3091, "step": 41200 }, { "epoch": 0.52, "learning_rate": 0.00010683689040018439, "loss": 2.3312, "step": 41208 }, { "epoch": 0.52, "learning_rate": 0.00010680840581532036, "loss": 2.3282, "step": 41216 }, { "epoch": 0.52, "learning_rate": 0.00010677992155055516, "loss": 2.3134, "step": 41224 }, { "epoch": 0.52, "learning_rate": 0.00010675143760874562, "loss": 2.3041, "step": 41232 }, { "epoch": 0.52, "learning_rate": 0.00010672295399274843, "loss": 2.3146, "step": 41240 }, { "epoch": 0.52, "learning_rate": 0.0001066944707054204, "loss": 2.3119, "step": 41248 }, { "epoch": 0.52, "learning_rate": 0.00010666598774961822, "loss": 2.2882, "step": 41256 }, { "epoch": 0.52, "learning_rate": 0.00010663750512819859, "loss": 2.284, "step": 41264 }, { "epoch": 0.52, "learning_rate": 0.00010660902284401816, "loss": 2.3088, "step": 41272 }, { "epoch": 0.52, "learning_rate": 0.00010658054089993349, "loss": 2.2812, "step": 41280 }, { "epoch": 0.52, "learning_rate": 0.00010655205929880121, "loss": 2.3095, "step": 41288 }, { "epoch": 0.52, "learning_rate": 0.00010652357804347784, "loss": 2.3062, "step": 41296 }, { "epoch": 0.52, "learning_rate": 0.00010649509713681988, "loss": 2.3074, "step": 41304 }, { "epoch": 0.52, "learning_rate": 0.00010646661658168384, "loss": 2.3275, "step": 41312 }, { "epoch": 0.52, "learning_rate": 0.00010643813638092612, "loss": 2.3013, "step": 41320 }, { "epoch": 0.52, "learning_rate": 0.00010640965653740316, "loss": 2.2992, "step": 41328 }, { "epoch": 0.52, "learning_rate": 0.00010638117705397128, "loss": 2.3256, "step": 41336 }, { "epoch": 0.52, "learning_rate": 0.00010635269793348686, "loss": 2.3019, "step": 41344 }, { "epoch": 0.52, "learning_rate": 0.00010632421917880613, "loss": 2.313, "step": 41352 }, { "epoch": 0.52, "learning_rate": 0.00010629574079278544, "loss": 2.2922, "step": 41360 }, { "epoch": 0.52, "learning_rate": 0.00010626726277828094, "loss": 2.312, "step": 41368 }, { "epoch": 0.52, "learning_rate": 0.00010623878513814883, "loss": 2.3184, "step": 41376 }, { "epoch": 0.52, "learning_rate": 0.00010621030787524522, "loss": 2.297, "step": 41384 }, { "epoch": 0.52, "learning_rate": 0.00010618183099242628, "loss": 2.2943, "step": 41392 }, { "epoch": 0.52, "learning_rate": 0.00010615335449254808, "loss": 2.3047, "step": 41400 }, { "epoch": 0.52, "learning_rate": 0.00010612487837846666, "loss": 2.3133, "step": 41408 }, { "epoch": 0.52, "learning_rate": 0.0001060964026530379, "loss": 2.3041, "step": 41416 }, { "epoch": 0.52, "learning_rate": 0.00010606792731911788, "loss": 2.3138, "step": 41424 }, { "epoch": 0.52, "learning_rate": 0.00010603945237956247, "loss": 2.2992, "step": 41432 }, { "epoch": 0.52, "learning_rate": 0.00010601097783722753, "loss": 2.2993, "step": 41440 }, { "epoch": 0.52, "learning_rate": 0.00010598250369496892, "loss": 2.2912, "step": 41448 }, { "epoch": 0.52, "learning_rate": 0.00010595402995564243, "loss": 2.3078, "step": 41456 }, { "epoch": 0.52, "learning_rate": 0.0001059255566221038, "loss": 2.2973, "step": 41464 }, { "epoch": 0.52, "learning_rate": 0.00010589708369720874, "loss": 2.2894, "step": 41472 }, { "epoch": 0.52, "learning_rate": 0.00010586861118381297, "loss": 2.2959, "step": 41480 }, { "epoch": 0.52, "learning_rate": 0.00010584013908477206, "loss": 2.2747, "step": 41488 }, { "epoch": 0.52, "learning_rate": 0.00010581166740294164, "loss": 2.297, "step": 41496 }, { "epoch": 0.52, "learning_rate": 0.00010578319614117726, "loss": 2.2968, "step": 41504 }, { "epoch": 0.52, "learning_rate": 0.00010575472530233439, "loss": 2.295, "step": 41512 }, { "epoch": 0.52, "learning_rate": 0.00010572625488926853, "loss": 2.3006, "step": 41520 }, { "epoch": 0.52, "learning_rate": 0.00010569778490483506, "loss": 2.3169, "step": 41528 }, { "epoch": 0.52, "learning_rate": 0.00010566931535188944, "loss": 2.3021, "step": 41536 }, { "epoch": 0.52, "learning_rate": 0.00010564084623328692, "loss": 2.304, "step": 41544 }, { "epoch": 0.52, "learning_rate": 0.00010561237755188283, "loss": 2.2904, "step": 41552 }, { "epoch": 0.52, "learning_rate": 0.0001055839093105324, "loss": 2.2943, "step": 41560 }, { "epoch": 0.52, "learning_rate": 0.00010555544151209082, "loss": 2.289, "step": 41568 }, { "epoch": 0.52, "learning_rate": 0.00010552697415941333, "loss": 2.3049, "step": 41576 }, { "epoch": 0.52, "learning_rate": 0.00010549850725535495, "loss": 2.3005, "step": 41584 }, { "epoch": 0.52, "learning_rate": 0.00010547004080277078, "loss": 2.3021, "step": 41592 }, { "epoch": 0.52, "learning_rate": 0.00010544157480451587, "loss": 2.3002, "step": 41600 }, { "epoch": 0.52, "learning_rate": 0.00010541310926344516, "loss": 2.297, "step": 41608 }, { "epoch": 0.52, "learning_rate": 0.00010538464418241361, "loss": 2.2845, "step": 41616 }, { "epoch": 0.52, "learning_rate": 0.0001053561795642761, "loss": 2.2973, "step": 41624 }, { "epoch": 0.52, "learning_rate": 0.00010532771541188746, "loss": 2.2888, "step": 41632 }, { "epoch": 0.52, "learning_rate": 0.00010529925172810248, "loss": 2.2998, "step": 41640 }, { "epoch": 0.52, "learning_rate": 0.00010527078851577595, "loss": 2.2833, "step": 41648 }, { "epoch": 0.52, "learning_rate": 0.0001052423257777625, "loss": 2.2866, "step": 41656 }, { "epoch": 0.52, "learning_rate": 0.00010521386351691682, "loss": 2.3078, "step": 41664 }, { "epoch": 0.52, "learning_rate": 0.00010518540173609355, "loss": 2.3371, "step": 41672 }, { "epoch": 0.52, "learning_rate": 0.00010515694043814716, "loss": 2.2941, "step": 41680 }, { "epoch": 0.52, "learning_rate": 0.00010512847962593219, "loss": 2.3026, "step": 41688 }, { "epoch": 0.52, "learning_rate": 0.00010510001930230313, "loss": 2.3105, "step": 41696 }, { "epoch": 0.52, "learning_rate": 0.00010507155947011437, "loss": 2.3073, "step": 41704 }, { "epoch": 0.52, "learning_rate": 0.00010504310013222032, "loss": 2.3004, "step": 41712 }, { "epoch": 0.52, "learning_rate": 0.00010501464129147516, "loss": 2.3072, "step": 41720 }, { "epoch": 0.52, "learning_rate": 0.00010498618295073326, "loss": 2.3063, "step": 41728 }, { "epoch": 0.52, "learning_rate": 0.0001049577251128488, "loss": 2.2903, "step": 41736 }, { "epoch": 0.52, "learning_rate": 0.00010492926778067595, "loss": 2.3036, "step": 41744 }, { "epoch": 0.52, "learning_rate": 0.0001049008109570688, "loss": 2.2932, "step": 41752 }, { "epoch": 0.52, "learning_rate": 0.00010487235464488141, "loss": 2.2999, "step": 41760 }, { "epoch": 0.52, "learning_rate": 0.00010484389884696782, "loss": 2.2961, "step": 41768 }, { "epoch": 0.52, "learning_rate": 0.00010481544356618193, "loss": 2.2944, "step": 41776 }, { "epoch": 0.52, "learning_rate": 0.00010478698880537769, "loss": 2.3114, "step": 41784 }, { "epoch": 0.52, "learning_rate": 0.00010475853456740892, "loss": 2.3058, "step": 41792 }, { "epoch": 0.52, "learning_rate": 0.00010473008085512946, "loss": 2.3159, "step": 41800 }, { "epoch": 0.52, "learning_rate": 0.000104701627671393, "loss": 2.3001, "step": 41808 }, { "epoch": 0.52, "learning_rate": 0.00010467317501905327, "loss": 2.2894, "step": 41816 }, { "epoch": 0.52, "learning_rate": 0.0001046447229009639, "loss": 2.2993, "step": 41824 }, { "epoch": 0.52, "learning_rate": 0.00010461627131997849, "loss": 2.305, "step": 41832 }, { "epoch": 0.52, "learning_rate": 0.00010458782027895055, "loss": 2.279, "step": 41840 }, { "epoch": 0.52, "learning_rate": 0.0001045593697807336, "loss": 2.2947, "step": 41848 }, { "epoch": 0.52, "learning_rate": 0.000104530919828181, "loss": 2.2992, "step": 41856 }, { "epoch": 0.52, "learning_rate": 0.00010450247042414614, "loss": 2.3024, "step": 41864 }, { "epoch": 0.52, "learning_rate": 0.00010447402157148238, "loss": 2.2991, "step": 41872 }, { "epoch": 0.52, "learning_rate": 0.00010444557327304292, "loss": 2.3166, "step": 41880 }, { "epoch": 0.52, "learning_rate": 0.000104417125531681, "loss": 2.3056, "step": 41888 }, { "epoch": 0.52, "learning_rate": 0.00010438867835024974, "loss": 2.2767, "step": 41896 }, { "epoch": 0.52, "learning_rate": 0.00010436023173160227, "loss": 2.29, "step": 41904 }, { "epoch": 0.52, "learning_rate": 0.00010433178567859159, "loss": 2.3076, "step": 41912 }, { "epoch": 0.52, "learning_rate": 0.00010430334019407066, "loss": 2.3071, "step": 41920 }, { "epoch": 0.52, "learning_rate": 0.00010427489528089247, "loss": 2.2919, "step": 41928 }, { "epoch": 0.52, "learning_rate": 0.00010424645094190983, "loss": 2.2968, "step": 41936 }, { "epoch": 0.52, "learning_rate": 0.00010421800717997556, "loss": 2.2938, "step": 41944 }, { "epoch": 0.52, "learning_rate": 0.0001041895639979424, "loss": 2.2932, "step": 41952 }, { "epoch": 0.52, "learning_rate": 0.00010416112139866305, "loss": 2.3062, "step": 41960 }, { "epoch": 0.52, "learning_rate": 0.00010413267938499014, "loss": 2.3143, "step": 41968 }, { "epoch": 0.52, "learning_rate": 0.00010410423795977629, "loss": 2.3132, "step": 41976 }, { "epoch": 0.52, "learning_rate": 0.00010407579712587388, "loss": 2.2922, "step": 41984 }, { "epoch": 0.52, "learning_rate": 0.0001040473568861355, "loss": 2.2885, "step": 41992 }, { "epoch": 0.53, "learning_rate": 0.00010401891724341346, "loss": 2.2924, "step": 42000 }, { "epoch": 0.53, "learning_rate": 0.00010399047820056016, "loss": 2.303, "step": 42008 }, { "epoch": 0.53, "learning_rate": 0.00010396203976042784, "loss": 2.2758, "step": 42016 }, { "epoch": 0.53, "learning_rate": 0.00010393360192586872, "loss": 2.3252, "step": 42024 }, { "epoch": 0.53, "learning_rate": 0.00010390516469973495, "loss": 2.2892, "step": 42032 }, { "epoch": 0.53, "learning_rate": 0.00010387672808487862, "loss": 2.3077, "step": 42040 }, { "epoch": 0.53, "learning_rate": 0.00010384829208415179, "loss": 2.3002, "step": 42048 }, { "epoch": 0.53, "learning_rate": 0.00010381985670040635, "loss": 2.3017, "step": 42056 }, { "epoch": 0.53, "learning_rate": 0.00010379142193649434, "loss": 2.3172, "step": 42064 }, { "epoch": 0.53, "learning_rate": 0.0001037629877952675, "loss": 2.2812, "step": 42072 }, { "epoch": 0.53, "learning_rate": 0.0001037345542795776, "loss": 2.2807, "step": 42080 }, { "epoch": 0.53, "learning_rate": 0.00010370612139227644, "loss": 2.3093, "step": 42088 }, { "epoch": 0.53, "learning_rate": 0.00010367768913621565, "loss": 2.2823, "step": 42096 }, { "epoch": 0.53, "learning_rate": 0.00010364925751424681, "loss": 2.3032, "step": 42104 }, { "epoch": 0.53, "learning_rate": 0.00010362082652922148, "loss": 2.3072, "step": 42112 }, { "epoch": 0.53, "learning_rate": 0.00010359239618399103, "loss": 2.317, "step": 42120 }, { "epoch": 0.53, "learning_rate": 0.00010356396648140699, "loss": 2.3177, "step": 42128 }, { "epoch": 0.53, "learning_rate": 0.00010353553742432063, "loss": 2.2968, "step": 42136 }, { "epoch": 0.53, "learning_rate": 0.00010350710901558325, "loss": 2.3242, "step": 42144 }, { "epoch": 0.53, "learning_rate": 0.00010347868125804603, "loss": 2.2912, "step": 42152 }, { "epoch": 0.53, "learning_rate": 0.00010345025415456013, "loss": 2.3084, "step": 42160 }, { "epoch": 0.53, "learning_rate": 0.00010342182770797663, "loss": 2.3047, "step": 42168 }, { "epoch": 0.53, "learning_rate": 0.00010339340192114654, "loss": 2.2915, "step": 42176 }, { "epoch": 0.53, "learning_rate": 0.00010336497679692081, "loss": 2.3056, "step": 42184 }, { "epoch": 0.53, "learning_rate": 0.00010333655233815028, "loss": 2.3089, "step": 42192 }, { "epoch": 0.53, "learning_rate": 0.00010330812854768584, "loss": 2.3013, "step": 42200 }, { "epoch": 0.53, "learning_rate": 0.00010327970542837814, "loss": 2.2917, "step": 42208 }, { "epoch": 0.53, "learning_rate": 0.00010325128298307793, "loss": 2.3007, "step": 42216 }, { "epoch": 0.53, "learning_rate": 0.00010322286121463577, "loss": 2.312, "step": 42224 }, { "epoch": 0.53, "learning_rate": 0.00010319444012590225, "loss": 2.2998, "step": 42232 }, { "epoch": 0.53, "learning_rate": 0.00010316601971972785, "loss": 2.2962, "step": 42240 }, { "epoch": 0.53, "learning_rate": 0.00010313759999896293, "loss": 2.309, "step": 42248 }, { "epoch": 0.53, "learning_rate": 0.00010310918096645783, "loss": 2.2772, "step": 42256 }, { "epoch": 0.53, "learning_rate": 0.00010308076262506283, "loss": 2.3025, "step": 42264 }, { "epoch": 0.53, "learning_rate": 0.00010305234497762817, "loss": 2.3131, "step": 42272 }, { "epoch": 0.53, "learning_rate": 0.0001030239280270039, "loss": 2.3079, "step": 42280 }, { "epoch": 0.53, "learning_rate": 0.00010299551177604014, "loss": 2.2963, "step": 42288 }, { "epoch": 0.53, "learning_rate": 0.00010296709622758684, "loss": 2.3078, "step": 42296 }, { "epoch": 0.53, "learning_rate": 0.00010293868138449399, "loss": 2.283, "step": 42304 }, { "epoch": 0.53, "learning_rate": 0.00010291026724961132, "loss": 2.304, "step": 42312 }, { "epoch": 0.53, "learning_rate": 0.00010288185382578872, "loss": 2.3008, "step": 42320 }, { "epoch": 0.53, "learning_rate": 0.00010285344111587583, "loss": 2.2938, "step": 42328 }, { "epoch": 0.53, "learning_rate": 0.00010282502912272229, "loss": 2.2929, "step": 42336 }, { "epoch": 0.53, "learning_rate": 0.00010279661784917769, "loss": 2.3177, "step": 42344 }, { "epoch": 0.53, "learning_rate": 0.0001027682072980915, "loss": 2.3039, "step": 42352 }, { "epoch": 0.53, "learning_rate": 0.0001027397974723131, "loss": 2.301, "step": 42360 }, { "epoch": 0.53, "learning_rate": 0.00010271138837469194, "loss": 2.3047, "step": 42368 }, { "epoch": 0.53, "learning_rate": 0.00010268298000807719, "loss": 2.2946, "step": 42376 }, { "epoch": 0.53, "learning_rate": 0.0001026545723753181, "loss": 2.2901, "step": 42384 }, { "epoch": 0.53, "learning_rate": 0.00010262616547926376, "loss": 2.3042, "step": 42392 }, { "epoch": 0.53, "learning_rate": 0.00010259775932276326, "loss": 2.3173, "step": 42400 }, { "epoch": 0.53, "learning_rate": 0.00010256935390866556, "loss": 2.3031, "step": 42408 }, { "epoch": 0.53, "learning_rate": 0.00010254094923981954, "loss": 2.2917, "step": 42416 }, { "epoch": 0.53, "learning_rate": 0.00010251254531907406, "loss": 2.294, "step": 42424 }, { "epoch": 0.53, "learning_rate": 0.00010248414214927781, "loss": 2.3146, "step": 42432 }, { "epoch": 0.53, "learning_rate": 0.0001024557397332796, "loss": 2.289, "step": 42440 }, { "epoch": 0.53, "learning_rate": 0.0001024273380739279, "loss": 2.3096, "step": 42448 }, { "epoch": 0.53, "learning_rate": 0.00010239893717407128, "loss": 2.3096, "step": 42456 }, { "epoch": 0.53, "learning_rate": 0.00010237053703655819, "loss": 2.2851, "step": 42464 }, { "epoch": 0.53, "learning_rate": 0.00010234213766423699, "loss": 2.2732, "step": 42472 }, { "epoch": 0.53, "learning_rate": 0.00010231373905995605, "loss": 2.3076, "step": 42480 }, { "epoch": 0.53, "learning_rate": 0.00010228534122656349, "loss": 2.3163, "step": 42488 }, { "epoch": 0.53, "learning_rate": 0.00010225694416690748, "loss": 2.2813, "step": 42496 }, { "epoch": 0.53, "learning_rate": 0.00010222854788383612, "loss": 2.3012, "step": 42504 }, { "epoch": 0.53, "learning_rate": 0.00010220015238019733, "loss": 2.3096, "step": 42512 }, { "epoch": 0.53, "learning_rate": 0.00010217175765883913, "loss": 2.3145, "step": 42520 }, { "epoch": 0.53, "learning_rate": 0.00010214336372260922, "loss": 2.297, "step": 42528 }, { "epoch": 0.53, "learning_rate": 0.00010211497057435542, "loss": 2.2937, "step": 42536 }, { "epoch": 0.53, "learning_rate": 0.00010208657821692541, "loss": 2.2999, "step": 42544 }, { "epoch": 0.53, "learning_rate": 0.00010205818665316675, "loss": 2.2955, "step": 42552 }, { "epoch": 0.53, "learning_rate": 0.00010202979588592698, "loss": 2.2889, "step": 42560 }, { "epoch": 0.53, "learning_rate": 0.0001020014059180535, "loss": 2.3177, "step": 42568 }, { "epoch": 0.53, "learning_rate": 0.0001019730167523937, "loss": 2.2985, "step": 42576 }, { "epoch": 0.53, "learning_rate": 0.00010194462839179486, "loss": 2.3037, "step": 42584 }, { "epoch": 0.53, "learning_rate": 0.00010191624083910412, "loss": 2.3042, "step": 42592 }, { "epoch": 0.53, "learning_rate": 0.00010188785409716864, "loss": 2.3035, "step": 42600 }, { "epoch": 0.53, "learning_rate": 0.00010185946816883538, "loss": 2.2998, "step": 42608 }, { "epoch": 0.53, "learning_rate": 0.0001018310830569514, "loss": 2.3073, "step": 42616 }, { "epoch": 0.53, "learning_rate": 0.00010180269876436345, "loss": 2.3003, "step": 42624 }, { "epoch": 0.53, "learning_rate": 0.00010177431529391837, "loss": 2.2804, "step": 42632 }, { "epoch": 0.53, "learning_rate": 0.00010174593264846288, "loss": 2.2982, "step": 42640 }, { "epoch": 0.53, "learning_rate": 0.00010171755083084356, "loss": 2.3084, "step": 42648 }, { "epoch": 0.53, "learning_rate": 0.000101689169843907, "loss": 2.3019, "step": 42656 }, { "epoch": 0.53, "learning_rate": 0.00010166078969049957, "loss": 2.2963, "step": 42664 }, { "epoch": 0.53, "learning_rate": 0.00010163241037346766, "loss": 2.3163, "step": 42672 }, { "epoch": 0.53, "learning_rate": 0.00010160403189565764, "loss": 2.3219, "step": 42680 }, { "epoch": 0.53, "learning_rate": 0.0001015756542599156, "loss": 2.2902, "step": 42688 }, { "epoch": 0.53, "learning_rate": 0.00010154727746908773, "loss": 2.3088, "step": 42696 }, { "epoch": 0.53, "learning_rate": 0.00010151890152602001, "loss": 2.315, "step": 42704 }, { "epoch": 0.53, "learning_rate": 0.00010149052643355841, "loss": 2.2957, "step": 42712 }, { "epoch": 0.53, "learning_rate": 0.00010146215219454885, "loss": 2.3088, "step": 42720 }, { "epoch": 0.53, "learning_rate": 0.00010143377881183695, "loss": 2.2971, "step": 42728 }, { "epoch": 0.53, "learning_rate": 0.00010140540628826855, "loss": 2.2777, "step": 42736 }, { "epoch": 0.53, "learning_rate": 0.00010137703462668917, "loss": 2.2804, "step": 42744 }, { "epoch": 0.53, "learning_rate": 0.00010134866382994442, "loss": 2.2992, "step": 42752 }, { "epoch": 0.53, "learning_rate": 0.00010132029390087962, "loss": 2.2948, "step": 42760 }, { "epoch": 0.53, "learning_rate": 0.00010129192484234015, "loss": 2.311, "step": 42768 }, { "epoch": 0.53, "learning_rate": 0.00010126355665717134, "loss": 2.3109, "step": 42776 }, { "epoch": 0.53, "learning_rate": 0.0001012351893482182, "loss": 2.2969, "step": 42784 }, { "epoch": 0.53, "learning_rate": 0.00010120682291832598, "loss": 2.2997, "step": 42792 }, { "epoch": 0.54, "learning_rate": 0.00010117845737033957, "loss": 2.3081, "step": 42800 }, { "epoch": 0.54, "learning_rate": 0.00010115009270710387, "loss": 2.2822, "step": 42808 }, { "epoch": 0.54, "learning_rate": 0.00010112172893146378, "loss": 2.3076, "step": 42816 }, { "epoch": 0.54, "learning_rate": 0.00010109336604626394, "loss": 2.3113, "step": 42824 }, { "epoch": 0.54, "learning_rate": 0.00010106500405434902, "loss": 2.2999, "step": 42832 }, { "epoch": 0.54, "learning_rate": 0.00010103664295856359, "loss": 2.2949, "step": 42840 }, { "epoch": 0.54, "learning_rate": 0.00010100828276175202, "loss": 2.3018, "step": 42848 }, { "epoch": 0.54, "learning_rate": 0.00010097992346675881, "loss": 2.2996, "step": 42856 }, { "epoch": 0.54, "learning_rate": 0.00010095156507642809, "loss": 2.2856, "step": 42864 }, { "epoch": 0.54, "learning_rate": 0.00010092320759360418, "loss": 2.3038, "step": 42872 }, { "epoch": 0.54, "learning_rate": 0.00010089485102113114, "loss": 2.2979, "step": 42880 }, { "epoch": 0.54, "learning_rate": 0.00010086649536185289, "loss": 2.2989, "step": 42888 }, { "epoch": 0.54, "learning_rate": 0.00010083814061861343, "loss": 2.2923, "step": 42896 }, { "epoch": 0.54, "learning_rate": 0.00010080978679425653, "loss": 2.3045, "step": 42904 }, { "epoch": 0.54, "learning_rate": 0.00010078143389162598, "loss": 2.2918, "step": 42912 }, { "epoch": 0.54, "learning_rate": 0.00010075308191356532, "loss": 2.3095, "step": 42920 }, { "epoch": 0.54, "learning_rate": 0.00010072473086291818, "loss": 2.3025, "step": 42928 }, { "epoch": 0.54, "learning_rate": 0.00010069638074252801, "loss": 2.3297, "step": 42936 }, { "epoch": 0.54, "learning_rate": 0.00010066803155523807, "loss": 2.3128, "step": 42944 }, { "epoch": 0.54, "learning_rate": 0.00010063968330389175, "loss": 2.3206, "step": 42952 }, { "epoch": 0.54, "learning_rate": 0.0001006113359913321, "loss": 2.3323, "step": 42960 }, { "epoch": 0.54, "learning_rate": 0.00010058298962040229, "loss": 2.2972, "step": 42968 }, { "epoch": 0.54, "learning_rate": 0.00010055464419394527, "loss": 2.3056, "step": 42976 }, { "epoch": 0.54, "learning_rate": 0.00010052629971480387, "loss": 2.3087, "step": 42984 }, { "epoch": 0.54, "learning_rate": 0.00010049795618582096, "loss": 2.3108, "step": 42992 }, { "epoch": 0.54, "learning_rate": 0.00010046961360983917, "loss": 2.3072, "step": 43000 }, { "epoch": 0.54, "learning_rate": 0.00010044127198970117, "loss": 2.2862, "step": 43008 }, { "epoch": 0.54, "learning_rate": 0.00010041293132824945, "loss": 2.3101, "step": 43016 }, { "epoch": 0.54, "learning_rate": 0.00010038459162832635, "loss": 2.3118, "step": 43024 }, { "epoch": 0.54, "learning_rate": 0.00010035625289277421, "loss": 2.3137, "step": 43032 }, { "epoch": 0.54, "learning_rate": 0.00010032791512443527, "loss": 2.3008, "step": 43040 }, { "epoch": 0.54, "learning_rate": 0.0001002995783261517, "loss": 2.2978, "step": 43048 }, { "epoch": 0.54, "learning_rate": 0.00010027124250076539, "loss": 2.28, "step": 43056 }, { "epoch": 0.54, "learning_rate": 0.00010024290765111835, "loss": 2.2969, "step": 43064 }, { "epoch": 0.54, "learning_rate": 0.00010021457378005239, "loss": 2.294, "step": 43072 }, { "epoch": 0.54, "learning_rate": 0.00010018624089040922, "loss": 2.3237, "step": 43080 }, { "epoch": 0.54, "learning_rate": 0.0001001579089850305, "loss": 2.3093, "step": 43088 }, { "epoch": 0.54, "learning_rate": 0.00010012957806675771, "loss": 2.3071, "step": 43096 }, { "epoch": 0.54, "learning_rate": 0.00010010124813843236, "loss": 2.2992, "step": 43104 }, { "epoch": 0.54, "learning_rate": 0.00010007291920289572, "loss": 2.2821, "step": 43112 }, { "epoch": 0.54, "learning_rate": 0.000100044591262989, "loss": 2.304, "step": 43120 }, { "epoch": 0.54, "learning_rate": 0.00010001626432155337, "loss": 2.2977, "step": 43128 }, { "epoch": 0.54, "learning_rate": 9.998793838142986e-05, "loss": 2.2894, "step": 43136 }, { "epoch": 0.54, "learning_rate": 9.995961344545944e-05, "loss": 2.3071, "step": 43144 }, { "epoch": 0.54, "learning_rate": 9.993128951648289e-05, "loss": 2.3119, "step": 43152 }, { "epoch": 0.54, "learning_rate": 9.990296659734091e-05, "loss": 2.2908, "step": 43160 }, { "epoch": 0.54, "learning_rate": 9.98746446908742e-05, "loss": 2.2991, "step": 43168 }, { "epoch": 0.54, "learning_rate": 9.984632379992323e-05, "loss": 2.2774, "step": 43176 }, { "epoch": 0.54, "learning_rate": 9.981800392732845e-05, "loss": 2.3025, "step": 43184 }, { "epoch": 0.54, "learning_rate": 9.97896850759302e-05, "loss": 2.2995, "step": 43192 }, { "epoch": 0.54, "learning_rate": 9.976136724856866e-05, "loss": 2.3057, "step": 43200 }, { "epoch": 0.54, "learning_rate": 9.973305044808401e-05, "loss": 2.3014, "step": 43208 }, { "epoch": 0.54, "learning_rate": 9.970473467731618e-05, "loss": 2.3051, "step": 43216 }, { "epoch": 0.54, "learning_rate": 9.967641993910518e-05, "loss": 2.3001, "step": 43224 }, { "epoch": 0.54, "learning_rate": 9.964810623629071e-05, "loss": 2.2885, "step": 43232 }, { "epoch": 0.54, "learning_rate": 9.961979357171254e-05, "loss": 2.2805, "step": 43240 }, { "epoch": 0.54, "learning_rate": 9.959148194821027e-05, "loss": 2.3048, "step": 43248 }, { "epoch": 0.54, "learning_rate": 9.956317136862336e-05, "loss": 2.2945, "step": 43256 }, { "epoch": 0.54, "learning_rate": 9.953486183579124e-05, "loss": 2.3017, "step": 43264 }, { "epoch": 0.54, "learning_rate": 9.950655335255317e-05, "loss": 2.2784, "step": 43272 }, { "epoch": 0.54, "learning_rate": 9.947824592174835e-05, "loss": 2.3053, "step": 43280 }, { "epoch": 0.54, "learning_rate": 9.944993954621587e-05, "loss": 2.2954, "step": 43288 }, { "epoch": 0.54, "learning_rate": 9.942163422879463e-05, "loss": 2.2982, "step": 43296 }, { "epoch": 0.54, "learning_rate": 9.939332997232356e-05, "loss": 2.3051, "step": 43304 }, { "epoch": 0.54, "learning_rate": 9.936502677964135e-05, "loss": 2.3075, "step": 43312 }, { "epoch": 0.54, "learning_rate": 9.933672465358677e-05, "loss": 2.3024, "step": 43320 }, { "epoch": 0.54, "learning_rate": 9.930842359699824e-05, "loss": 2.3206, "step": 43328 }, { "epoch": 0.54, "learning_rate": 9.928012361271422e-05, "loss": 2.2904, "step": 43336 }, { "epoch": 0.54, "learning_rate": 9.925182470357311e-05, "loss": 2.2906, "step": 43344 }, { "epoch": 0.54, "learning_rate": 9.922352687241303e-05, "loss": 2.2915, "step": 43352 }, { "epoch": 0.54, "learning_rate": 9.91952301220722e-05, "loss": 2.2974, "step": 43360 }, { "epoch": 0.54, "learning_rate": 9.916693445538852e-05, "loss": 2.3028, "step": 43368 }, { "epoch": 0.54, "learning_rate": 9.913863987519992e-05, "loss": 2.3058, "step": 43376 }, { "epoch": 0.54, "learning_rate": 9.911034638434424e-05, "loss": 2.2847, "step": 43384 }, { "epoch": 0.54, "learning_rate": 9.908205398565907e-05, "loss": 2.302, "step": 43392 }, { "epoch": 0.54, "learning_rate": 9.905376268198205e-05, "loss": 2.2857, "step": 43400 }, { "epoch": 0.54, "learning_rate": 9.902547247615062e-05, "loss": 2.3047, "step": 43408 }, { "epoch": 0.54, "learning_rate": 9.899718337100207e-05, "loss": 2.3228, "step": 43416 }, { "epoch": 0.54, "learning_rate": 9.896889536937375e-05, "loss": 2.296, "step": 43424 }, { "epoch": 0.54, "learning_rate": 9.894060847410264e-05, "loss": 2.3182, "step": 43432 }, { "epoch": 0.54, "learning_rate": 9.891232268802588e-05, "loss": 2.2831, "step": 43440 }, { "epoch": 0.54, "learning_rate": 9.88840380139803e-05, "loss": 2.3262, "step": 43448 }, { "epoch": 0.54, "learning_rate": 9.885575445480278e-05, "loss": 2.3164, "step": 43456 }, { "epoch": 0.54, "learning_rate": 9.882747201332989e-05, "loss": 2.3014, "step": 43464 }, { "epoch": 0.54, "learning_rate": 9.879919069239825e-05, "loss": 2.3126, "step": 43472 }, { "epoch": 0.54, "learning_rate": 9.877091049484435e-05, "loss": 2.2903, "step": 43480 }, { "epoch": 0.54, "learning_rate": 9.874263142350444e-05, "loss": 2.2932, "step": 43488 }, { "epoch": 0.54, "learning_rate": 9.871435348121487e-05, "loss": 2.3037, "step": 43496 }, { "epoch": 0.54, "learning_rate": 9.868607667081169e-05, "loss": 2.3064, "step": 43504 }, { "epoch": 0.54, "learning_rate": 9.865780099513089e-05, "loss": 2.3046, "step": 43512 }, { "epoch": 0.54, "learning_rate": 9.86295264570084e-05, "loss": 2.2858, "step": 43520 }, { "epoch": 0.54, "learning_rate": 9.860125305927994e-05, "loss": 2.2735, "step": 43528 }, { "epoch": 0.54, "learning_rate": 9.857298080478123e-05, "loss": 2.2981, "step": 43536 }, { "epoch": 0.54, "learning_rate": 9.854470969634784e-05, "loss": 2.3059, "step": 43544 }, { "epoch": 0.54, "learning_rate": 9.851643973681511e-05, "loss": 2.3115, "step": 43552 }, { "epoch": 0.54, "learning_rate": 9.848817092901843e-05, "loss": 2.2911, "step": 43560 }, { "epoch": 0.54, "learning_rate": 9.845990327579295e-05, "loss": 2.2974, "step": 43568 }, { "epoch": 0.54, "learning_rate": 9.843163677997378e-05, "loss": 2.3143, "step": 43576 }, { "epoch": 0.54, "learning_rate": 9.840337144439593e-05, "loss": 2.2975, "step": 43584 }, { "epoch": 0.54, "learning_rate": 9.837510727189419e-05, "loss": 2.3232, "step": 43592 }, { "epoch": 0.55, "learning_rate": 9.834684426530332e-05, "loss": 2.2983, "step": 43600 }, { "epoch": 0.55, "learning_rate": 9.831858242745791e-05, "loss": 2.2911, "step": 43608 }, { "epoch": 0.55, "learning_rate": 9.829032176119256e-05, "loss": 2.3037, "step": 43616 }, { "epoch": 0.55, "learning_rate": 9.826206226934151e-05, "loss": 2.2845, "step": 43624 }, { "epoch": 0.55, "learning_rate": 9.823380395473916e-05, "loss": 2.3093, "step": 43632 }, { "epoch": 0.55, "learning_rate": 9.820554682021958e-05, "loss": 2.3247, "step": 43640 }, { "epoch": 0.55, "learning_rate": 9.817729086861682e-05, "loss": 2.2972, "step": 43648 }, { "epoch": 0.55, "learning_rate": 9.814903610276482e-05, "loss": 2.2789, "step": 43656 }, { "epoch": 0.55, "learning_rate": 9.812078252549732e-05, "loss": 2.3011, "step": 43664 }, { "epoch": 0.55, "learning_rate": 9.809253013964804e-05, "loss": 2.2929, "step": 43672 }, { "epoch": 0.55, "learning_rate": 9.80642789480505e-05, "loss": 2.2947, "step": 43680 }, { "epoch": 0.55, "learning_rate": 9.803602895353816e-05, "loss": 2.294, "step": 43688 }, { "epoch": 0.55, "learning_rate": 9.800778015894434e-05, "loss": 2.2883, "step": 43696 }, { "epoch": 0.55, "learning_rate": 9.797953256710214e-05, "loss": 2.2903, "step": 43704 }, { "epoch": 0.55, "learning_rate": 9.79512861808448e-05, "loss": 2.3099, "step": 43712 }, { "epoch": 0.55, "learning_rate": 9.792304100300518e-05, "loss": 2.3017, "step": 43720 }, { "epoch": 0.55, "learning_rate": 9.789479703641607e-05, "loss": 2.2888, "step": 43728 }, { "epoch": 0.55, "learning_rate": 9.786655428391025e-05, "loss": 2.3041, "step": 43736 }, { "epoch": 0.55, "learning_rate": 9.783831274832025e-05, "loss": 2.2966, "step": 43744 }, { "epoch": 0.55, "learning_rate": 9.781007243247864e-05, "loss": 2.3075, "step": 43752 }, { "epoch": 0.55, "learning_rate": 9.778183333921766e-05, "loss": 2.3012, "step": 43760 }, { "epoch": 0.55, "learning_rate": 9.775359547136953e-05, "loss": 2.3098, "step": 43768 }, { "epoch": 0.55, "learning_rate": 9.772535883176641e-05, "loss": 2.295, "step": 43776 }, { "epoch": 0.55, "learning_rate": 9.769712342324023e-05, "loss": 2.3145, "step": 43784 }, { "epoch": 0.55, "learning_rate": 9.76688892486229e-05, "loss": 2.3048, "step": 43792 }, { "epoch": 0.55, "learning_rate": 9.764065631074606e-05, "loss": 2.3006, "step": 43800 }, { "epoch": 0.55, "learning_rate": 9.761242461244137e-05, "loss": 2.3134, "step": 43808 }, { "epoch": 0.55, "learning_rate": 9.758419415654034e-05, "loss": 2.2953, "step": 43816 }, { "epoch": 0.55, "learning_rate": 9.755596494587425e-05, "loss": 2.3063, "step": 43824 }, { "epoch": 0.55, "learning_rate": 9.752773698327435e-05, "loss": 2.3052, "step": 43832 }, { "epoch": 0.55, "learning_rate": 9.749951027157178e-05, "loss": 2.3159, "step": 43840 }, { "epoch": 0.55, "learning_rate": 9.747128481359751e-05, "loss": 2.2961, "step": 43848 }, { "epoch": 0.55, "learning_rate": 9.74430606121824e-05, "loss": 2.2969, "step": 43856 }, { "epoch": 0.55, "learning_rate": 9.741483767015709e-05, "loss": 2.2936, "step": 43864 }, { "epoch": 0.55, "learning_rate": 9.738661599035228e-05, "loss": 2.2882, "step": 43872 }, { "epoch": 0.55, "learning_rate": 9.735839557559843e-05, "loss": 2.2976, "step": 43880 }, { "epoch": 0.55, "learning_rate": 9.733017642872585e-05, "loss": 2.3021, "step": 43888 }, { "epoch": 0.55, "learning_rate": 9.73019585525648e-05, "loss": 2.3144, "step": 43896 }, { "epoch": 0.55, "learning_rate": 9.727374194994535e-05, "loss": 2.2869, "step": 43904 }, { "epoch": 0.55, "learning_rate": 9.724552662369748e-05, "loss": 2.2863, "step": 43912 }, { "epoch": 0.55, "learning_rate": 9.7217312576651e-05, "loss": 2.2926, "step": 43920 }, { "epoch": 0.55, "learning_rate": 9.718909981163569e-05, "loss": 2.298, "step": 43928 }, { "epoch": 0.55, "learning_rate": 9.716088833148105e-05, "loss": 2.3022, "step": 43936 }, { "epoch": 0.55, "learning_rate": 9.713267813901652e-05, "loss": 2.279, "step": 43944 }, { "epoch": 0.55, "learning_rate": 9.71044692370715e-05, "loss": 2.2969, "step": 43952 }, { "epoch": 0.55, "learning_rate": 9.707626162847511e-05, "loss": 2.3199, "step": 43960 }, { "epoch": 0.55, "learning_rate": 9.70480553160565e-05, "loss": 2.3056, "step": 43968 }, { "epoch": 0.55, "learning_rate": 9.701985030264451e-05, "loss": 2.3002, "step": 43976 }, { "epoch": 0.55, "learning_rate": 9.699164659106801e-05, "loss": 2.3045, "step": 43984 }, { "epoch": 0.55, "learning_rate": 9.696344418415566e-05, "loss": 2.3102, "step": 43992 }, { "epoch": 0.55, "learning_rate": 9.693524308473595e-05, "loss": 2.2897, "step": 44000 }, { "epoch": 0.55, "learning_rate": 9.690704329563735e-05, "loss": 2.3133, "step": 44008 }, { "epoch": 0.55, "learning_rate": 9.687884481968811e-05, "loss": 2.2975, "step": 44016 }, { "epoch": 0.55, "learning_rate": 9.685064765971641e-05, "loss": 2.2806, "step": 44024 }, { "epoch": 0.55, "learning_rate": 9.682245181855023e-05, "loss": 2.3249, "step": 44032 }, { "epoch": 0.55, "learning_rate": 9.679425729901743e-05, "loss": 2.2984, "step": 44040 }, { "epoch": 0.55, "learning_rate": 9.676606410394584e-05, "loss": 2.2948, "step": 44048 }, { "epoch": 0.55, "learning_rate": 9.673787223616302e-05, "loss": 2.3128, "step": 44056 }, { "epoch": 0.55, "learning_rate": 9.670968169849648e-05, "loss": 2.3133, "step": 44064 }, { "epoch": 0.55, "learning_rate": 9.668149249377354e-05, "loss": 2.3145, "step": 44072 }, { "epoch": 0.55, "learning_rate": 9.665330462482143e-05, "loss": 2.2746, "step": 44080 }, { "epoch": 0.55, "learning_rate": 9.662511809446726e-05, "loss": 2.2985, "step": 44088 }, { "epoch": 0.55, "learning_rate": 9.659693290553793e-05, "loss": 2.2929, "step": 44096 }, { "epoch": 0.55, "learning_rate": 9.656874906086031e-05, "loss": 2.3128, "step": 44104 }, { "epoch": 0.55, "learning_rate": 9.654056656326108e-05, "loss": 2.3123, "step": 44112 }, { "epoch": 0.55, "learning_rate": 9.651238541556669e-05, "loss": 2.2935, "step": 44120 }, { "epoch": 0.55, "learning_rate": 9.648420562060368e-05, "loss": 2.286, "step": 44128 }, { "epoch": 0.55, "learning_rate": 9.645602718119821e-05, "loss": 2.3084, "step": 44136 }, { "epoch": 0.55, "learning_rate": 9.64278501001765e-05, "loss": 2.3011, "step": 44144 }, { "epoch": 0.55, "learning_rate": 9.639967438036448e-05, "loss": 2.3173, "step": 44152 }, { "epoch": 0.55, "learning_rate": 9.637150002458813e-05, "loss": 2.3074, "step": 44160 }, { "epoch": 0.55, "learning_rate": 9.634332703567306e-05, "loss": 2.2841, "step": 44168 }, { "epoch": 0.55, "learning_rate": 9.631515541644487e-05, "loss": 2.3107, "step": 44176 }, { "epoch": 0.55, "learning_rate": 9.628698516972911e-05, "loss": 2.2944, "step": 44184 }, { "epoch": 0.55, "learning_rate": 9.6258816298351e-05, "loss": 2.2882, "step": 44192 }, { "epoch": 0.55, "learning_rate": 9.623064880513579e-05, "loss": 2.3073, "step": 44200 }, { "epoch": 0.55, "learning_rate": 9.620248269290846e-05, "loss": 2.3152, "step": 44208 }, { "epoch": 0.55, "learning_rate": 9.617431796449392e-05, "loss": 2.3081, "step": 44216 }, { "epoch": 0.55, "learning_rate": 9.614615462271698e-05, "loss": 2.2906, "step": 44224 }, { "epoch": 0.55, "learning_rate": 9.61179926704022e-05, "loss": 2.2955, "step": 44232 }, { "epoch": 0.55, "learning_rate": 9.60898321103741e-05, "loss": 2.2945, "step": 44240 }, { "epoch": 0.55, "learning_rate": 9.606167294545705e-05, "loss": 2.3038, "step": 44248 }, { "epoch": 0.55, "learning_rate": 9.603351517847519e-05, "loss": 2.2973, "step": 44256 }, { "epoch": 0.55, "learning_rate": 9.600535881225266e-05, "loss": 2.2903, "step": 44264 }, { "epoch": 0.55, "learning_rate": 9.59772038496133e-05, "loss": 2.2653, "step": 44272 }, { "epoch": 0.55, "learning_rate": 9.594905029338095e-05, "loss": 2.311, "step": 44280 }, { "epoch": 0.55, "learning_rate": 9.592089814637925e-05, "loss": 2.3064, "step": 44288 }, { "epoch": 0.55, "learning_rate": 9.589274741143166e-05, "loss": 2.3186, "step": 44296 }, { "epoch": 0.55, "learning_rate": 9.58645980913616e-05, "loss": 2.2997, "step": 44304 }, { "epoch": 0.55, "learning_rate": 9.583645018899223e-05, "loss": 2.2999, "step": 44312 }, { "epoch": 0.55, "learning_rate": 9.580830370714669e-05, "loss": 2.299, "step": 44320 }, { "epoch": 0.55, "learning_rate": 9.578015864864782e-05, "loss": 2.2914, "step": 44328 }, { "epoch": 0.55, "learning_rate": 9.575201501631853e-05, "loss": 2.3105, "step": 44336 }, { "epoch": 0.55, "learning_rate": 9.572387281298135e-05, "loss": 2.3056, "step": 44344 }, { "epoch": 0.55, "learning_rate": 9.569573204145881e-05, "loss": 2.293, "step": 44352 }, { "epoch": 0.55, "learning_rate": 9.566759270457337e-05, "loss": 2.2826, "step": 44360 }, { "epoch": 0.55, "learning_rate": 9.563945480514711e-05, "loss": 2.2935, "step": 44368 }, { "epoch": 0.55, "learning_rate": 9.561131834600216e-05, "loss": 2.3018, "step": 44376 }, { "epoch": 0.55, "learning_rate": 9.55831833299605e-05, "loss": 2.2963, "step": 44384 }, { "epoch": 0.55, "learning_rate": 9.555504975984382e-05, "loss": 2.2936, "step": 44392 }, { "epoch": 0.56, "learning_rate": 9.552691763847384e-05, "loss": 2.2907, "step": 44400 }, { "epoch": 0.56, "learning_rate": 9.549878696867196e-05, "loss": 2.3125, "step": 44408 }, { "epoch": 0.56, "learning_rate": 9.54706577532596e-05, "loss": 2.3076, "step": 44416 }, { "epoch": 0.56, "learning_rate": 9.544252999505796e-05, "loss": 2.2936, "step": 44424 }, { "epoch": 0.56, "learning_rate": 9.541440369688803e-05, "loss": 2.3006, "step": 44432 }, { "epoch": 0.56, "learning_rate": 9.538627886157081e-05, "loss": 2.3292, "step": 44440 }, { "epoch": 0.56, "learning_rate": 9.535815549192697e-05, "loss": 2.2957, "step": 44448 }, { "epoch": 0.56, "learning_rate": 9.533003359077721e-05, "loss": 2.3082, "step": 44456 }, { "epoch": 0.56, "learning_rate": 9.530191316094196e-05, "loss": 2.2839, "step": 44464 }, { "epoch": 0.56, "learning_rate": 9.52737942052415e-05, "loss": 2.302, "step": 44472 }, { "epoch": 0.56, "learning_rate": 9.524567672649605e-05, "loss": 2.307, "step": 44480 }, { "epoch": 0.56, "learning_rate": 9.521756072752562e-05, "loss": 2.2939, "step": 44488 }, { "epoch": 0.56, "learning_rate": 9.518944621115009e-05, "loss": 2.3133, "step": 44496 }, { "epoch": 0.56, "learning_rate": 9.516133318018919e-05, "loss": 2.3084, "step": 44504 }, { "epoch": 0.56, "learning_rate": 9.513322163746248e-05, "loss": 2.2941, "step": 44512 }, { "epoch": 0.56, "learning_rate": 9.510511158578943e-05, "loss": 2.2944, "step": 44520 }, { "epoch": 0.56, "learning_rate": 9.507700302798925e-05, "loss": 2.2914, "step": 44528 }, { "epoch": 0.56, "learning_rate": 9.504889596688113e-05, "loss": 2.2982, "step": 44536 }, { "epoch": 0.56, "learning_rate": 9.502079040528398e-05, "loss": 2.2999, "step": 44544 }, { "epoch": 0.56, "learning_rate": 9.499268634601675e-05, "loss": 2.3109, "step": 44552 }, { "epoch": 0.56, "learning_rate": 9.496458379189804e-05, "loss": 2.2933, "step": 44560 }, { "epoch": 0.56, "learning_rate": 9.493648274574632e-05, "loss": 2.284, "step": 44568 }, { "epoch": 0.56, "learning_rate": 9.490838321038005e-05, "loss": 2.2871, "step": 44576 }, { "epoch": 0.56, "learning_rate": 9.488028518861742e-05, "loss": 2.3025, "step": 44584 }, { "epoch": 0.56, "learning_rate": 9.485218868327654e-05, "loss": 2.3163, "step": 44592 }, { "epoch": 0.56, "learning_rate": 9.482409369717533e-05, "loss": 2.3007, "step": 44600 }, { "epoch": 0.56, "learning_rate": 9.479600023313144e-05, "loss": 2.2959, "step": 44608 }, { "epoch": 0.56, "learning_rate": 9.476790829396265e-05, "loss": 2.2752, "step": 44616 }, { "epoch": 0.56, "learning_rate": 9.473981788248632e-05, "loss": 2.3065, "step": 44624 }, { "epoch": 0.56, "learning_rate": 9.471172900151982e-05, "loss": 2.3096, "step": 44632 }, { "epoch": 0.56, "learning_rate": 9.468364165388024e-05, "loss": 2.3138, "step": 44640 }, { "epoch": 0.56, "learning_rate": 9.465555584238459e-05, "loss": 2.3157, "step": 44648 }, { "epoch": 0.56, "learning_rate": 9.46274715698498e-05, "loss": 2.286, "step": 44656 }, { "epoch": 0.56, "learning_rate": 9.459938883909246e-05, "loss": 2.304, "step": 44664 }, { "epoch": 0.56, "learning_rate": 9.457130765292919e-05, "loss": 2.3226, "step": 44672 }, { "epoch": 0.56, "learning_rate": 9.45432280141763e-05, "loss": 2.2986, "step": 44680 }, { "epoch": 0.56, "learning_rate": 9.451514992565009e-05, "loss": 2.2969, "step": 44688 }, { "epoch": 0.56, "learning_rate": 9.44870733901666e-05, "loss": 2.2838, "step": 44696 }, { "epoch": 0.56, "learning_rate": 9.445899841054174e-05, "loss": 2.3107, "step": 44704 }, { "epoch": 0.56, "learning_rate": 9.443092498959127e-05, "loss": 2.3009, "step": 44712 }, { "epoch": 0.56, "learning_rate": 9.44028531301308e-05, "loss": 2.2919, "step": 44720 }, { "epoch": 0.56, "learning_rate": 9.437478283497583e-05, "loss": 2.2823, "step": 44728 }, { "epoch": 0.56, "learning_rate": 9.434671410694156e-05, "loss": 2.3057, "step": 44736 }, { "epoch": 0.56, "learning_rate": 9.431864694884316e-05, "loss": 2.3022, "step": 44744 }, { "epoch": 0.56, "learning_rate": 9.429058136349564e-05, "loss": 2.328, "step": 44752 }, { "epoch": 0.56, "learning_rate": 9.426251735371378e-05, "loss": 2.2939, "step": 44760 }, { "epoch": 0.56, "learning_rate": 9.423445492231228e-05, "loss": 2.3189, "step": 44768 }, { "epoch": 0.56, "learning_rate": 9.420639407210561e-05, "loss": 2.2837, "step": 44776 }, { "epoch": 0.56, "learning_rate": 9.41783348059081e-05, "loss": 2.3248, "step": 44784 }, { "epoch": 0.56, "learning_rate": 9.415027712653399e-05, "loss": 2.2949, "step": 44792 }, { "epoch": 0.56, "learning_rate": 9.412222103679724e-05, "loss": 2.308, "step": 44800 }, { "epoch": 0.56, "learning_rate": 9.409416653951178e-05, "loss": 2.2958, "step": 44808 }, { "epoch": 0.56, "learning_rate": 9.40661136374913e-05, "loss": 2.283, "step": 44816 }, { "epoch": 0.56, "learning_rate": 9.40380623335493e-05, "loss": 2.2944, "step": 44824 }, { "epoch": 0.56, "learning_rate": 9.401001263049924e-05, "loss": 2.2861, "step": 44832 }, { "epoch": 0.56, "learning_rate": 9.398196453115427e-05, "loss": 2.3139, "step": 44840 }, { "epoch": 0.56, "learning_rate": 9.395391803832749e-05, "loss": 2.3026, "step": 44848 }, { "epoch": 0.56, "learning_rate": 9.392587315483184e-05, "loss": 2.29, "step": 44856 }, { "epoch": 0.56, "learning_rate": 9.389782988348001e-05, "loss": 2.2968, "step": 44864 }, { "epoch": 0.56, "learning_rate": 9.386978822708463e-05, "loss": 2.2976, "step": 44872 }, { "epoch": 0.56, "learning_rate": 9.384174818845806e-05, "loss": 2.2958, "step": 44880 }, { "epoch": 0.56, "learning_rate": 9.381370977041264e-05, "loss": 2.2975, "step": 44888 }, { "epoch": 0.56, "learning_rate": 9.378567297576035e-05, "loss": 2.2957, "step": 44896 }, { "epoch": 0.56, "learning_rate": 9.375763780731323e-05, "loss": 2.2832, "step": 44904 }, { "epoch": 0.56, "learning_rate": 9.3729604267883e-05, "loss": 2.2923, "step": 44912 }, { "epoch": 0.56, "learning_rate": 9.370157236028123e-05, "loss": 2.3051, "step": 44920 }, { "epoch": 0.56, "learning_rate": 9.367354208731945e-05, "loss": 2.3089, "step": 44928 }, { "epoch": 0.56, "learning_rate": 9.364551345180885e-05, "loss": 2.2897, "step": 44936 }, { "epoch": 0.56, "learning_rate": 9.361748645656059e-05, "loss": 2.2766, "step": 44944 }, { "epoch": 0.56, "learning_rate": 9.358946110438565e-05, "loss": 2.3074, "step": 44952 }, { "epoch": 0.56, "learning_rate": 9.356143739809471e-05, "loss": 2.2981, "step": 44960 }, { "epoch": 0.56, "learning_rate": 9.353341534049849e-05, "loss": 2.2768, "step": 44968 }, { "epoch": 0.56, "learning_rate": 9.35053949344074e-05, "loss": 2.2961, "step": 44976 }, { "epoch": 0.56, "learning_rate": 9.347737618263173e-05, "loss": 2.2824, "step": 44984 }, { "epoch": 0.56, "learning_rate": 9.344935908798162e-05, "loss": 2.2931, "step": 44992 }, { "epoch": 0.56, "learning_rate": 9.3421343653267e-05, "loss": 2.2919, "step": 45000 }, { "epoch": 0.56, "learning_rate": 9.339332988129766e-05, "loss": 2.2981, "step": 45008 }, { "epoch": 0.56, "learning_rate": 9.336531777488324e-05, "loss": 2.2888, "step": 45016 }, { "epoch": 0.56, "learning_rate": 9.33373073368332e-05, "loss": 2.2865, "step": 45024 }, { "epoch": 0.56, "learning_rate": 9.33092985699568e-05, "loss": 2.2976, "step": 45032 }, { "epoch": 0.56, "learning_rate": 9.328129147706323e-05, "loss": 2.2725, "step": 45040 }, { "epoch": 0.56, "learning_rate": 9.325328606096136e-05, "loss": 2.3004, "step": 45048 }, { "epoch": 0.56, "learning_rate": 9.322528232445997e-05, "loss": 2.3152, "step": 45056 }, { "epoch": 0.56, "learning_rate": 9.319728027036778e-05, "loss": 2.277, "step": 45064 }, { "epoch": 0.56, "learning_rate": 9.316927990149311e-05, "loss": 2.3114, "step": 45072 }, { "epoch": 0.56, "learning_rate": 9.314128122064431e-05, "loss": 2.2914, "step": 45080 }, { "epoch": 0.56, "learning_rate": 9.311328423062953e-05, "loss": 2.2849, "step": 45088 }, { "epoch": 0.56, "learning_rate": 9.308528893425659e-05, "loss": 2.2992, "step": 45096 }, { "epoch": 0.56, "learning_rate": 9.305729533433336e-05, "loss": 2.2908, "step": 45104 }, { "epoch": 0.56, "learning_rate": 9.302930343366739e-05, "loss": 2.2913, "step": 45112 }, { "epoch": 0.56, "learning_rate": 9.300131323506614e-05, "loss": 2.3015, "step": 45120 }, { "epoch": 0.56, "learning_rate": 9.297332474133684e-05, "loss": 2.2934, "step": 45128 }, { "epoch": 0.56, "learning_rate": 9.29453379552866e-05, "loss": 2.288, "step": 45136 }, { "epoch": 0.56, "learning_rate": 9.29173528797223e-05, "loss": 2.2725, "step": 45144 }, { "epoch": 0.56, "learning_rate": 9.288936951745071e-05, "loss": 2.3112, "step": 45152 }, { "epoch": 0.56, "learning_rate": 9.286138787127845e-05, "loss": 2.2873, "step": 45160 }, { "epoch": 0.56, "learning_rate": 9.283340794401187e-05, "loss": 2.3076, "step": 45168 }, { "epoch": 0.56, "learning_rate": 9.280542973845716e-05, "loss": 2.3029, "step": 45176 }, { "epoch": 0.56, "learning_rate": 9.277745325742044e-05, "loss": 2.2746, "step": 45184 }, { "epoch": 0.56, "learning_rate": 9.274947850370754e-05, "loss": 2.2837, "step": 45192 }, { "epoch": 0.56, "learning_rate": 9.272150548012427e-05, "loss": 2.3092, "step": 45200 }, { "epoch": 0.57, "learning_rate": 9.269353418947602e-05, "loss": 2.2926, "step": 45208 }, { "epoch": 0.57, "learning_rate": 9.266556463456826e-05, "loss": 2.2868, "step": 45216 }, { "epoch": 0.57, "learning_rate": 9.263759681820616e-05, "loss": 2.3081, "step": 45224 }, { "epoch": 0.57, "learning_rate": 9.260963074319469e-05, "loss": 2.2923, "step": 45232 }, { "epoch": 0.57, "learning_rate": 9.258166641233874e-05, "loss": 2.2925, "step": 45240 }, { "epoch": 0.57, "learning_rate": 9.255370382844292e-05, "loss": 2.3034, "step": 45248 }, { "epoch": 0.57, "learning_rate": 9.252574299431176e-05, "loss": 2.2927, "step": 45256 }, { "epoch": 0.57, "learning_rate": 9.249778391274962e-05, "loss": 2.2903, "step": 45264 }, { "epoch": 0.57, "learning_rate": 9.24698265865605e-05, "loss": 2.2981, "step": 45272 }, { "epoch": 0.57, "learning_rate": 9.244187101854847e-05, "loss": 2.2874, "step": 45280 }, { "epoch": 0.57, "learning_rate": 9.241391721151729e-05, "loss": 2.3192, "step": 45288 }, { "epoch": 0.57, "learning_rate": 9.238596516827056e-05, "loss": 2.2886, "step": 45296 }, { "epoch": 0.57, "learning_rate": 9.235801489161176e-05, "loss": 2.2944, "step": 45304 }, { "epoch": 0.57, "learning_rate": 9.233006638434403e-05, "loss": 2.2936, "step": 45312 }, { "epoch": 0.57, "learning_rate": 9.230211964927055e-05, "loss": 2.3177, "step": 45320 }, { "epoch": 0.57, "learning_rate": 9.22741746891942e-05, "loss": 2.2883, "step": 45328 }, { "epoch": 0.57, "learning_rate": 9.224623150691769e-05, "loss": 2.286, "step": 45336 }, { "epoch": 0.57, "learning_rate": 9.221829010524354e-05, "loss": 2.2937, "step": 45344 }, { "epoch": 0.57, "learning_rate": 9.219035048697413e-05, "loss": 2.2754, "step": 45352 }, { "epoch": 0.57, "learning_rate": 9.21624126549117e-05, "loss": 2.2949, "step": 45360 }, { "epoch": 0.57, "learning_rate": 9.213447661185814e-05, "loss": 2.2937, "step": 45368 }, { "epoch": 0.57, "learning_rate": 9.21065423606154e-05, "loss": 2.2918, "step": 45376 }, { "epoch": 0.57, "learning_rate": 9.207860990398504e-05, "loss": 2.2954, "step": 45384 }, { "epoch": 0.57, "learning_rate": 9.205067924476857e-05, "loss": 2.2767, "step": 45392 }, { "epoch": 0.57, "learning_rate": 9.202275038576728e-05, "loss": 2.2897, "step": 45400 }, { "epoch": 0.57, "learning_rate": 9.199482332978224e-05, "loss": 2.3068, "step": 45408 }, { "epoch": 0.57, "learning_rate": 9.19668980796144e-05, "loss": 2.2811, "step": 45416 }, { "epoch": 0.57, "learning_rate": 9.19389746380645e-05, "loss": 2.2993, "step": 45424 }, { "epoch": 0.57, "learning_rate": 9.191105300793311e-05, "loss": 2.3043, "step": 45432 }, { "epoch": 0.57, "learning_rate": 9.188313319202062e-05, "loss": 2.3052, "step": 45440 }, { "epoch": 0.57, "learning_rate": 9.185521519312719e-05, "loss": 2.29, "step": 45448 }, { "epoch": 0.57, "learning_rate": 9.182729901405287e-05, "loss": 2.286, "step": 45456 }, { "epoch": 0.57, "learning_rate": 9.179938465759747e-05, "loss": 2.304, "step": 45464 }, { "epoch": 0.57, "learning_rate": 9.177147212656069e-05, "loss": 2.294, "step": 45472 }, { "epoch": 0.57, "learning_rate": 9.174356142374196e-05, "loss": 2.2973, "step": 45480 }, { "epoch": 0.57, "learning_rate": 9.171565255194054e-05, "loss": 2.3022, "step": 45488 }, { "epoch": 0.57, "learning_rate": 9.168774551395563e-05, "loss": 2.3157, "step": 45496 }, { "epoch": 0.57, "learning_rate": 9.1659840312586e-05, "loss": 2.3247, "step": 45504 }, { "epoch": 0.57, "learning_rate": 9.163193695063054e-05, "loss": 2.2842, "step": 45512 }, { "epoch": 0.57, "learning_rate": 9.160403543088769e-05, "loss": 2.2827, "step": 45520 }, { "epoch": 0.57, "learning_rate": 9.157613575615585e-05, "loss": 2.2944, "step": 45528 }, { "epoch": 0.57, "learning_rate": 9.154823792923321e-05, "loss": 2.2814, "step": 45536 }, { "epoch": 0.57, "learning_rate": 9.152034195291771e-05, "loss": 2.2961, "step": 45544 }, { "epoch": 0.57, "learning_rate": 9.149244783000726e-05, "loss": 2.2884, "step": 45552 }, { "epoch": 0.57, "learning_rate": 9.146455556329938e-05, "loss": 2.3171, "step": 45560 }, { "epoch": 0.57, "learning_rate": 9.143666515559157e-05, "loss": 2.2987, "step": 45568 }, { "epoch": 0.57, "learning_rate": 9.140877660968108e-05, "loss": 2.3025, "step": 45576 }, { "epoch": 0.57, "learning_rate": 9.138088992836488e-05, "loss": 2.2871, "step": 45584 }, { "epoch": 0.57, "learning_rate": 9.135300511444e-05, "loss": 2.2779, "step": 45592 }, { "epoch": 0.57, "learning_rate": 9.1325122170703e-05, "loss": 2.2873, "step": 45600 }, { "epoch": 0.57, "learning_rate": 9.129724109995043e-05, "loss": 2.2971, "step": 45608 }, { "epoch": 0.57, "learning_rate": 9.126936190497864e-05, "loss": 2.3215, "step": 45616 }, { "epoch": 0.57, "learning_rate": 9.124148458858366e-05, "loss": 2.2876, "step": 45624 }, { "epoch": 0.57, "learning_rate": 9.121360915356155e-05, "loss": 2.2955, "step": 45632 }, { "epoch": 0.57, "learning_rate": 9.118573560270794e-05, "loss": 2.2958, "step": 45640 }, { "epoch": 0.57, "learning_rate": 9.115786393881844e-05, "loss": 2.3108, "step": 45648 }, { "epoch": 0.57, "learning_rate": 9.112999416468848e-05, "loss": 2.3128, "step": 45656 }, { "epoch": 0.57, "learning_rate": 9.110212628311313e-05, "loss": 2.2928, "step": 45664 }, { "epoch": 0.57, "learning_rate": 9.107426029688745e-05, "loss": 2.2802, "step": 45672 }, { "epoch": 0.57, "learning_rate": 9.10463962088062e-05, "loss": 2.3134, "step": 45680 }, { "epoch": 0.57, "learning_rate": 9.101853402166402e-05, "loss": 2.3189, "step": 45688 }, { "epoch": 0.57, "learning_rate": 9.099067373825537e-05, "loss": 2.325, "step": 45696 }, { "epoch": 0.57, "learning_rate": 9.096281536137437e-05, "loss": 2.3141, "step": 45704 }, { "epoch": 0.57, "learning_rate": 9.093495889381516e-05, "loss": 2.3007, "step": 45712 }, { "epoch": 0.57, "learning_rate": 9.090710433837151e-05, "loss": 2.2985, "step": 45720 }, { "epoch": 0.57, "learning_rate": 9.087925169783713e-05, "loss": 2.2951, "step": 45728 }, { "epoch": 0.57, "learning_rate": 9.085140097500544e-05, "loss": 2.2774, "step": 45736 }, { "epoch": 0.57, "learning_rate": 9.082355217266978e-05, "loss": 2.2902, "step": 45744 }, { "epoch": 0.57, "learning_rate": 9.079570529362313e-05, "loss": 2.2977, "step": 45752 }, { "epoch": 0.57, "learning_rate": 9.076786034065842e-05, "loss": 2.3039, "step": 45760 }, { "epoch": 0.57, "learning_rate": 9.074001731656839e-05, "loss": 2.3134, "step": 45768 }, { "epoch": 0.57, "learning_rate": 9.071217622414543e-05, "loss": 2.291, "step": 45776 }, { "epoch": 0.57, "learning_rate": 9.068433706618193e-05, "loss": 2.3016, "step": 45784 }, { "epoch": 0.57, "learning_rate": 9.065649984547e-05, "loss": 2.2941, "step": 45792 }, { "epoch": 0.57, "learning_rate": 9.06286645648015e-05, "loss": 2.2863, "step": 45800 }, { "epoch": 0.57, "learning_rate": 9.06008312269682e-05, "loss": 2.288, "step": 45808 }, { "epoch": 0.57, "learning_rate": 9.057299983476157e-05, "loss": 2.2841, "step": 45816 }, { "epoch": 0.57, "learning_rate": 9.054517039097301e-05, "loss": 2.3119, "step": 45824 }, { "epoch": 0.57, "learning_rate": 9.051734289839363e-05, "loss": 2.3046, "step": 45832 }, { "epoch": 0.57, "learning_rate": 9.048951735981433e-05, "loss": 2.2852, "step": 45840 }, { "epoch": 0.57, "learning_rate": 9.046169377802589e-05, "loss": 2.2851, "step": 45848 }, { "epoch": 0.57, "learning_rate": 9.043387215581884e-05, "loss": 2.2761, "step": 45856 }, { "epoch": 0.57, "learning_rate": 9.04060524959836e-05, "loss": 2.3052, "step": 45864 }, { "epoch": 0.57, "learning_rate": 9.037823480131023e-05, "loss": 2.3008, "step": 45872 }, { "epoch": 0.57, "learning_rate": 9.035041907458874e-05, "loss": 2.264, "step": 45880 }, { "epoch": 0.57, "learning_rate": 9.032260531860888e-05, "loss": 2.284, "step": 45888 }, { "epoch": 0.57, "learning_rate": 9.029479353616018e-05, "loss": 2.2915, "step": 45896 }, { "epoch": 0.57, "learning_rate": 9.026698373003208e-05, "loss": 2.2846, "step": 45904 }, { "epoch": 0.57, "learning_rate": 9.023917590301365e-05, "loss": 2.3085, "step": 45912 }, { "epoch": 0.57, "learning_rate": 9.021137005789394e-05, "loss": 2.2704, "step": 45920 }, { "epoch": 0.57, "learning_rate": 9.018356619746166e-05, "loss": 2.2944, "step": 45928 }, { "epoch": 0.57, "learning_rate": 9.015576432450541e-05, "loss": 2.2966, "step": 45936 }, { "epoch": 0.57, "learning_rate": 9.012796444181357e-05, "loss": 2.2991, "step": 45944 }, { "epoch": 0.57, "learning_rate": 9.010016655217428e-05, "loss": 2.2947, "step": 45952 }, { "epoch": 0.57, "learning_rate": 9.007237065837552e-05, "loss": 2.2893, "step": 45960 }, { "epoch": 0.57, "learning_rate": 9.00445767632051e-05, "loss": 2.3064, "step": 45968 }, { "epoch": 0.57, "learning_rate": 9.001678486945053e-05, "loss": 2.3045, "step": 45976 }, { "epoch": 0.57, "learning_rate": 8.99889949798992e-05, "loss": 2.3081, "step": 45984 }, { "epoch": 0.57, "learning_rate": 8.996120709733829e-05, "loss": 2.2962, "step": 45992 }, { "epoch": 0.57, "learning_rate": 8.99334212245548e-05, "loss": 2.2801, "step": 46000 }, { "epoch": 0.58, "learning_rate": 8.990563736433541e-05, "loss": 2.2993, "step": 46008 }, { "epoch": 0.58, "learning_rate": 8.987785551946675e-05, "loss": 2.2789, "step": 46016 }, { "epoch": 0.58, "learning_rate": 8.985007569273516e-05, "loss": 2.2743, "step": 46024 }, { "epoch": 0.58, "learning_rate": 8.982229788692678e-05, "loss": 2.291, "step": 46032 }, { "epoch": 0.58, "learning_rate": 8.979452210482763e-05, "loss": 2.2813, "step": 46040 }, { "epoch": 0.58, "learning_rate": 8.976674834922339e-05, "loss": 2.3083, "step": 46048 }, { "epoch": 0.58, "learning_rate": 8.973897662289966e-05, "loss": 2.3035, "step": 46056 }, { "epoch": 0.58, "learning_rate": 8.971120692864179e-05, "loss": 2.2905, "step": 46064 }, { "epoch": 0.58, "learning_rate": 8.968343926923485e-05, "loss": 2.3, "step": 46072 }, { "epoch": 0.58, "learning_rate": 8.965567364746388e-05, "loss": 2.2914, "step": 46080 }, { "epoch": 0.58, "learning_rate": 8.962791006611355e-05, "loss": 2.2907, "step": 46088 }, { "epoch": 0.58, "learning_rate": 8.960014852796839e-05, "loss": 2.2903, "step": 46096 }, { "epoch": 0.58, "learning_rate": 8.957238903581278e-05, "loss": 2.2917, "step": 46104 }, { "epoch": 0.58, "learning_rate": 8.954463159243073e-05, "loss": 2.2701, "step": 46112 }, { "epoch": 0.58, "learning_rate": 8.95168762006063e-05, "loss": 2.3019, "step": 46120 }, { "epoch": 0.58, "learning_rate": 8.948912286312306e-05, "loss": 2.2809, "step": 46128 }, { "epoch": 0.58, "learning_rate": 8.946137158276461e-05, "loss": 2.3004, "step": 46136 }, { "epoch": 0.58, "learning_rate": 8.943362236231425e-05, "loss": 2.3145, "step": 46144 }, { "epoch": 0.58, "learning_rate": 8.940587520455496e-05, "loss": 2.2967, "step": 46152 }, { "epoch": 0.58, "learning_rate": 8.937813011226972e-05, "loss": 2.294, "step": 46160 }, { "epoch": 0.58, "learning_rate": 8.935038708824117e-05, "loss": 2.2884, "step": 46168 }, { "epoch": 0.58, "learning_rate": 8.932264613525183e-05, "loss": 2.3068, "step": 46176 }, { "epoch": 0.58, "learning_rate": 8.929490725608389e-05, "loss": 2.2923, "step": 46184 }, { "epoch": 0.58, "learning_rate": 8.926717045351942e-05, "loss": 2.2819, "step": 46192 }, { "epoch": 0.58, "learning_rate": 8.923943573034031e-05, "loss": 2.3054, "step": 46200 }, { "epoch": 0.58, "learning_rate": 8.921170308932811e-05, "loss": 2.2758, "step": 46208 }, { "epoch": 0.58, "learning_rate": 8.918397253326433e-05, "loss": 2.2963, "step": 46216 }, { "epoch": 0.58, "learning_rate": 8.915624406493016e-05, "loss": 2.2893, "step": 46224 }, { "epoch": 0.58, "learning_rate": 8.912851768710657e-05, "loss": 2.285, "step": 46232 }, { "epoch": 0.58, "learning_rate": 8.910079340257444e-05, "loss": 2.3097, "step": 46240 }, { "epoch": 0.58, "learning_rate": 8.907307121411426e-05, "loss": 2.2888, "step": 46248 }, { "epoch": 0.58, "learning_rate": 8.904535112450649e-05, "loss": 2.283, "step": 46256 }, { "epoch": 0.58, "learning_rate": 8.901763313653125e-05, "loss": 2.2802, "step": 46264 }, { "epoch": 0.58, "learning_rate": 8.898991725296852e-05, "loss": 2.2998, "step": 46272 }, { "epoch": 0.58, "learning_rate": 8.896220347659807e-05, "loss": 2.292, "step": 46280 }, { "epoch": 0.58, "learning_rate": 8.893449181019935e-05, "loss": 2.3059, "step": 46288 }, { "epoch": 0.58, "learning_rate": 8.890678225655178e-05, "loss": 2.2975, "step": 46296 }, { "epoch": 0.58, "learning_rate": 8.887907481843438e-05, "loss": 2.2791, "step": 46304 }, { "epoch": 0.58, "learning_rate": 8.885136949862616e-05, "loss": 2.2875, "step": 46312 }, { "epoch": 0.58, "learning_rate": 8.882366629990571e-05, "loss": 2.2904, "step": 46320 }, { "epoch": 0.58, "learning_rate": 8.879596522505153e-05, "loss": 2.3126, "step": 46328 }, { "epoch": 0.58, "learning_rate": 8.876826627684191e-05, "loss": 2.2879, "step": 46336 }, { "epoch": 0.58, "learning_rate": 8.874056945805487e-05, "loss": 2.2791, "step": 46344 }, { "epoch": 0.58, "learning_rate": 8.871287477146826e-05, "loss": 2.2887, "step": 46352 }, { "epoch": 0.58, "learning_rate": 8.868518221985968e-05, "loss": 2.2978, "step": 46360 }, { "epoch": 0.58, "learning_rate": 8.865749180600653e-05, "loss": 2.3063, "step": 46368 }, { "epoch": 0.58, "learning_rate": 8.862980353268606e-05, "loss": 2.2812, "step": 46376 }, { "epoch": 0.58, "learning_rate": 8.860211740267516e-05, "loss": 2.2669, "step": 46384 }, { "epoch": 0.58, "learning_rate": 8.857443341875067e-05, "loss": 2.302, "step": 46392 }, { "epoch": 0.58, "learning_rate": 8.854675158368909e-05, "loss": 2.2953, "step": 46400 }, { "epoch": 0.58, "learning_rate": 8.851907190026678e-05, "loss": 2.2824, "step": 46408 }, { "epoch": 0.58, "learning_rate": 8.849139437125985e-05, "loss": 2.3172, "step": 46416 }, { "epoch": 0.58, "learning_rate": 8.846371899944413e-05, "loss": 2.2976, "step": 46424 }, { "epoch": 0.58, "learning_rate": 8.843604578759544e-05, "loss": 2.3026, "step": 46432 }, { "epoch": 0.58, "learning_rate": 8.840837473848911e-05, "loss": 2.306, "step": 46440 }, { "epoch": 0.58, "learning_rate": 8.838070585490048e-05, "loss": 2.2931, "step": 46448 }, { "epoch": 0.58, "learning_rate": 8.835303913960455e-05, "loss": 2.2862, "step": 46456 }, { "epoch": 0.58, "learning_rate": 8.832537459537611e-05, "loss": 2.3008, "step": 46464 }, { "epoch": 0.58, "learning_rate": 8.829771222498981e-05, "loss": 2.2791, "step": 46472 }, { "epoch": 0.58, "learning_rate": 8.827005203121998e-05, "loss": 2.2934, "step": 46480 }, { "epoch": 0.58, "learning_rate": 8.824239401684083e-05, "loss": 2.2906, "step": 46488 }, { "epoch": 0.58, "learning_rate": 8.821473818462627e-05, "loss": 2.3209, "step": 46496 }, { "epoch": 0.58, "learning_rate": 8.818708453735001e-05, "loss": 2.3005, "step": 46504 }, { "epoch": 0.58, "learning_rate": 8.815943307778561e-05, "loss": 2.3194, "step": 46512 }, { "epoch": 0.58, "learning_rate": 8.813178380870625e-05, "loss": 2.2927, "step": 46520 }, { "epoch": 0.58, "learning_rate": 8.810413673288511e-05, "loss": 2.2937, "step": 46528 }, { "epoch": 0.58, "learning_rate": 8.807649185309498e-05, "loss": 2.2878, "step": 46536 }, { "epoch": 0.58, "learning_rate": 8.804884917210849e-05, "loss": 2.2774, "step": 46544 }, { "epoch": 0.58, "learning_rate": 8.802120869269805e-05, "loss": 2.2864, "step": 46552 }, { "epoch": 0.58, "learning_rate": 8.799357041763581e-05, "loss": 2.2788, "step": 46560 }, { "epoch": 0.58, "learning_rate": 8.79659343496938e-05, "loss": 2.293, "step": 46568 }, { "epoch": 0.58, "learning_rate": 8.793830049164369e-05, "loss": 2.2979, "step": 46576 }, { "epoch": 0.58, "learning_rate": 8.791066884625707e-05, "loss": 2.2982, "step": 46584 }, { "epoch": 0.58, "learning_rate": 8.788303941630518e-05, "loss": 2.2859, "step": 46592 }, { "epoch": 0.58, "learning_rate": 8.78554122045591e-05, "loss": 2.2981, "step": 46600 }, { "epoch": 0.58, "learning_rate": 8.782778721378973e-05, "loss": 2.2858, "step": 46608 }, { "epoch": 0.58, "learning_rate": 8.780016444676764e-05, "loss": 2.2771, "step": 46616 }, { "epoch": 0.58, "learning_rate": 8.777254390626329e-05, "loss": 2.3085, "step": 46624 }, { "epoch": 0.58, "learning_rate": 8.774492559504683e-05, "loss": 2.2926, "step": 46632 }, { "epoch": 0.58, "learning_rate": 8.77173095158882e-05, "loss": 2.2986, "step": 46640 }, { "epoch": 0.58, "learning_rate": 8.76896956715572e-05, "loss": 2.2903, "step": 46648 }, { "epoch": 0.58, "learning_rate": 8.766208406482327e-05, "loss": 2.3169, "step": 46656 }, { "epoch": 0.58, "learning_rate": 8.763447469845576e-05, "loss": 2.2932, "step": 46664 }, { "epoch": 0.58, "learning_rate": 8.760686757522374e-05, "loss": 2.2838, "step": 46672 }, { "epoch": 0.58, "learning_rate": 8.757926269789596e-05, "loss": 2.2914, "step": 46680 }, { "epoch": 0.58, "learning_rate": 8.755166006924112e-05, "loss": 2.2918, "step": 46688 }, { "epoch": 0.58, "learning_rate": 8.752405969202755e-05, "loss": 2.2939, "step": 46696 }, { "epoch": 0.58, "learning_rate": 8.749646156902347e-05, "loss": 2.3129, "step": 46704 }, { "epoch": 0.58, "learning_rate": 8.74688657029968e-05, "loss": 2.2885, "step": 46712 }, { "epoch": 0.58, "learning_rate": 8.744127209671517e-05, "loss": 2.3108, "step": 46720 }, { "epoch": 0.58, "learning_rate": 8.741368075294616e-05, "loss": 2.2734, "step": 46728 }, { "epoch": 0.58, "learning_rate": 8.738609167445695e-05, "loss": 2.2924, "step": 46736 }, { "epoch": 0.58, "learning_rate": 8.735850486401466e-05, "loss": 2.2828, "step": 46744 }, { "epoch": 0.58, "learning_rate": 8.733092032438601e-05, "loss": 2.2692, "step": 46752 }, { "epoch": 0.58, "learning_rate": 8.730333805833759e-05, "loss": 2.2952, "step": 46760 }, { "epoch": 0.58, "learning_rate": 8.727575806863581e-05, "loss": 2.3156, "step": 46768 }, { "epoch": 0.58, "learning_rate": 8.724818035804667e-05, "loss": 2.2924, "step": 46776 }, { "epoch": 0.58, "learning_rate": 8.722060492933616e-05, "loss": 2.2943, "step": 46784 }, { "epoch": 0.58, "learning_rate": 8.71930317852699e-05, "loss": 2.2949, "step": 46792 }, { "epoch": 0.58, "learning_rate": 8.716546092861331e-05, "loss": 2.3124, "step": 46800 }, { "epoch": 0.59, "learning_rate": 8.71378923621316e-05, "loss": 2.2969, "step": 46808 }, { "epoch": 0.59, "learning_rate": 8.711032608858974e-05, "loss": 2.2802, "step": 46816 }, { "epoch": 0.59, "learning_rate": 8.708276211075248e-05, "loss": 2.2939, "step": 46824 }, { "epoch": 0.59, "learning_rate": 8.705520043138431e-05, "loss": 2.2812, "step": 46832 }, { "epoch": 0.59, "learning_rate": 8.702764105324954e-05, "loss": 2.3016, "step": 46840 }, { "epoch": 0.59, "learning_rate": 8.700008397911221e-05, "loss": 2.2774, "step": 46848 }, { "epoch": 0.59, "learning_rate": 8.697252921173611e-05, "loss": 2.2791, "step": 46856 }, { "epoch": 0.59, "learning_rate": 8.694497675388487e-05, "loss": 2.2931, "step": 46864 }, { "epoch": 0.59, "learning_rate": 8.691742660832178e-05, "loss": 2.2903, "step": 46872 }, { "epoch": 0.59, "learning_rate": 8.688987877781007e-05, "loss": 2.2856, "step": 46880 }, { "epoch": 0.59, "learning_rate": 8.686233326511255e-05, "loss": 2.3065, "step": 46888 }, { "epoch": 0.59, "learning_rate": 8.683479007299187e-05, "loss": 2.3015, "step": 46896 }, { "epoch": 0.59, "learning_rate": 8.680724920421053e-05, "loss": 2.2848, "step": 46904 }, { "epoch": 0.59, "learning_rate": 8.677971066153063e-05, "loss": 2.2821, "step": 46912 }, { "epoch": 0.59, "learning_rate": 8.675217444771422e-05, "loss": 2.3013, "step": 46920 }, { "epoch": 0.59, "learning_rate": 8.672464056552294e-05, "loss": 2.29, "step": 46928 }, { "epoch": 0.59, "learning_rate": 8.669710901771834e-05, "loss": 2.2922, "step": 46936 }, { "epoch": 0.59, "learning_rate": 8.666957980706172e-05, "loss": 2.2894, "step": 46944 }, { "epoch": 0.59, "learning_rate": 8.664205293631397e-05, "loss": 2.3048, "step": 46952 }, { "epoch": 0.59, "learning_rate": 8.661452840823598e-05, "loss": 2.2729, "step": 46960 }, { "epoch": 0.59, "learning_rate": 8.658700622558829e-05, "loss": 2.2823, "step": 46968 }, { "epoch": 0.59, "learning_rate": 8.655948639113122e-05, "loss": 2.3191, "step": 46976 }, { "epoch": 0.59, "learning_rate": 8.653196890762486e-05, "loss": 2.3, "step": 46984 }, { "epoch": 0.59, "learning_rate": 8.650445377782899e-05, "loss": 2.2593, "step": 46992 }, { "epoch": 0.59, "learning_rate": 8.64769410045033e-05, "loss": 2.2855, "step": 47000 }, { "epoch": 0.59, "learning_rate": 8.644943059040713e-05, "loss": 2.2902, "step": 47008 }, { "epoch": 0.59, "learning_rate": 8.642192253829964e-05, "loss": 2.2908, "step": 47016 }, { "epoch": 0.59, "learning_rate": 8.639441685093973e-05, "loss": 2.2773, "step": 47024 }, { "epoch": 0.59, "learning_rate": 8.636691353108602e-05, "loss": 2.2824, "step": 47032 }, { "epoch": 0.59, "learning_rate": 8.633941258149698e-05, "loss": 2.2896, "step": 47040 }, { "epoch": 0.59, "learning_rate": 8.631191400493079e-05, "loss": 2.2833, "step": 47048 }, { "epoch": 0.59, "learning_rate": 8.628441780414542e-05, "loss": 2.275, "step": 47056 }, { "epoch": 0.59, "learning_rate": 8.625692398189856e-05, "loss": 2.2652, "step": 47064 }, { "epoch": 0.59, "learning_rate": 8.622943254094766e-05, "loss": 2.289, "step": 47072 }, { "epoch": 0.59, "learning_rate": 8.620194348405003e-05, "loss": 2.2838, "step": 47080 }, { "epoch": 0.59, "learning_rate": 8.617445681396257e-05, "loss": 2.3225, "step": 47088 }, { "epoch": 0.59, "learning_rate": 8.614697253344211e-05, "loss": 2.3051, "step": 47096 }, { "epoch": 0.59, "learning_rate": 8.611949064524514e-05, "loss": 2.287, "step": 47104 }, { "epoch": 0.59, "learning_rate": 8.609201115212797e-05, "loss": 2.2978, "step": 47112 }, { "epoch": 0.59, "learning_rate": 8.606453405684662e-05, "loss": 2.307, "step": 47120 }, { "epoch": 0.59, "learning_rate": 8.603705936215682e-05, "loss": 2.3043, "step": 47128 }, { "epoch": 0.59, "learning_rate": 8.600958707081424e-05, "loss": 2.2614, "step": 47136 }, { "epoch": 0.59, "learning_rate": 8.59821171855741e-05, "loss": 2.281, "step": 47144 }, { "epoch": 0.59, "learning_rate": 8.595464970919154e-05, "loss": 2.2977, "step": 47152 }, { "epoch": 0.59, "learning_rate": 8.592718464442135e-05, "loss": 2.286, "step": 47160 }, { "epoch": 0.59, "learning_rate": 8.589972199401812e-05, "loss": 2.2882, "step": 47168 }, { "epoch": 0.59, "learning_rate": 8.587226176073626e-05, "loss": 2.2814, "step": 47176 }, { "epoch": 0.59, "learning_rate": 8.584480394732978e-05, "loss": 2.2769, "step": 47184 }, { "epoch": 0.59, "learning_rate": 8.581734855655266e-05, "loss": 2.2947, "step": 47192 }, { "epoch": 0.59, "learning_rate": 8.578989559115842e-05, "loss": 2.2816, "step": 47200 }, { "epoch": 0.59, "learning_rate": 8.576244505390045e-05, "loss": 2.2802, "step": 47208 }, { "epoch": 0.59, "learning_rate": 8.573499694753194e-05, "loss": 2.2707, "step": 47216 }, { "epoch": 0.59, "learning_rate": 8.57075512748057e-05, "loss": 2.281, "step": 47224 }, { "epoch": 0.59, "learning_rate": 8.568010803847444e-05, "loss": 2.2832, "step": 47232 }, { "epoch": 0.59, "learning_rate": 8.565266724129055e-05, "loss": 2.2764, "step": 47240 }, { "epoch": 0.59, "learning_rate": 8.562522888600614e-05, "loss": 2.3093, "step": 47248 }, { "epoch": 0.59, "learning_rate": 8.559779297537323e-05, "loss": 2.2952, "step": 47256 }, { "epoch": 0.59, "learning_rate": 8.557035951214334e-05, "loss": 2.2961, "step": 47264 }, { "epoch": 0.59, "learning_rate": 8.554292849906797e-05, "loss": 2.2849, "step": 47272 }, { "epoch": 0.59, "learning_rate": 8.551549993889831e-05, "loss": 2.3083, "step": 47280 }, { "epoch": 0.59, "learning_rate": 8.548807383438528e-05, "loss": 2.2844, "step": 47288 }, { "epoch": 0.59, "learning_rate": 8.546065018827956e-05, "loss": 2.2628, "step": 47296 }, { "epoch": 0.59, "learning_rate": 8.543322900333152e-05, "loss": 2.2998, "step": 47304 }, { "epoch": 0.59, "learning_rate": 8.540581028229149e-05, "loss": 2.3172, "step": 47312 }, { "epoch": 0.59, "learning_rate": 8.537839402790928e-05, "loss": 2.2872, "step": 47320 }, { "epoch": 0.59, "learning_rate": 8.535098024293466e-05, "loss": 2.2958, "step": 47328 }, { "epoch": 0.59, "learning_rate": 8.532356893011704e-05, "loss": 2.2943, "step": 47336 }, { "epoch": 0.59, "learning_rate": 8.52961600922056e-05, "loss": 2.2966, "step": 47344 }, { "epoch": 0.59, "learning_rate": 8.526875373194938e-05, "loss": 2.2766, "step": 47352 }, { "epoch": 0.59, "learning_rate": 8.524134985209698e-05, "loss": 2.2856, "step": 47360 }, { "epoch": 0.59, "learning_rate": 8.521394845539692e-05, "loss": 2.2947, "step": 47368 }, { "epoch": 0.59, "learning_rate": 8.518654954459739e-05, "loss": 2.3038, "step": 47376 }, { "epoch": 0.59, "learning_rate": 8.515915312244631e-05, "loss": 2.2959, "step": 47384 }, { "epoch": 0.59, "learning_rate": 8.513175919169147e-05, "loss": 2.2896, "step": 47392 }, { "epoch": 0.59, "learning_rate": 8.510436775508022e-05, "loss": 2.2947, "step": 47400 }, { "epoch": 0.59, "learning_rate": 8.507697881535983e-05, "loss": 2.3049, "step": 47408 }, { "epoch": 0.59, "learning_rate": 8.50495923752773e-05, "loss": 2.2986, "step": 47416 }, { "epoch": 0.59, "learning_rate": 8.50222084375792e-05, "loss": 2.2964, "step": 47424 }, { "epoch": 0.59, "learning_rate": 8.499482700501209e-05, "loss": 2.2985, "step": 47432 }, { "epoch": 0.59, "learning_rate": 8.496744808032213e-05, "loss": 2.3122, "step": 47440 }, { "epoch": 0.59, "learning_rate": 8.494007166625531e-05, "loss": 2.3028, "step": 47448 }, { "epoch": 0.59, "learning_rate": 8.491269776555728e-05, "loss": 2.2938, "step": 47456 }, { "epoch": 0.59, "learning_rate": 8.488532638097353e-05, "loss": 2.2895, "step": 47464 }, { "epoch": 0.59, "learning_rate": 8.485795751524925e-05, "loss": 2.2876, "step": 47472 }, { "epoch": 0.59, "learning_rate": 8.483059117112934e-05, "loss": 2.2789, "step": 47480 }, { "epoch": 0.59, "learning_rate": 8.480322735135855e-05, "loss": 2.275, "step": 47488 }, { "epoch": 0.59, "learning_rate": 8.477586605868125e-05, "loss": 2.296, "step": 47496 }, { "epoch": 0.59, "learning_rate": 8.474850729584166e-05, "loss": 2.2917, "step": 47504 }, { "epoch": 0.59, "learning_rate": 8.472115106558374e-05, "loss": 2.282, "step": 47512 }, { "epoch": 0.59, "learning_rate": 8.469379737065108e-05, "loss": 2.2934, "step": 47520 }, { "epoch": 0.59, "learning_rate": 8.466644621378718e-05, "loss": 2.2988, "step": 47528 }, { "epoch": 0.59, "learning_rate": 8.463909759773516e-05, "loss": 2.2761, "step": 47536 }, { "epoch": 0.59, "learning_rate": 8.461175152523799e-05, "loss": 2.2779, "step": 47544 }, { "epoch": 0.59, "learning_rate": 8.458440799903826e-05, "loss": 2.2903, "step": 47552 }, { "epoch": 0.59, "learning_rate": 8.455706702187837e-05, "loss": 2.3057, "step": 47560 }, { "epoch": 0.59, "learning_rate": 8.452972859650052e-05, "loss": 2.2912, "step": 47568 }, { "epoch": 0.59, "learning_rate": 8.450239272564656e-05, "loss": 2.3204, "step": 47576 }, { "epoch": 0.59, "learning_rate": 8.447505941205814e-05, "loss": 2.2923, "step": 47584 }, { "epoch": 0.59, "learning_rate": 8.444772865847661e-05, "loss": 2.2888, "step": 47592 }, { "epoch": 0.59, "learning_rate": 8.44204004676431e-05, "loss": 2.2744, "step": 47600 }, { "epoch": 0.6, "learning_rate": 8.439307484229853e-05, "loss": 2.2943, "step": 47608 }, { "epoch": 0.6, "learning_rate": 8.43657517851834e-05, "loss": 2.2959, "step": 47616 }, { "epoch": 0.6, "learning_rate": 8.433843129903818e-05, "loss": 2.2875, "step": 47624 }, { "epoch": 0.6, "learning_rate": 8.431111338660283e-05, "loss": 2.2976, "step": 47632 }, { "epoch": 0.6, "learning_rate": 8.428379805061725e-05, "loss": 2.2787, "step": 47640 }, { "epoch": 0.6, "learning_rate": 8.425648529382107e-05, "loss": 2.2982, "step": 47648 }, { "epoch": 0.6, "learning_rate": 8.42291751189535e-05, "loss": 2.2897, "step": 47656 }, { "epoch": 0.6, "learning_rate": 8.420186752875363e-05, "loss": 2.2981, "step": 47664 }, { "epoch": 0.6, "learning_rate": 8.417456252596027e-05, "loss": 2.2776, "step": 47672 }, { "epoch": 0.6, "learning_rate": 8.414726011331197e-05, "loss": 2.2887, "step": 47680 }, { "epoch": 0.6, "learning_rate": 8.411996029354703e-05, "loss": 2.2873, "step": 47688 }, { "epoch": 0.6, "learning_rate": 8.409266306940336e-05, "loss": 2.2809, "step": 47696 }, { "epoch": 0.6, "learning_rate": 8.406536844361881e-05, "loss": 2.2981, "step": 47704 }, { "epoch": 0.6, "learning_rate": 8.403807641893082e-05, "loss": 2.2948, "step": 47712 }, { "epoch": 0.6, "learning_rate": 8.401078699807672e-05, "loss": 2.2959, "step": 47720 }, { "epoch": 0.6, "learning_rate": 8.398350018379339e-05, "loss": 2.2763, "step": 47728 }, { "epoch": 0.6, "learning_rate": 8.395621597881756e-05, "loss": 2.2872, "step": 47736 }, { "epoch": 0.6, "learning_rate": 8.392893438588572e-05, "loss": 2.286, "step": 47744 }, { "epoch": 0.6, "learning_rate": 8.390165540773401e-05, "loss": 2.2588, "step": 47752 }, { "epoch": 0.6, "learning_rate": 8.38743790470984e-05, "loss": 2.2955, "step": 47760 }, { "epoch": 0.6, "learning_rate": 8.384710530671453e-05, "loss": 2.2967, "step": 47768 }, { "epoch": 0.6, "learning_rate": 8.38198341893178e-05, "loss": 2.2893, "step": 47776 }, { "epoch": 0.6, "learning_rate": 8.379256569764338e-05, "loss": 2.2892, "step": 47784 }, { "epoch": 0.6, "learning_rate": 8.37652998344261e-05, "loss": 2.293, "step": 47792 }, { "epoch": 0.6, "learning_rate": 8.373803660240058e-05, "loss": 2.3, "step": 47800 }, { "epoch": 0.6, "learning_rate": 8.371077600430118e-05, "loss": 2.2913, "step": 47808 }, { "epoch": 0.6, "learning_rate": 8.3683518042862e-05, "loss": 2.3001, "step": 47816 }, { "epoch": 0.6, "learning_rate": 8.365626272081688e-05, "loss": 2.3142, "step": 47824 }, { "epoch": 0.6, "learning_rate": 8.362901004089927e-05, "loss": 2.282, "step": 47832 }, { "epoch": 0.6, "learning_rate": 8.360176000584256e-05, "loss": 2.2974, "step": 47840 }, { "epoch": 0.6, "learning_rate": 8.357451261837975e-05, "loss": 2.2852, "step": 47848 }, { "epoch": 0.6, "learning_rate": 8.354726788124359e-05, "loss": 2.2567, "step": 47856 }, { "epoch": 0.6, "learning_rate": 8.352002579716655e-05, "loss": 2.299, "step": 47864 }, { "epoch": 0.6, "learning_rate": 8.349278636888087e-05, "loss": 2.2992, "step": 47872 }, { "epoch": 0.6, "learning_rate": 8.346554959911856e-05, "loss": 2.2775, "step": 47880 }, { "epoch": 0.6, "learning_rate": 8.343831549061123e-05, "loss": 2.2681, "step": 47888 }, { "epoch": 0.6, "learning_rate": 8.341108404609039e-05, "loss": 2.282, "step": 47896 }, { "epoch": 0.6, "learning_rate": 8.338385526828714e-05, "loss": 2.29, "step": 47904 }, { "epoch": 0.6, "learning_rate": 8.335662915993237e-05, "loss": 2.2939, "step": 47912 }, { "epoch": 0.6, "learning_rate": 8.332940572375676e-05, "loss": 2.2872, "step": 47920 }, { "epoch": 0.6, "learning_rate": 8.33021849624906e-05, "loss": 2.2936, "step": 47928 }, { "epoch": 0.6, "learning_rate": 8.327496687886403e-05, "loss": 2.2779, "step": 47936 }, { "epoch": 0.6, "learning_rate": 8.324775147560686e-05, "loss": 2.2987, "step": 47944 }, { "epoch": 0.6, "learning_rate": 8.32205387554486e-05, "loss": 2.2954, "step": 47952 }, { "epoch": 0.6, "learning_rate": 8.31933287211186e-05, "loss": 2.2972, "step": 47960 }, { "epoch": 0.6, "learning_rate": 8.31661213753458e-05, "loss": 2.3026, "step": 47968 }, { "epoch": 0.6, "learning_rate": 8.313891672085899e-05, "loss": 2.2858, "step": 47976 }, { "epoch": 0.6, "learning_rate": 8.311171476038662e-05, "loss": 2.2796, "step": 47984 }, { "epoch": 0.6, "learning_rate": 8.308451549665692e-05, "loss": 2.2926, "step": 47992 }, { "epoch": 0.6, "learning_rate": 8.305731893239781e-05, "loss": 2.2662, "step": 48000 }, { "epoch": 0.6, "learning_rate": 8.303012507033692e-05, "loss": 2.306, "step": 48008 }, { "epoch": 0.6, "learning_rate": 8.300293391320169e-05, "loss": 2.3121, "step": 48016 }, { "epoch": 0.6, "learning_rate": 8.297574546371918e-05, "loss": 2.2752, "step": 48024 }, { "epoch": 0.6, "learning_rate": 8.29485597246163e-05, "loss": 2.2915, "step": 48032 }, { "epoch": 0.6, "learning_rate": 8.292137669861962e-05, "loss": 2.299, "step": 48040 }, { "epoch": 0.6, "learning_rate": 8.289419638845535e-05, "loss": 2.2983, "step": 48048 }, { "epoch": 0.6, "learning_rate": 8.286701879684966e-05, "loss": 2.2676, "step": 48056 }, { "epoch": 0.6, "learning_rate": 8.283984392652821e-05, "loss": 2.3034, "step": 48064 }, { "epoch": 0.6, "learning_rate": 8.281267178021652e-05, "loss": 2.3008, "step": 48072 }, { "epoch": 0.6, "learning_rate": 8.278550236063982e-05, "loss": 2.307, "step": 48080 }, { "epoch": 0.6, "learning_rate": 8.275833567052298e-05, "loss": 2.305, "step": 48088 }, { "epoch": 0.6, "learning_rate": 8.273117171259077e-05, "loss": 2.2898, "step": 48096 }, { "epoch": 0.6, "learning_rate": 8.270401048956748e-05, "loss": 2.2883, "step": 48104 }, { "epoch": 0.6, "learning_rate": 8.267685200417727e-05, "loss": 2.2793, "step": 48112 }, { "epoch": 0.6, "learning_rate": 8.264969625914402e-05, "loss": 2.2816, "step": 48120 }, { "epoch": 0.6, "learning_rate": 8.262254325719121e-05, "loss": 2.2954, "step": 48128 }, { "epoch": 0.6, "learning_rate": 8.259539300104222e-05, "loss": 2.2756, "step": 48136 }, { "epoch": 0.6, "learning_rate": 8.256824549342e-05, "loss": 2.276, "step": 48144 }, { "epoch": 0.6, "learning_rate": 8.254110073704735e-05, "loss": 2.28, "step": 48152 }, { "epoch": 0.6, "learning_rate": 8.251395873464669e-05, "loss": 2.3125, "step": 48160 }, { "epoch": 0.6, "learning_rate": 8.248681948894023e-05, "loss": 2.2883, "step": 48168 }, { "epoch": 0.6, "learning_rate": 8.24596830026499e-05, "loss": 2.2917, "step": 48176 }, { "epoch": 0.6, "learning_rate": 8.243254927849727e-05, "loss": 2.2725, "step": 48184 }, { "epoch": 0.6, "learning_rate": 8.240541831920376e-05, "loss": 2.3109, "step": 48192 }, { "epoch": 0.6, "learning_rate": 8.237829012749041e-05, "loss": 2.2707, "step": 48200 }, { "epoch": 0.6, "learning_rate": 8.235116470607809e-05, "loss": 2.2996, "step": 48208 }, { "epoch": 0.6, "learning_rate": 8.232404205768727e-05, "loss": 2.2963, "step": 48216 }, { "epoch": 0.6, "learning_rate": 8.22969221850382e-05, "loss": 2.2683, "step": 48224 }, { "epoch": 0.6, "learning_rate": 8.226980509085087e-05, "loss": 2.2854, "step": 48232 }, { "epoch": 0.6, "learning_rate": 8.224269077784492e-05, "loss": 2.2784, "step": 48240 }, { "epoch": 0.6, "learning_rate": 8.221557924873986e-05, "loss": 2.2799, "step": 48248 }, { "epoch": 0.6, "learning_rate": 8.218847050625476e-05, "loss": 2.2843, "step": 48256 }, { "epoch": 0.6, "learning_rate": 8.216136455310843e-05, "loss": 2.3051, "step": 48264 }, { "epoch": 0.6, "learning_rate": 8.213426139201956e-05, "loss": 2.2747, "step": 48272 }, { "epoch": 0.6, "learning_rate": 8.210716102570632e-05, "loss": 2.278, "step": 48280 }, { "epoch": 0.6, "learning_rate": 8.208006345688681e-05, "loss": 2.2908, "step": 48288 }, { "epoch": 0.6, "learning_rate": 8.205296868827877e-05, "loss": 2.3108, "step": 48296 }, { "epoch": 0.6, "learning_rate": 8.202587672259951e-05, "loss": 2.2913, "step": 48304 }, { "epoch": 0.6, "learning_rate": 8.199878756256639e-05, "loss": 2.2628, "step": 48312 }, { "epoch": 0.6, "learning_rate": 8.197170121089617e-05, "loss": 2.3054, "step": 48320 }, { "epoch": 0.6, "learning_rate": 8.194461767030554e-05, "loss": 2.2987, "step": 48328 }, { "epoch": 0.6, "learning_rate": 8.191753694351074e-05, "loss": 2.2575, "step": 48336 }, { "epoch": 0.6, "learning_rate": 8.18904590332279e-05, "loss": 2.2703, "step": 48344 }, { "epoch": 0.6, "learning_rate": 8.186338394217274e-05, "loss": 2.2846, "step": 48352 }, { "epoch": 0.6, "learning_rate": 8.183631167306071e-05, "loss": 2.28, "step": 48360 }, { "epoch": 0.6, "learning_rate": 8.180924222860706e-05, "loss": 2.2915, "step": 48368 }, { "epoch": 0.6, "learning_rate": 8.178217561152666e-05, "loss": 2.2846, "step": 48376 }, { "epoch": 0.6, "learning_rate": 8.175511182453418e-05, "loss": 2.2694, "step": 48384 }, { "epoch": 0.6, "learning_rate": 8.172805087034394e-05, "loss": 2.2944, "step": 48392 }, { "epoch": 0.6, "learning_rate": 8.170099275166995e-05, "loss": 2.2867, "step": 48400 }, { "epoch": 0.61, "learning_rate": 8.16739374712261e-05, "loss": 2.2867, "step": 48408 }, { "epoch": 0.61, "learning_rate": 8.164688503172575e-05, "loss": 2.2918, "step": 48416 }, { "epoch": 0.61, "learning_rate": 8.161983543588225e-05, "loss": 2.2513, "step": 48424 }, { "epoch": 0.61, "learning_rate": 8.159278868640838e-05, "loss": 2.2913, "step": 48432 }, { "epoch": 0.61, "learning_rate": 8.156574478601686e-05, "loss": 2.2958, "step": 48440 }, { "epoch": 0.61, "learning_rate": 8.153870373742005e-05, "loss": 2.287, "step": 48448 }, { "epoch": 0.61, "learning_rate": 8.151166554332995e-05, "loss": 2.2893, "step": 48456 }, { "epoch": 0.61, "learning_rate": 8.14846302064584e-05, "loss": 2.2622, "step": 48464 }, { "epoch": 0.61, "learning_rate": 8.145759772951685e-05, "loss": 2.3132, "step": 48472 }, { "epoch": 0.61, "learning_rate": 8.14305681152165e-05, "loss": 2.2758, "step": 48480 }, { "epoch": 0.61, "learning_rate": 8.140354136626831e-05, "loss": 2.3069, "step": 48488 }, { "epoch": 0.61, "learning_rate": 8.137651748538286e-05, "loss": 2.2954, "step": 48496 }, { "epoch": 0.61, "learning_rate": 8.134949647527053e-05, "loss": 2.2896, "step": 48504 }, { "epoch": 0.61, "learning_rate": 8.132247833864135e-05, "loss": 2.2764, "step": 48512 }, { "epoch": 0.61, "learning_rate": 8.129546307820512e-05, "loss": 2.3077, "step": 48520 }, { "epoch": 0.61, "learning_rate": 8.12684506966713e-05, "loss": 2.2945, "step": 48528 }, { "epoch": 0.61, "learning_rate": 8.124144119674903e-05, "loss": 2.2856, "step": 48536 }, { "epoch": 0.61, "learning_rate": 8.12144345811473e-05, "loss": 2.2969, "step": 48544 }, { "epoch": 0.61, "learning_rate": 8.118743085257463e-05, "loss": 2.2788, "step": 48552 }, { "epoch": 0.61, "learning_rate": 8.116043001373944e-05, "loss": 2.2875, "step": 48560 }, { "epoch": 0.61, "learning_rate": 8.113343206734967e-05, "loss": 2.2855, "step": 48568 }, { "epoch": 0.61, "learning_rate": 8.11064370161131e-05, "loss": 2.2914, "step": 48576 }, { "epoch": 0.61, "learning_rate": 8.107944486273717e-05, "loss": 2.2845, "step": 48584 }, { "epoch": 0.61, "learning_rate": 8.105245560992904e-05, "loss": 2.2944, "step": 48592 }, { "epoch": 0.61, "learning_rate": 8.102546926039563e-05, "loss": 2.2795, "step": 48600 }, { "epoch": 0.61, "learning_rate": 8.099848581684345e-05, "loss": 2.2873, "step": 48608 }, { "epoch": 0.61, "learning_rate": 8.097150528197878e-05, "loss": 2.2982, "step": 48616 }, { "epoch": 0.61, "learning_rate": 8.094452765850768e-05, "loss": 2.2899, "step": 48624 }, { "epoch": 0.61, "learning_rate": 8.09175529491358e-05, "loss": 2.2689, "step": 48632 }, { "epoch": 0.61, "learning_rate": 8.089058115656858e-05, "loss": 2.304, "step": 48640 }, { "epoch": 0.61, "learning_rate": 8.086361228351114e-05, "loss": 2.2851, "step": 48648 }, { "epoch": 0.61, "learning_rate": 8.083664633266825e-05, "loss": 2.2791, "step": 48656 }, { "epoch": 0.61, "learning_rate": 8.080968330674454e-05, "loss": 2.2945, "step": 48664 }, { "epoch": 0.61, "learning_rate": 8.078272320844415e-05, "loss": 2.2925, "step": 48672 }, { "epoch": 0.61, "learning_rate": 8.075576604047108e-05, "loss": 2.2793, "step": 48680 }, { "epoch": 0.61, "learning_rate": 8.072881180552896e-05, "loss": 2.2949, "step": 48688 }, { "epoch": 0.61, "learning_rate": 8.070186050632119e-05, "loss": 2.2985, "step": 48696 }, { "epoch": 0.61, "learning_rate": 8.067491214555079e-05, "loss": 2.3011, "step": 48704 }, { "epoch": 0.61, "learning_rate": 8.06479667259205e-05, "loss": 2.2753, "step": 48712 }, { "epoch": 0.61, "learning_rate": 8.062102425013287e-05, "loss": 2.3052, "step": 48720 }, { "epoch": 0.61, "learning_rate": 8.059408472089e-05, "loss": 2.2969, "step": 48728 }, { "epoch": 0.61, "learning_rate": 8.056714814089386e-05, "loss": 2.2744, "step": 48736 }, { "epoch": 0.61, "learning_rate": 8.054021451284595e-05, "loss": 2.2753, "step": 48744 }, { "epoch": 0.61, "learning_rate": 8.051328383944758e-05, "loss": 2.2866, "step": 48752 }, { "epoch": 0.61, "learning_rate": 8.048635612339981e-05, "loss": 2.287, "step": 48760 }, { "epoch": 0.61, "learning_rate": 8.045943136740323e-05, "loss": 2.2632, "step": 48768 }, { "epoch": 0.61, "learning_rate": 8.043250957415833e-05, "loss": 2.2922, "step": 48776 }, { "epoch": 0.61, "learning_rate": 8.040559074636522e-05, "loss": 2.3004, "step": 48784 }, { "epoch": 0.61, "learning_rate": 8.03786748867236e-05, "loss": 2.2882, "step": 48792 }, { "epoch": 0.61, "learning_rate": 8.035176199793309e-05, "loss": 2.2954, "step": 48800 }, { "epoch": 0.61, "learning_rate": 8.03248520826928e-05, "loss": 2.2685, "step": 48808 }, { "epoch": 0.61, "learning_rate": 8.029794514370174e-05, "loss": 2.2691, "step": 48816 }, { "epoch": 0.61, "learning_rate": 8.027104118365851e-05, "loss": 2.2626, "step": 48824 }, { "epoch": 0.61, "learning_rate": 8.024414020526134e-05, "loss": 2.3043, "step": 48832 }, { "epoch": 0.61, "learning_rate": 8.021724221120832e-05, "loss": 2.2813, "step": 48840 }, { "epoch": 0.61, "learning_rate": 8.019034720419713e-05, "loss": 2.2723, "step": 48848 }, { "epoch": 0.61, "learning_rate": 8.016345518692525e-05, "loss": 2.3087, "step": 48856 }, { "epoch": 0.61, "learning_rate": 8.013656616208968e-05, "loss": 2.2964, "step": 48864 }, { "epoch": 0.61, "learning_rate": 8.01096801323874e-05, "loss": 2.2818, "step": 48872 }, { "epoch": 0.61, "learning_rate": 8.008279710051478e-05, "loss": 2.2719, "step": 48880 }, { "epoch": 0.61, "learning_rate": 8.005591706916809e-05, "loss": 2.2977, "step": 48888 }, { "epoch": 0.61, "learning_rate": 8.002904004104325e-05, "loss": 2.3191, "step": 48896 }, { "epoch": 0.61, "learning_rate": 8.000216601883588e-05, "loss": 2.2987, "step": 48904 }, { "epoch": 0.61, "learning_rate": 7.997529500524126e-05, "loss": 2.292, "step": 48912 }, { "epoch": 0.61, "learning_rate": 7.994842700295447e-05, "loss": 2.2781, "step": 48920 }, { "epoch": 0.61, "learning_rate": 7.992156201467011e-05, "loss": 2.2619, "step": 48928 }, { "epoch": 0.61, "learning_rate": 7.989470004308271e-05, "loss": 2.2873, "step": 48936 }, { "epoch": 0.61, "learning_rate": 7.986784109088623e-05, "loss": 2.2732, "step": 48944 }, { "epoch": 0.61, "learning_rate": 7.984098516077461e-05, "loss": 2.2924, "step": 48952 }, { "epoch": 0.61, "learning_rate": 7.98141322554413e-05, "loss": 2.2995, "step": 48960 }, { "epoch": 0.61, "learning_rate": 7.978728237757942e-05, "loss": 2.2665, "step": 48968 }, { "epoch": 0.61, "learning_rate": 7.976043552988194e-05, "loss": 2.2926, "step": 48976 }, { "epoch": 0.61, "learning_rate": 7.973359171504144e-05, "loss": 2.311, "step": 48984 }, { "epoch": 0.61, "learning_rate": 7.970675093575021e-05, "loss": 2.2715, "step": 48992 }, { "epoch": 0.61, "learning_rate": 7.967991319470023e-05, "loss": 2.2823, "step": 49000 }, { "epoch": 0.61, "learning_rate": 7.965307849458313e-05, "loss": 2.2758, "step": 49008 }, { "epoch": 0.61, "learning_rate": 7.962624683809028e-05, "loss": 2.2909, "step": 49016 }, { "epoch": 0.61, "learning_rate": 7.959941822791275e-05, "loss": 2.278, "step": 49024 }, { "epoch": 0.61, "learning_rate": 7.957259266674136e-05, "loss": 2.2647, "step": 49032 }, { "epoch": 0.61, "learning_rate": 7.954577015726648e-05, "loss": 2.2941, "step": 49040 }, { "epoch": 0.61, "learning_rate": 7.95189507021783e-05, "loss": 2.2716, "step": 49048 }, { "epoch": 0.61, "learning_rate": 7.949213430416667e-05, "loss": 2.2819, "step": 49056 }, { "epoch": 0.61, "learning_rate": 7.946532096592108e-05, "loss": 2.2656, "step": 49064 }, { "epoch": 0.61, "learning_rate": 7.94385106901308e-05, "loss": 2.3214, "step": 49072 }, { "epoch": 0.61, "learning_rate": 7.941170347948468e-05, "loss": 2.2943, "step": 49080 }, { "epoch": 0.61, "learning_rate": 7.938489933667144e-05, "loss": 2.2697, "step": 49088 }, { "epoch": 0.61, "learning_rate": 7.93580982643793e-05, "loss": 2.2941, "step": 49096 }, { "epoch": 0.61, "learning_rate": 7.933130026529625e-05, "loss": 2.29, "step": 49104 }, { "epoch": 0.61, "learning_rate": 7.930450534211002e-05, "loss": 2.3026, "step": 49112 }, { "epoch": 0.61, "learning_rate": 7.927771349750796e-05, "loss": 2.2832, "step": 49120 }, { "epoch": 0.61, "learning_rate": 7.925092473417719e-05, "loss": 2.3065, "step": 49128 }, { "epoch": 0.61, "learning_rate": 7.922413905480444e-05, "loss": 2.285, "step": 49136 }, { "epoch": 0.61, "learning_rate": 7.919735646207609e-05, "loss": 2.285, "step": 49144 }, { "epoch": 0.61, "learning_rate": 7.917057695867843e-05, "loss": 2.2637, "step": 49152 }, { "epoch": 0.61, "learning_rate": 7.914380054729715e-05, "loss": 2.2922, "step": 49160 }, { "epoch": 0.61, "learning_rate": 7.911702723061787e-05, "loss": 2.299, "step": 49168 }, { "epoch": 0.61, "learning_rate": 7.909025701132577e-05, "loss": 2.2707, "step": 49176 }, { "epoch": 0.61, "learning_rate": 7.906348989210571e-05, "loss": 2.3058, "step": 49184 }, { "epoch": 0.61, "learning_rate": 7.903672587564237e-05, "loss": 2.2814, "step": 49192 }, { "epoch": 0.61, "learning_rate": 7.900996496461992e-05, "loss": 2.2585, "step": 49200 }, { "epoch": 0.62, "learning_rate": 7.898320716172243e-05, "loss": 2.2833, "step": 49208 }, { "epoch": 0.62, "learning_rate": 7.895645246963348e-05, "loss": 2.2823, "step": 49216 }, { "epoch": 0.62, "learning_rate": 7.892970089103646e-05, "loss": 2.3014, "step": 49224 }, { "epoch": 0.62, "learning_rate": 7.890295242861441e-05, "loss": 2.2855, "step": 49232 }, { "epoch": 0.62, "learning_rate": 7.887620708504999e-05, "loss": 2.2654, "step": 49240 }, { "epoch": 0.62, "learning_rate": 7.884946486302564e-05, "loss": 2.2692, "step": 49248 }, { "epoch": 0.62, "learning_rate": 7.882272576522344e-05, "loss": 2.2812, "step": 49256 }, { "epoch": 0.62, "learning_rate": 7.879598979432526e-05, "loss": 2.2812, "step": 49264 }, { "epoch": 0.62, "learning_rate": 7.876925695301245e-05, "loss": 2.2949, "step": 49272 }, { "epoch": 0.62, "learning_rate": 7.874252724396618e-05, "loss": 2.2824, "step": 49280 }, { "epoch": 0.62, "learning_rate": 7.871580066986734e-05, "loss": 2.2542, "step": 49288 }, { "epoch": 0.62, "learning_rate": 7.868907723339643e-05, "loss": 2.2893, "step": 49296 }, { "epoch": 0.62, "learning_rate": 7.866235693723365e-05, "loss": 2.2784, "step": 49304 }, { "epoch": 0.62, "learning_rate": 7.86356397840589e-05, "loss": 2.2868, "step": 49312 }, { "epoch": 0.62, "learning_rate": 7.860892577655175e-05, "loss": 2.2769, "step": 49320 }, { "epoch": 0.62, "learning_rate": 7.858221491739149e-05, "loss": 2.2822, "step": 49328 }, { "epoch": 0.62, "learning_rate": 7.855550720925701e-05, "loss": 2.2797, "step": 49336 }, { "epoch": 0.62, "learning_rate": 7.852880265482702e-05, "loss": 2.2764, "step": 49344 }, { "epoch": 0.62, "learning_rate": 7.850210125677982e-05, "loss": 2.2706, "step": 49352 }, { "epoch": 0.62, "learning_rate": 7.847540301779333e-05, "loss": 2.2817, "step": 49360 }, { "epoch": 0.62, "learning_rate": 7.844870794054536e-05, "loss": 2.2736, "step": 49368 }, { "epoch": 0.62, "learning_rate": 7.842201602771314e-05, "loss": 2.2831, "step": 49376 }, { "epoch": 0.62, "learning_rate": 7.839532728197379e-05, "loss": 2.2632, "step": 49384 }, { "epoch": 0.62, "learning_rate": 7.836864170600401e-05, "loss": 2.313, "step": 49392 }, { "epoch": 0.62, "learning_rate": 7.83419593024803e-05, "loss": 2.2779, "step": 49400 }, { "epoch": 0.62, "learning_rate": 7.831528007407865e-05, "loss": 2.2927, "step": 49408 }, { "epoch": 0.62, "learning_rate": 7.828860402347487e-05, "loss": 2.2876, "step": 49416 }, { "epoch": 0.62, "learning_rate": 7.826193115334444e-05, "loss": 2.2898, "step": 49424 }, { "epoch": 0.62, "learning_rate": 7.823526146636246e-05, "loss": 2.2773, "step": 49432 }, { "epoch": 0.62, "learning_rate": 7.820859496520378e-05, "loss": 2.2946, "step": 49440 }, { "epoch": 0.62, "learning_rate": 7.818193165254289e-05, "loss": 2.2693, "step": 49448 }, { "epoch": 0.62, "learning_rate": 7.815527153105393e-05, "loss": 2.3034, "step": 49456 }, { "epoch": 0.62, "learning_rate": 7.812861460341083e-05, "loss": 2.2945, "step": 49464 }, { "epoch": 0.62, "learning_rate": 7.810196087228705e-05, "loss": 2.2733, "step": 49472 }, { "epoch": 0.62, "learning_rate": 7.807531034035589e-05, "loss": 2.2989, "step": 49480 }, { "epoch": 0.62, "learning_rate": 7.804866301029022e-05, "loss": 2.2804, "step": 49488 }, { "epoch": 0.62, "learning_rate": 7.802201888476255e-05, "loss": 2.2679, "step": 49496 }, { "epoch": 0.62, "learning_rate": 7.799537796644525e-05, "loss": 2.2695, "step": 49504 }, { "epoch": 0.62, "learning_rate": 7.796874025801013e-05, "loss": 2.3016, "step": 49512 }, { "epoch": 0.62, "learning_rate": 7.79421057621289e-05, "loss": 2.2896, "step": 49520 }, { "epoch": 0.62, "learning_rate": 7.79154744814728e-05, "loss": 2.2851, "step": 49528 }, { "epoch": 0.62, "learning_rate": 7.788884641871281e-05, "loss": 2.2932, "step": 49536 }, { "epoch": 0.62, "learning_rate": 7.786222157651959e-05, "loss": 2.2895, "step": 49544 }, { "epoch": 0.62, "learning_rate": 7.78355999575634e-05, "loss": 2.2882, "step": 49552 }, { "epoch": 0.62, "learning_rate": 7.780898156451433e-05, "loss": 2.2759, "step": 49560 }, { "epoch": 0.62, "learning_rate": 7.778236640004197e-05, "loss": 2.2738, "step": 49568 }, { "epoch": 0.62, "learning_rate": 7.775575446681574e-05, "loss": 2.3054, "step": 49576 }, { "epoch": 0.62, "learning_rate": 7.772914576750461e-05, "loss": 2.2918, "step": 49584 }, { "epoch": 0.62, "learning_rate": 7.770254030477729e-05, "loss": 2.2742, "step": 49592 }, { "epoch": 0.62, "learning_rate": 7.767593808130218e-05, "loss": 2.2668, "step": 49600 }, { "epoch": 0.62, "learning_rate": 7.764933909974732e-05, "loss": 2.304, "step": 49608 }, { "epoch": 0.62, "learning_rate": 7.762274336278044e-05, "loss": 2.2829, "step": 49616 }, { "epoch": 0.62, "learning_rate": 7.759615087306897e-05, "loss": 2.3082, "step": 49624 }, { "epoch": 0.62, "learning_rate": 7.756956163327991e-05, "loss": 2.283, "step": 49632 }, { "epoch": 0.62, "learning_rate": 7.75429756460801e-05, "loss": 2.2905, "step": 49640 }, { "epoch": 0.62, "learning_rate": 7.751639291413589e-05, "loss": 2.2738, "step": 49648 }, { "epoch": 0.62, "learning_rate": 7.748981344011341e-05, "loss": 2.2819, "step": 49656 }, { "epoch": 0.62, "learning_rate": 7.746323722667846e-05, "loss": 2.2842, "step": 49664 }, { "epoch": 0.62, "learning_rate": 7.743666427649641e-05, "loss": 2.2713, "step": 49672 }, { "epoch": 0.62, "learning_rate": 7.741009459223244e-05, "loss": 2.2873, "step": 49680 }, { "epoch": 0.62, "learning_rate": 7.73835281765513e-05, "loss": 2.2688, "step": 49688 }, { "epoch": 0.62, "learning_rate": 7.735696503211751e-05, "loss": 2.2603, "step": 49696 }, { "epoch": 0.62, "learning_rate": 7.733040516159516e-05, "loss": 2.2864, "step": 49704 }, { "epoch": 0.62, "learning_rate": 7.730384856764801e-05, "loss": 2.2808, "step": 49712 }, { "epoch": 0.62, "learning_rate": 7.727729525293961e-05, "loss": 2.2821, "step": 49720 }, { "epoch": 0.62, "learning_rate": 7.725074522013305e-05, "loss": 2.2922, "step": 49728 }, { "epoch": 0.62, "learning_rate": 7.722419847189122e-05, "loss": 2.2855, "step": 49736 }, { "epoch": 0.62, "learning_rate": 7.719765501087652e-05, "loss": 2.2881, "step": 49744 }, { "epoch": 0.62, "learning_rate": 7.717111483975119e-05, "loss": 2.2889, "step": 49752 }, { "epoch": 0.62, "learning_rate": 7.714457796117705e-05, "loss": 2.26, "step": 49760 }, { "epoch": 0.62, "learning_rate": 7.711804437781551e-05, "loss": 2.2757, "step": 49768 }, { "epoch": 0.62, "learning_rate": 7.709151409232784e-05, "loss": 2.2863, "step": 49776 }, { "epoch": 0.62, "learning_rate": 7.70649871073748e-05, "loss": 2.3026, "step": 49784 }, { "epoch": 0.62, "learning_rate": 7.703846342561696e-05, "loss": 2.2784, "step": 49792 }, { "epoch": 0.62, "learning_rate": 7.701194304971449e-05, "loss": 2.2677, "step": 49800 }, { "epoch": 0.62, "learning_rate": 7.698542598232717e-05, "loss": 2.2586, "step": 49808 }, { "epoch": 0.62, "learning_rate": 7.695891222611456e-05, "loss": 2.2885, "step": 49816 }, { "epoch": 0.62, "learning_rate": 7.693240178373581e-05, "loss": 2.2854, "step": 49824 }, { "epoch": 0.62, "learning_rate": 7.690589465784985e-05, "loss": 2.2772, "step": 49832 }, { "epoch": 0.62, "learning_rate": 7.687939085111512e-05, "loss": 2.2681, "step": 49840 }, { "epoch": 0.62, "learning_rate": 7.68528903661898e-05, "loss": 2.291, "step": 49848 }, { "epoch": 0.62, "learning_rate": 7.682639320573173e-05, "loss": 2.2708, "step": 49856 }, { "epoch": 0.62, "learning_rate": 7.679989937239846e-05, "loss": 2.2966, "step": 49864 }, { "epoch": 0.62, "learning_rate": 7.67734088688472e-05, "loss": 2.305, "step": 49872 }, { "epoch": 0.62, "learning_rate": 7.674692169773472e-05, "loss": 2.2856, "step": 49880 }, { "epoch": 0.62, "learning_rate": 7.672043786171758e-05, "loss": 2.2915, "step": 49888 }, { "epoch": 0.62, "learning_rate": 7.669395736345198e-05, "loss": 2.2819, "step": 49896 }, { "epoch": 0.62, "learning_rate": 7.666748020559369e-05, "loss": 2.2512, "step": 49904 }, { "epoch": 0.62, "learning_rate": 7.664100639079829e-05, "loss": 2.2822, "step": 49912 }, { "epoch": 0.62, "learning_rate": 7.661453592172092e-05, "loss": 2.2865, "step": 49920 }, { "epoch": 0.62, "learning_rate": 7.65880688010164e-05, "loss": 2.2882, "step": 49928 }, { "epoch": 0.62, "learning_rate": 7.656160503133931e-05, "loss": 2.2555, "step": 49936 }, { "epoch": 0.62, "learning_rate": 7.653514461534372e-05, "loss": 2.2797, "step": 49944 }, { "epoch": 0.62, "learning_rate": 7.65086875556835e-05, "loss": 2.2911, "step": 49952 }, { "epoch": 0.62, "learning_rate": 7.648223385501214e-05, "loss": 2.2704, "step": 49960 }, { "epoch": 0.62, "learning_rate": 7.645578351598286e-05, "loss": 2.2787, "step": 49968 }, { "epoch": 0.62, "learning_rate": 7.64293365412484e-05, "loss": 2.2889, "step": 49976 }, { "epoch": 0.62, "learning_rate": 7.640289293346124e-05, "loss": 2.2693, "step": 49984 }, { "epoch": 0.62, "learning_rate": 7.637645269527354e-05, "loss": 2.2801, "step": 49992 }, { "epoch": 0.62, "learning_rate": 7.635001582933712e-05, "loss": 2.2737, "step": 50000 }, { "epoch": 0.63, "learning_rate": 7.632358233830345e-05, "loss": 2.2853, "step": 50008 }, { "epoch": 0.63, "learning_rate": 7.629715222482365e-05, "loss": 2.2999, "step": 50016 }, { "epoch": 0.63, "learning_rate": 7.62707254915485e-05, "loss": 2.2692, "step": 50024 }, { "epoch": 0.63, "learning_rate": 7.624430214112849e-05, "loss": 2.2808, "step": 50032 }, { "epoch": 0.63, "learning_rate": 7.621788217621366e-05, "loss": 2.2785, "step": 50040 }, { "epoch": 0.63, "learning_rate": 7.619146559945389e-05, "loss": 2.3031, "step": 50048 }, { "epoch": 0.63, "learning_rate": 7.616505241349847e-05, "loss": 2.2807, "step": 50056 }, { "epoch": 0.63, "learning_rate": 7.613864262099665e-05, "loss": 2.2801, "step": 50064 }, { "epoch": 0.63, "learning_rate": 7.611223622459709e-05, "loss": 2.263, "step": 50072 }, { "epoch": 0.63, "learning_rate": 7.60858332269482e-05, "loss": 2.2784, "step": 50080 }, { "epoch": 0.63, "learning_rate": 7.605943363069808e-05, "loss": 2.2842, "step": 50088 }, { "epoch": 0.63, "learning_rate": 7.603303743849441e-05, "loss": 2.282, "step": 50096 }, { "epoch": 0.63, "learning_rate": 7.600664465298466e-05, "loss": 2.2884, "step": 50104 }, { "epoch": 0.63, "learning_rate": 7.598025527681585e-05, "loss": 2.2678, "step": 50112 }, { "epoch": 0.63, "learning_rate": 7.59538693126346e-05, "loss": 2.2912, "step": 50120 }, { "epoch": 0.63, "learning_rate": 7.59274867630874e-05, "loss": 2.2705, "step": 50128 }, { "epoch": 0.63, "learning_rate": 7.59011076308202e-05, "loss": 2.2812, "step": 50136 }, { "epoch": 0.63, "learning_rate": 7.587473191847869e-05, "loss": 2.2687, "step": 50144 }, { "epoch": 0.63, "learning_rate": 7.58483596287082e-05, "loss": 2.2838, "step": 50152 }, { "epoch": 0.63, "learning_rate": 7.582199076415371e-05, "loss": 2.291, "step": 50160 }, { "epoch": 0.63, "learning_rate": 7.579562532745991e-05, "loss": 2.2623, "step": 50168 }, { "epoch": 0.63, "learning_rate": 7.576926332127105e-05, "loss": 2.2933, "step": 50176 }, { "epoch": 0.63, "learning_rate": 7.574290474823116e-05, "loss": 2.2897, "step": 50184 }, { "epoch": 0.63, "learning_rate": 7.57165496109838e-05, "loss": 2.2824, "step": 50192 }, { "epoch": 0.63, "learning_rate": 7.56901979121722e-05, "loss": 2.2773, "step": 50200 }, { "epoch": 0.63, "learning_rate": 7.56638496544394e-05, "loss": 2.2895, "step": 50208 }, { "epoch": 0.63, "learning_rate": 7.563750484042789e-05, "loss": 2.2807, "step": 50216 }, { "epoch": 0.63, "learning_rate": 7.561116347277994e-05, "loss": 2.2932, "step": 50224 }, { "epoch": 0.63, "learning_rate": 7.558482555413743e-05, "loss": 2.2614, "step": 50232 }, { "epoch": 0.63, "learning_rate": 7.555849108714192e-05, "loss": 2.2808, "step": 50240 }, { "epoch": 0.63, "learning_rate": 7.55321600744346e-05, "loss": 2.2882, "step": 50248 }, { "epoch": 0.63, "learning_rate": 7.550583251865631e-05, "loss": 2.2964, "step": 50256 }, { "epoch": 0.63, "learning_rate": 7.54795084224476e-05, "loss": 2.2811, "step": 50264 }, { "epoch": 0.63, "learning_rate": 7.545318778844854e-05, "loss": 2.2666, "step": 50272 }, { "epoch": 0.63, "learning_rate": 7.542687061929903e-05, "loss": 2.2777, "step": 50280 }, { "epoch": 0.63, "learning_rate": 7.540055691763847e-05, "loss": 2.2693, "step": 50288 }, { "epoch": 0.63, "learning_rate": 7.5374246686106e-05, "loss": 2.3016, "step": 50296 }, { "epoch": 0.63, "learning_rate": 7.534793992734042e-05, "loss": 2.3021, "step": 50304 }, { "epoch": 0.63, "learning_rate": 7.532163664398007e-05, "loss": 2.2787, "step": 50312 }, { "epoch": 0.63, "learning_rate": 7.529533683866307e-05, "loss": 2.2508, "step": 50320 }, { "epoch": 0.63, "learning_rate": 7.526904051402719e-05, "loss": 2.2961, "step": 50328 }, { "epoch": 0.63, "learning_rate": 7.52427476727097e-05, "loss": 2.2905, "step": 50336 }, { "epoch": 0.63, "learning_rate": 7.521645831734769e-05, "loss": 2.2832, "step": 50344 }, { "epoch": 0.63, "learning_rate": 7.51901724505778e-05, "loss": 2.2688, "step": 50352 }, { "epoch": 0.63, "learning_rate": 7.516389007503639e-05, "loss": 2.2739, "step": 50360 }, { "epoch": 0.63, "learning_rate": 7.513761119335943e-05, "loss": 2.2749, "step": 50368 }, { "epoch": 0.63, "learning_rate": 7.511133580818248e-05, "loss": 2.284, "step": 50376 }, { "epoch": 0.63, "learning_rate": 7.508506392214087e-05, "loss": 2.2799, "step": 50384 }, { "epoch": 0.63, "learning_rate": 7.505879553786952e-05, "loss": 2.2635, "step": 50392 }, { "epoch": 0.63, "learning_rate": 7.5032530658003e-05, "loss": 2.2772, "step": 50400 }, { "epoch": 0.63, "learning_rate": 7.500626928517549e-05, "loss": 2.2578, "step": 50408 }, { "epoch": 0.63, "learning_rate": 7.498001142202094e-05, "loss": 2.2858, "step": 50416 }, { "epoch": 0.63, "learning_rate": 7.495375707117276e-05, "loss": 2.2848, "step": 50424 }, { "epoch": 0.63, "learning_rate": 7.492750623526417e-05, "loss": 2.2847, "step": 50432 }, { "epoch": 0.63, "learning_rate": 7.490125891692798e-05, "loss": 2.3052, "step": 50440 }, { "epoch": 0.63, "learning_rate": 7.487501511879664e-05, "loss": 2.2923, "step": 50448 }, { "epoch": 0.63, "learning_rate": 7.484877484350225e-05, "loss": 2.2606, "step": 50456 }, { "epoch": 0.63, "learning_rate": 7.482253809367659e-05, "loss": 2.2817, "step": 50464 }, { "epoch": 0.63, "learning_rate": 7.4796304871951e-05, "loss": 2.2803, "step": 50472 }, { "epoch": 0.63, "learning_rate": 7.477007518095658e-05, "loss": 2.2906, "step": 50480 }, { "epoch": 0.63, "learning_rate": 7.474384902332396e-05, "loss": 2.2884, "step": 50488 }, { "epoch": 0.63, "learning_rate": 7.471762640168354e-05, "loss": 2.2819, "step": 50496 }, { "epoch": 0.63, "learning_rate": 7.469140731866528e-05, "loss": 2.2925, "step": 50504 }, { "epoch": 0.63, "learning_rate": 7.466519177689877e-05, "loss": 2.2674, "step": 50512 }, { "epoch": 0.63, "learning_rate": 7.463897977901333e-05, "loss": 2.2873, "step": 50520 }, { "epoch": 0.63, "learning_rate": 7.461277132763782e-05, "loss": 2.2626, "step": 50528 }, { "epoch": 0.63, "learning_rate": 7.458656642540087e-05, "loss": 2.2828, "step": 50536 }, { "epoch": 0.63, "learning_rate": 7.456036507493064e-05, "loss": 2.2733, "step": 50544 }, { "epoch": 0.63, "learning_rate": 7.453416727885495e-05, "loss": 2.3076, "step": 50552 }, { "epoch": 0.63, "learning_rate": 7.450797303980134e-05, "loss": 2.3074, "step": 50560 }, { "epoch": 0.63, "learning_rate": 7.44817823603969e-05, "loss": 2.2839, "step": 50568 }, { "epoch": 0.63, "learning_rate": 7.445559524326848e-05, "loss": 2.261, "step": 50576 }, { "epoch": 0.63, "learning_rate": 7.442941169104241e-05, "loss": 2.2978, "step": 50584 }, { "epoch": 0.63, "learning_rate": 7.440323170634482e-05, "loss": 2.2911, "step": 50592 }, { "epoch": 0.63, "learning_rate": 7.43770552918014e-05, "loss": 2.2726, "step": 50600 }, { "epoch": 0.63, "learning_rate": 7.435088245003743e-05, "loss": 2.2753, "step": 50608 }, { "epoch": 0.63, "learning_rate": 7.432471318367802e-05, "loss": 2.2742, "step": 50616 }, { "epoch": 0.63, "learning_rate": 7.429854749534765e-05, "loss": 2.2814, "step": 50624 }, { "epoch": 0.63, "learning_rate": 7.427238538767072e-05, "loss": 2.2731, "step": 50632 }, { "epoch": 0.63, "learning_rate": 7.424622686327112e-05, "loss": 2.2716, "step": 50640 }, { "epoch": 0.63, "learning_rate": 7.422007192477232e-05, "loss": 2.2924, "step": 50648 }, { "epoch": 0.63, "learning_rate": 7.419392057479757e-05, "loss": 2.2891, "step": 50656 }, { "epoch": 0.63, "learning_rate": 7.416777281596972e-05, "loss": 2.2673, "step": 50664 }, { "epoch": 0.63, "learning_rate": 7.414162865091121e-05, "loss": 2.274, "step": 50672 }, { "epoch": 0.63, "learning_rate": 7.41154880822442e-05, "loss": 2.2897, "step": 50680 }, { "epoch": 0.63, "learning_rate": 7.408935111259034e-05, "loss": 2.2947, "step": 50688 }, { "epoch": 0.63, "learning_rate": 7.40632177445711e-05, "loss": 2.2702, "step": 50696 }, { "epoch": 0.63, "learning_rate": 7.403708798080749e-05, "loss": 2.2882, "step": 50704 }, { "epoch": 0.63, "learning_rate": 7.40109618239202e-05, "loss": 2.2869, "step": 50712 }, { "epoch": 0.63, "learning_rate": 7.39848392765295e-05, "loss": 2.2868, "step": 50720 }, { "epoch": 0.63, "learning_rate": 7.395872034125535e-05, "loss": 2.2703, "step": 50728 }, { "epoch": 0.63, "learning_rate": 7.393260502071733e-05, "loss": 2.2806, "step": 50736 }, { "epoch": 0.63, "learning_rate": 7.390649331753463e-05, "loss": 2.2814, "step": 50744 }, { "epoch": 0.63, "learning_rate": 7.388038523432619e-05, "loss": 2.2717, "step": 50752 }, { "epoch": 0.63, "learning_rate": 7.38542807737104e-05, "loss": 2.2858, "step": 50760 }, { "epoch": 0.63, "learning_rate": 7.382817993830544e-05, "loss": 2.2936, "step": 50768 }, { "epoch": 0.63, "learning_rate": 7.380208273072911e-05, "loss": 2.2609, "step": 50776 }, { "epoch": 0.63, "learning_rate": 7.377598915359873e-05, "loss": 2.2859, "step": 50784 }, { "epoch": 0.63, "learning_rate": 7.37498992095314e-05, "loss": 2.2694, "step": 50792 }, { "epoch": 0.64, "learning_rate": 7.372381290114374e-05, "loss": 2.2618, "step": 50800 }, { "epoch": 0.64, "learning_rate": 7.369773023105215e-05, "loss": 2.2814, "step": 50808 }, { "epoch": 0.64, "learning_rate": 7.367165120187252e-05, "loss": 2.2567, "step": 50816 }, { "epoch": 0.64, "learning_rate": 7.364557581622038e-05, "loss": 2.2814, "step": 50824 }, { "epoch": 0.64, "learning_rate": 7.361950407671101e-05, "loss": 2.2868, "step": 50832 }, { "epoch": 0.64, "learning_rate": 7.359343598595922e-05, "loss": 2.2778, "step": 50840 }, { "epoch": 0.64, "learning_rate": 7.356737154657954e-05, "loss": 2.286, "step": 50848 }, { "epoch": 0.64, "learning_rate": 7.354131076118605e-05, "loss": 2.2811, "step": 50856 }, { "epoch": 0.64, "learning_rate": 7.351525363239246e-05, "loss": 2.2797, "step": 50864 }, { "epoch": 0.64, "learning_rate": 7.348920016281227e-05, "loss": 2.2872, "step": 50872 }, { "epoch": 0.64, "learning_rate": 7.346315035505837e-05, "loss": 2.2826, "step": 50880 }, { "epoch": 0.64, "learning_rate": 7.343710421174348e-05, "loss": 2.2785, "step": 50888 }, { "epoch": 0.64, "learning_rate": 7.341106173547987e-05, "loss": 2.2672, "step": 50896 }, { "epoch": 0.64, "learning_rate": 7.33850229288794e-05, "loss": 2.2885, "step": 50904 }, { "epoch": 0.64, "learning_rate": 7.335898779455372e-05, "loss": 2.281, "step": 50912 }, { "epoch": 0.64, "learning_rate": 7.33329563351139e-05, "loss": 2.297, "step": 50920 }, { "epoch": 0.64, "learning_rate": 7.33069285531708e-05, "loss": 2.2994, "step": 50928 }, { "epoch": 0.64, "learning_rate": 7.328090445133485e-05, "loss": 2.2789, "step": 50936 }, { "epoch": 0.64, "learning_rate": 7.325488403221614e-05, "loss": 2.2551, "step": 50944 }, { "epoch": 0.64, "learning_rate": 7.322886729842435e-05, "loss": 2.2858, "step": 50952 }, { "epoch": 0.64, "learning_rate": 7.320285425256877e-05, "loss": 2.2884, "step": 50960 }, { "epoch": 0.64, "learning_rate": 7.317684489725847e-05, "loss": 2.2933, "step": 50968 }, { "epoch": 0.64, "learning_rate": 7.315083923510191e-05, "loss": 2.2718, "step": 50976 }, { "epoch": 0.64, "learning_rate": 7.312483726870745e-05, "loss": 2.2781, "step": 50984 }, { "epoch": 0.64, "learning_rate": 7.309883900068282e-05, "loss": 2.2918, "step": 50992 }, { "epoch": 0.64, "learning_rate": 7.307284443363553e-05, "loss": 2.2843, "step": 51000 }, { "epoch": 0.64, "learning_rate": 7.304685357017273e-05, "loss": 2.2558, "step": 51008 }, { "epoch": 0.64, "learning_rate": 7.302086641290112e-05, "loss": 2.3004, "step": 51016 }, { "epoch": 0.64, "learning_rate": 7.299488296442706e-05, "loss": 2.2812, "step": 51024 }, { "epoch": 0.64, "learning_rate": 7.29689032273566e-05, "loss": 2.305, "step": 51032 }, { "epoch": 0.64, "learning_rate": 7.294292720429527e-05, "loss": 2.2794, "step": 51040 }, { "epoch": 0.64, "learning_rate": 7.29169548978484e-05, "loss": 2.2841, "step": 51048 }, { "epoch": 0.64, "learning_rate": 7.289098631062081e-05, "loss": 2.281, "step": 51056 }, { "epoch": 0.64, "learning_rate": 7.286502144521701e-05, "loss": 2.2823, "step": 51064 }, { "epoch": 0.64, "learning_rate": 7.283906030424119e-05, "loss": 2.2798, "step": 51072 }, { "epoch": 0.64, "learning_rate": 7.281310289029699e-05, "loss": 2.2783, "step": 51080 }, { "epoch": 0.64, "learning_rate": 7.278714920598788e-05, "loss": 2.2764, "step": 51088 }, { "epoch": 0.64, "learning_rate": 7.276119925391685e-05, "loss": 2.287, "step": 51096 }, { "epoch": 0.64, "learning_rate": 7.273525303668653e-05, "loss": 2.287, "step": 51104 }, { "epoch": 0.64, "learning_rate": 7.270931055689918e-05, "loss": 2.2818, "step": 51112 }, { "epoch": 0.64, "learning_rate": 7.26833718171567e-05, "loss": 2.2844, "step": 51120 }, { "epoch": 0.64, "learning_rate": 7.265743682006054e-05, "loss": 2.2911, "step": 51128 }, { "epoch": 0.64, "learning_rate": 7.26315055682119e-05, "loss": 2.2866, "step": 51136 }, { "epoch": 0.64, "learning_rate": 7.260557806421152e-05, "loss": 2.3046, "step": 51144 }, { "epoch": 0.64, "learning_rate": 7.257965431065971e-05, "loss": 2.2969, "step": 51152 }, { "epoch": 0.64, "learning_rate": 7.25537343101566e-05, "loss": 2.2809, "step": 51160 }, { "epoch": 0.64, "learning_rate": 7.252781806530173e-05, "loss": 2.2655, "step": 51168 }, { "epoch": 0.64, "learning_rate": 7.25019055786944e-05, "loss": 2.3136, "step": 51176 }, { "epoch": 0.64, "learning_rate": 7.247599685293345e-05, "loss": 2.2816, "step": 51184 }, { "epoch": 0.64, "learning_rate": 7.245009189061736e-05, "loss": 2.2842, "step": 51192 }, { "epoch": 0.64, "learning_rate": 7.242419069434434e-05, "loss": 2.2568, "step": 51200 }, { "epoch": 0.64, "learning_rate": 7.239829326671206e-05, "loss": 2.2993, "step": 51208 }, { "epoch": 0.64, "learning_rate": 7.237239961031785e-05, "loss": 2.2776, "step": 51216 }, { "epoch": 0.64, "learning_rate": 7.234650972775885e-05, "loss": 2.2768, "step": 51224 }, { "epoch": 0.64, "learning_rate": 7.232062362163145e-05, "loss": 2.2978, "step": 51232 }, { "epoch": 0.64, "learning_rate": 7.229474129453212e-05, "loss": 2.2981, "step": 51240 }, { "epoch": 0.64, "learning_rate": 7.226886274905653e-05, "loss": 2.2841, "step": 51248 }, { "epoch": 0.64, "learning_rate": 7.224298798780016e-05, "loss": 2.2849, "step": 51256 }, { "epoch": 0.64, "learning_rate": 7.221711701335825e-05, "loss": 2.2789, "step": 51264 }, { "epoch": 0.64, "learning_rate": 7.219124982832532e-05, "loss": 2.2816, "step": 51272 }, { "epoch": 0.64, "learning_rate": 7.216538643529584e-05, "loss": 2.2631, "step": 51280 }, { "epoch": 0.64, "learning_rate": 7.213952683686371e-05, "loss": 2.2641, "step": 51288 }, { "epoch": 0.64, "learning_rate": 7.211367103562253e-05, "loss": 2.2966, "step": 51296 }, { "epoch": 0.64, "learning_rate": 7.208781903416548e-05, "loss": 2.2889, "step": 51304 }, { "epoch": 0.64, "learning_rate": 7.20619708350853e-05, "loss": 2.2868, "step": 51312 }, { "epoch": 0.64, "learning_rate": 7.203612644097452e-05, "loss": 2.2752, "step": 51320 }, { "epoch": 0.64, "learning_rate": 7.201028585442513e-05, "loss": 2.2658, "step": 51328 }, { "epoch": 0.64, "learning_rate": 7.198444907802881e-05, "loss": 2.28, "step": 51336 }, { "epoch": 0.64, "learning_rate": 7.195861611437685e-05, "loss": 2.2611, "step": 51344 }, { "epoch": 0.64, "learning_rate": 7.193278696606014e-05, "loss": 2.2846, "step": 51352 }, { "epoch": 0.64, "learning_rate": 7.190696163566919e-05, "loss": 2.286, "step": 51360 }, { "epoch": 0.64, "learning_rate": 7.188114012579412e-05, "loss": 2.2942, "step": 51368 }, { "epoch": 0.64, "learning_rate": 7.185532243902474e-05, "loss": 2.264, "step": 51376 }, { "epoch": 0.64, "learning_rate": 7.182950857795035e-05, "loss": 2.2863, "step": 51384 }, { "epoch": 0.64, "learning_rate": 7.180369854515995e-05, "loss": 2.2785, "step": 51392 }, { "epoch": 0.64, "learning_rate": 7.177789234324219e-05, "loss": 2.2961, "step": 51400 }, { "epoch": 0.64, "learning_rate": 7.175208997478525e-05, "loss": 2.2723, "step": 51408 }, { "epoch": 0.64, "learning_rate": 7.172629144237694e-05, "loss": 2.2939, "step": 51416 }, { "epoch": 0.64, "learning_rate": 7.170049674860473e-05, "loss": 2.2835, "step": 51424 }, { "epoch": 0.64, "learning_rate": 7.16747058960557e-05, "loss": 2.2826, "step": 51432 }, { "epoch": 0.64, "learning_rate": 7.164891888731649e-05, "loss": 2.2873, "step": 51440 }, { "epoch": 0.64, "learning_rate": 7.162313572497336e-05, "loss": 2.2834, "step": 51448 }, { "epoch": 0.64, "learning_rate": 7.159735641161234e-05, "loss": 2.2841, "step": 51456 }, { "epoch": 0.64, "learning_rate": 7.157158094981882e-05, "loss": 2.2986, "step": 51464 }, { "epoch": 0.64, "learning_rate": 7.154580934217803e-05, "loss": 2.2891, "step": 51472 }, { "epoch": 0.64, "learning_rate": 7.152004159127463e-05, "loss": 2.2804, "step": 51480 }, { "epoch": 0.64, "learning_rate": 7.149427769969301e-05, "loss": 2.2863, "step": 51488 }, { "epoch": 0.64, "learning_rate": 7.14685176700172e-05, "loss": 2.2873, "step": 51496 }, { "epoch": 0.64, "learning_rate": 7.144276150483067e-05, "loss": 2.252, "step": 51504 }, { "epoch": 0.64, "learning_rate": 7.141700920671673e-05, "loss": 2.2907, "step": 51512 }, { "epoch": 0.64, "learning_rate": 7.139126077825817e-05, "loss": 2.278, "step": 51520 }, { "epoch": 0.64, "learning_rate": 7.13655162220373e-05, "loss": 2.2674, "step": 51528 }, { "epoch": 0.64, "learning_rate": 7.133977554063634e-05, "loss": 2.258, "step": 51536 }, { "epoch": 0.64, "learning_rate": 7.131403873663673e-05, "loss": 2.2839, "step": 51544 }, { "epoch": 0.64, "learning_rate": 7.128830581261987e-05, "loss": 2.2718, "step": 51552 }, { "epoch": 0.64, "learning_rate": 7.126257677116663e-05, "loss": 2.2713, "step": 51560 }, { "epoch": 0.64, "learning_rate": 7.123685161485738e-05, "loss": 2.2934, "step": 51568 }, { "epoch": 0.64, "learning_rate": 7.121113034627229e-05, "loss": 2.2814, "step": 51576 }, { "epoch": 0.64, "learning_rate": 7.118541296799104e-05, "loss": 2.2717, "step": 51584 }, { "epoch": 0.64, "learning_rate": 7.115969948259293e-05, "loss": 2.2928, "step": 51592 }, { "epoch": 0.65, "learning_rate": 7.113398989265691e-05, "loss": 2.2868, "step": 51600 }, { "epoch": 0.65, "learning_rate": 7.110828420076143e-05, "loss": 2.2616, "step": 51608 }, { "epoch": 0.65, "learning_rate": 7.108258240948469e-05, "loss": 2.2741, "step": 51616 }, { "epoch": 0.65, "learning_rate": 7.105688452140442e-05, "loss": 2.2704, "step": 51624 }, { "epoch": 0.65, "learning_rate": 7.103119053909797e-05, "loss": 2.2696, "step": 51632 }, { "epoch": 0.65, "learning_rate": 7.10055004651423e-05, "loss": 2.2927, "step": 51640 }, { "epoch": 0.65, "learning_rate": 7.097981430211395e-05, "loss": 2.2569, "step": 51648 }, { "epoch": 0.65, "learning_rate": 7.095413205258916e-05, "loss": 2.284, "step": 51656 }, { "epoch": 0.65, "learning_rate": 7.092845371914367e-05, "loss": 2.2688, "step": 51664 }, { "epoch": 0.65, "learning_rate": 7.09027793043529e-05, "loss": 2.2819, "step": 51672 }, { "epoch": 0.65, "learning_rate": 7.087710881079179e-05, "loss": 2.2877, "step": 51680 }, { "epoch": 0.65, "learning_rate": 7.085144224103499e-05, "loss": 2.2501, "step": 51688 }, { "epoch": 0.65, "learning_rate": 7.082577959765672e-05, "loss": 2.2829, "step": 51696 }, { "epoch": 0.65, "learning_rate": 7.08001208832308e-05, "loss": 2.2829, "step": 51704 }, { "epoch": 0.65, "learning_rate": 7.077446610033061e-05, "loss": 2.2597, "step": 51712 }, { "epoch": 0.65, "learning_rate": 7.074881525152919e-05, "loss": 2.2776, "step": 51720 }, { "epoch": 0.65, "learning_rate": 7.072316833939923e-05, "loss": 2.2745, "step": 51728 }, { "epoch": 0.65, "learning_rate": 7.069752536651291e-05, "loss": 2.2633, "step": 51736 }, { "epoch": 0.65, "learning_rate": 7.067188633544211e-05, "loss": 2.2577, "step": 51744 }, { "epoch": 0.65, "learning_rate": 7.064625124875825e-05, "loss": 2.271, "step": 51752 }, { "epoch": 0.65, "learning_rate": 7.062062010903239e-05, "loss": 2.2964, "step": 51760 }, { "epoch": 0.65, "learning_rate": 7.059499291883524e-05, "loss": 2.2872, "step": 51768 }, { "epoch": 0.65, "learning_rate": 7.056936968073697e-05, "loss": 2.2943, "step": 51776 }, { "epoch": 0.65, "learning_rate": 7.054375039730749e-05, "loss": 2.2775, "step": 51784 }, { "epoch": 0.65, "learning_rate": 7.051813507111634e-05, "loss": 2.3028, "step": 51792 }, { "epoch": 0.65, "learning_rate": 7.049252370473245e-05, "loss": 2.2656, "step": 51800 }, { "epoch": 0.65, "learning_rate": 7.046691630072464e-05, "loss": 2.2737, "step": 51808 }, { "epoch": 0.65, "learning_rate": 7.044131286166104e-05, "loss": 2.2872, "step": 51816 }, { "epoch": 0.65, "learning_rate": 7.041571339010966e-05, "loss": 2.2812, "step": 51824 }, { "epoch": 0.65, "learning_rate": 7.039011788863796e-05, "loss": 2.2974, "step": 51832 }, { "epoch": 0.65, "learning_rate": 7.036452635981292e-05, "loss": 2.2546, "step": 51840 }, { "epoch": 0.65, "learning_rate": 7.033893880620132e-05, "loss": 2.2738, "step": 51848 }, { "epoch": 0.65, "learning_rate": 7.031335523036944e-05, "loss": 2.2607, "step": 51856 }, { "epoch": 0.65, "learning_rate": 7.028777563488316e-05, "loss": 2.2566, "step": 51864 }, { "epoch": 0.65, "learning_rate": 7.026220002230799e-05, "loss": 2.2674, "step": 51872 }, { "epoch": 0.65, "learning_rate": 7.023662839520892e-05, "loss": 2.2842, "step": 51880 }, { "epoch": 0.65, "learning_rate": 7.021106075615076e-05, "loss": 2.2684, "step": 51888 }, { "epoch": 0.65, "learning_rate": 7.018549710769773e-05, "loss": 2.2813, "step": 51896 }, { "epoch": 0.65, "learning_rate": 7.015993745241374e-05, "loss": 2.2962, "step": 51904 }, { "epoch": 0.65, "learning_rate": 7.013438179286229e-05, "loss": 2.3061, "step": 51912 }, { "epoch": 0.65, "learning_rate": 7.010883013160645e-05, "loss": 2.2899, "step": 51920 }, { "epoch": 0.65, "learning_rate": 7.00832824712089e-05, "loss": 2.2693, "step": 51928 }, { "epoch": 0.65, "learning_rate": 7.005773881423197e-05, "loss": 2.267, "step": 51936 }, { "epoch": 0.65, "learning_rate": 7.003219916323747e-05, "loss": 2.2926, "step": 51944 }, { "epoch": 0.65, "learning_rate": 7.000666352078695e-05, "loss": 2.2925, "step": 51952 }, { "epoch": 0.65, "learning_rate": 6.998113188944146e-05, "loss": 2.2763, "step": 51960 }, { "epoch": 0.65, "learning_rate": 6.995560427176166e-05, "loss": 2.2742, "step": 51968 }, { "epoch": 0.65, "learning_rate": 6.993008067030788e-05, "loss": 2.2603, "step": 51976 }, { "epoch": 0.65, "learning_rate": 6.990456108763995e-05, "loss": 2.2819, "step": 51984 }, { "epoch": 0.65, "learning_rate": 6.987904552631731e-05, "loss": 2.292, "step": 51992 }, { "epoch": 0.65, "learning_rate": 6.985353398889913e-05, "loss": 2.2897, "step": 52000 }, { "epoch": 0.65, "learning_rate": 6.982802647794398e-05, "loss": 2.2672, "step": 52008 }, { "epoch": 0.65, "learning_rate": 6.980252299601015e-05, "loss": 2.2743, "step": 52016 }, { "epoch": 0.65, "learning_rate": 6.977702354565549e-05, "loss": 2.2691, "step": 52024 }, { "epoch": 0.65, "learning_rate": 6.975152812943742e-05, "loss": 2.2864, "step": 52032 }, { "epoch": 0.65, "learning_rate": 6.972603674991308e-05, "loss": 2.287, "step": 52040 }, { "epoch": 0.65, "learning_rate": 6.970054940963903e-05, "loss": 2.2924, "step": 52048 }, { "epoch": 0.65, "learning_rate": 6.967506611117147e-05, "loss": 2.2605, "step": 52056 }, { "epoch": 0.65, "learning_rate": 6.964958685706637e-05, "loss": 2.284, "step": 52064 }, { "epoch": 0.65, "learning_rate": 6.962411164987898e-05, "loss": 2.2652, "step": 52072 }, { "epoch": 0.65, "learning_rate": 6.959864049216451e-05, "loss": 2.2705, "step": 52080 }, { "epoch": 0.65, "learning_rate": 6.957317338647742e-05, "loss": 2.2751, "step": 52088 }, { "epoch": 0.65, "learning_rate": 6.954771033537195e-05, "loss": 2.2833, "step": 52096 }, { "epoch": 0.65, "learning_rate": 6.952225134140197e-05, "loss": 2.2667, "step": 52104 }, { "epoch": 0.65, "learning_rate": 6.949679640712074e-05, "loss": 2.2702, "step": 52112 }, { "epoch": 0.65, "learning_rate": 6.947134553508138e-05, "loss": 2.2823, "step": 52120 }, { "epoch": 0.65, "learning_rate": 6.944589872783645e-05, "loss": 2.2729, "step": 52128 }, { "epoch": 0.65, "learning_rate": 6.942045598793801e-05, "loss": 2.2863, "step": 52136 }, { "epoch": 0.65, "learning_rate": 6.939501731793796e-05, "loss": 2.2566, "step": 52144 }, { "epoch": 0.65, "learning_rate": 6.936958272038753e-05, "loss": 2.2851, "step": 52152 }, { "epoch": 0.65, "learning_rate": 6.934415219783777e-05, "loss": 2.2822, "step": 52160 }, { "epoch": 0.65, "learning_rate": 6.931872575283916e-05, "loss": 2.2661, "step": 52168 }, { "epoch": 0.65, "learning_rate": 6.929330338794186e-05, "loss": 2.2544, "step": 52176 }, { "epoch": 0.65, "learning_rate": 6.926788510569558e-05, "loss": 2.276, "step": 52184 }, { "epoch": 0.65, "learning_rate": 6.92424709086496e-05, "loss": 2.2695, "step": 52192 }, { "epoch": 0.65, "learning_rate": 6.921706079935284e-05, "loss": 2.2744, "step": 52200 }, { "epoch": 0.65, "learning_rate": 6.919165478035382e-05, "loss": 2.249, "step": 52208 }, { "epoch": 0.65, "learning_rate": 6.916625285420057e-05, "loss": 2.2891, "step": 52216 }, { "epoch": 0.65, "learning_rate": 6.91408550234408e-05, "loss": 2.2749, "step": 52224 }, { "epoch": 0.65, "learning_rate": 6.911546129062174e-05, "loss": 2.2731, "step": 52232 }, { "epoch": 0.65, "learning_rate": 6.909007165829024e-05, "loss": 2.2604, "step": 52240 }, { "epoch": 0.65, "learning_rate": 6.906468612899278e-05, "loss": 2.2928, "step": 52248 }, { "epoch": 0.65, "learning_rate": 6.903930470527531e-05, "loss": 2.2838, "step": 52256 }, { "epoch": 0.65, "learning_rate": 6.901392738968349e-05, "loss": 2.2608, "step": 52264 }, { "epoch": 0.65, "learning_rate": 6.898855418476252e-05, "loss": 2.268, "step": 52272 }, { "epoch": 0.65, "learning_rate": 6.896318509305718e-05, "loss": 2.2768, "step": 52280 }, { "epoch": 0.65, "learning_rate": 6.893782011711182e-05, "loss": 2.295, "step": 52288 }, { "epoch": 0.65, "learning_rate": 6.891245925947048e-05, "loss": 2.2872, "step": 52296 }, { "epoch": 0.65, "learning_rate": 6.888710252267665e-05, "loss": 2.2949, "step": 52304 }, { "epoch": 0.65, "learning_rate": 6.886174990927348e-05, "loss": 2.2843, "step": 52312 }, { "epoch": 0.65, "learning_rate": 6.883640142180368e-05, "loss": 2.2809, "step": 52320 }, { "epoch": 0.65, "learning_rate": 6.881105706280953e-05, "loss": 2.2787, "step": 52328 }, { "epoch": 0.65, "learning_rate": 6.878571683483304e-05, "loss": 2.283, "step": 52336 }, { "epoch": 0.65, "learning_rate": 6.876038074041555e-05, "loss": 2.2846, "step": 52344 }, { "epoch": 0.65, "learning_rate": 6.873504878209823e-05, "loss": 2.2898, "step": 52352 }, { "epoch": 0.65, "learning_rate": 6.870972096242174e-05, "loss": 2.2833, "step": 52360 }, { "epoch": 0.65, "learning_rate": 6.86843972839262e-05, "loss": 2.2726, "step": 52368 }, { "epoch": 0.65, "learning_rate": 6.865907774915157e-05, "loss": 2.2843, "step": 52376 }, { "epoch": 0.65, "learning_rate": 6.863376236063712e-05, "loss": 2.2916, "step": 52384 }, { "epoch": 0.65, "learning_rate": 6.860845112092195e-05, "loss": 2.2659, "step": 52392 }, { "epoch": 0.66, "learning_rate": 6.858314403254464e-05, "loss": 2.2758, "step": 52400 }, { "epoch": 0.66, "learning_rate": 6.855784109804323e-05, "loss": 2.2861, "step": 52408 }, { "epoch": 0.66, "learning_rate": 6.853254231995556e-05, "loss": 2.2619, "step": 52416 }, { "epoch": 0.66, "learning_rate": 6.850724770081894e-05, "loss": 2.259, "step": 52424 }, { "epoch": 0.66, "learning_rate": 6.848195724317024e-05, "loss": 2.2812, "step": 52432 }, { "epoch": 0.66, "learning_rate": 6.845667094954601e-05, "loss": 2.269, "step": 52440 }, { "epoch": 0.66, "learning_rate": 6.843138882248225e-05, "loss": 2.2673, "step": 52448 }, { "epoch": 0.66, "learning_rate": 6.840611086451467e-05, "loss": 2.2668, "step": 52456 }, { "epoch": 0.66, "learning_rate": 6.838083707817848e-05, "loss": 2.2826, "step": 52464 }, { "epoch": 0.66, "learning_rate": 6.83555674660085e-05, "loss": 2.282, "step": 52472 }, { "epoch": 0.66, "learning_rate": 6.833030203053913e-05, "loss": 2.2647, "step": 52480 }, { "epoch": 0.66, "learning_rate": 6.830504077430437e-05, "loss": 2.2569, "step": 52488 }, { "epoch": 0.66, "learning_rate": 6.827978369983776e-05, "loss": 2.2892, "step": 52496 }, { "epoch": 0.66, "learning_rate": 6.825453080967244e-05, "loss": 2.2619, "step": 52504 }, { "epoch": 0.66, "learning_rate": 6.822928210634114e-05, "loss": 2.2944, "step": 52512 }, { "epoch": 0.66, "learning_rate": 6.820403759237615e-05, "loss": 2.2842, "step": 52520 }, { "epoch": 0.66, "learning_rate": 6.817879727030938e-05, "loss": 2.2615, "step": 52528 }, { "epoch": 0.66, "learning_rate": 6.815356114267224e-05, "loss": 2.2687, "step": 52536 }, { "epoch": 0.66, "learning_rate": 6.812832921199584e-05, "loss": 2.2757, "step": 52544 }, { "epoch": 0.66, "learning_rate": 6.810310148081074e-05, "loss": 2.2693, "step": 52552 }, { "epoch": 0.66, "learning_rate": 6.807787795164712e-05, "loss": 2.2876, "step": 52560 }, { "epoch": 0.66, "learning_rate": 6.805265862703487e-05, "loss": 2.2892, "step": 52568 }, { "epoch": 0.66, "learning_rate": 6.802744350950326e-05, "loss": 2.2786, "step": 52576 }, { "epoch": 0.66, "learning_rate": 6.80022326015812e-05, "loss": 2.2513, "step": 52584 }, { "epoch": 0.66, "learning_rate": 6.797702590579726e-05, "loss": 2.2718, "step": 52592 }, { "epoch": 0.66, "learning_rate": 6.795182342467948e-05, "loss": 2.2647, "step": 52600 }, { "epoch": 0.66, "learning_rate": 6.792662516075561e-05, "loss": 2.2937, "step": 52608 }, { "epoch": 0.66, "learning_rate": 6.79014311165528e-05, "loss": 2.2727, "step": 52616 }, { "epoch": 0.66, "learning_rate": 6.787624129459788e-05, "loss": 2.2667, "step": 52624 }, { "epoch": 0.66, "learning_rate": 6.785105569741734e-05, "loss": 2.268, "step": 52632 }, { "epoch": 0.66, "learning_rate": 6.7825874327537e-05, "loss": 2.2886, "step": 52640 }, { "epoch": 0.66, "learning_rate": 6.780069718748256e-05, "loss": 2.2785, "step": 52648 }, { "epoch": 0.66, "learning_rate": 6.777552427977906e-05, "loss": 2.2725, "step": 52656 }, { "epoch": 0.66, "learning_rate": 6.775035560695117e-05, "loss": 2.2701, "step": 52664 }, { "epoch": 0.66, "learning_rate": 6.77251911715233e-05, "loss": 2.2621, "step": 52672 }, { "epoch": 0.66, "learning_rate": 6.770003097601913e-05, "loss": 2.2788, "step": 52680 }, { "epoch": 0.66, "learning_rate": 6.767487502296223e-05, "loss": 2.2999, "step": 52688 }, { "epoch": 0.66, "learning_rate": 6.764972331487551e-05, "loss": 2.272, "step": 52696 }, { "epoch": 0.66, "learning_rate": 6.762457585428157e-05, "loss": 2.2705, "step": 52704 }, { "epoch": 0.66, "learning_rate": 6.75994326437026e-05, "loss": 2.2687, "step": 52712 }, { "epoch": 0.66, "learning_rate": 6.757429368566022e-05, "loss": 2.2663, "step": 52720 }, { "epoch": 0.66, "learning_rate": 6.754915898267579e-05, "loss": 2.2976, "step": 52728 }, { "epoch": 0.66, "learning_rate": 6.752402853727023e-05, "loss": 2.2605, "step": 52736 }, { "epoch": 0.66, "learning_rate": 6.749890235196387e-05, "loss": 2.2931, "step": 52744 }, { "epoch": 0.66, "learning_rate": 6.747378042927681e-05, "loss": 2.2759, "step": 52752 }, { "epoch": 0.66, "learning_rate": 6.74486627717286e-05, "loss": 2.267, "step": 52760 }, { "epoch": 0.66, "learning_rate": 6.74235493818384e-05, "loss": 2.2635, "step": 52768 }, { "epoch": 0.66, "learning_rate": 6.739844026212494e-05, "loss": 2.2744, "step": 52776 }, { "epoch": 0.66, "learning_rate": 6.737333541510656e-05, "loss": 2.2937, "step": 52784 }, { "epoch": 0.66, "learning_rate": 6.734823484330106e-05, "loss": 2.2804, "step": 52792 }, { "epoch": 0.66, "learning_rate": 6.732313854922594e-05, "loss": 2.2481, "step": 52800 }, { "epoch": 0.66, "learning_rate": 6.729804653539823e-05, "loss": 2.2934, "step": 52808 }, { "epoch": 0.66, "learning_rate": 6.727295880433446e-05, "loss": 2.2371, "step": 52816 }, { "epoch": 0.66, "learning_rate": 6.724787535855081e-05, "loss": 2.2699, "step": 52824 }, { "epoch": 0.66, "learning_rate": 6.722279620056306e-05, "loss": 2.2522, "step": 52832 }, { "epoch": 0.66, "learning_rate": 6.719772133288642e-05, "loss": 2.254, "step": 52840 }, { "epoch": 0.66, "learning_rate": 6.717265075803581e-05, "loss": 2.2726, "step": 52848 }, { "epoch": 0.66, "learning_rate": 6.714758447852566e-05, "loss": 2.286, "step": 52856 }, { "epoch": 0.66, "learning_rate": 6.712252249686996e-05, "loss": 2.2798, "step": 52864 }, { "epoch": 0.66, "learning_rate": 6.709746481558228e-05, "loss": 2.2871, "step": 52872 }, { "epoch": 0.66, "learning_rate": 6.707241143717584e-05, "loss": 2.2921, "step": 52880 }, { "epoch": 0.66, "learning_rate": 6.704736236416326e-05, "loss": 2.2625, "step": 52888 }, { "epoch": 0.66, "learning_rate": 6.702231759905682e-05, "loss": 2.2784, "step": 52896 }, { "epoch": 0.66, "learning_rate": 6.699727714436846e-05, "loss": 2.3037, "step": 52904 }, { "epoch": 0.66, "learning_rate": 6.697224100260947e-05, "loss": 2.285, "step": 52912 }, { "epoch": 0.66, "learning_rate": 6.694720917629096e-05, "loss": 2.2763, "step": 52920 }, { "epoch": 0.66, "learning_rate": 6.692218166792339e-05, "loss": 2.276, "step": 52928 }, { "epoch": 0.66, "learning_rate": 6.689715848001688e-05, "loss": 2.2715, "step": 52936 }, { "epoch": 0.66, "learning_rate": 6.687213961508121e-05, "loss": 2.2522, "step": 52944 }, { "epoch": 0.66, "learning_rate": 6.684712507562548e-05, "loss": 2.2733, "step": 52952 }, { "epoch": 0.66, "learning_rate": 6.682211486415862e-05, "loss": 2.2649, "step": 52960 }, { "epoch": 0.66, "learning_rate": 6.679710898318903e-05, "loss": 2.3027, "step": 52968 }, { "epoch": 0.66, "learning_rate": 6.677210743522453e-05, "loss": 2.276, "step": 52976 }, { "epoch": 0.66, "learning_rate": 6.674711022277278e-05, "loss": 2.2645, "step": 52984 }, { "epoch": 0.66, "learning_rate": 6.672211734834072e-05, "loss": 2.256, "step": 52992 }, { "epoch": 0.66, "learning_rate": 6.66971288144351e-05, "loss": 2.2754, "step": 53000 }, { "epoch": 0.66, "learning_rate": 6.667214462356212e-05, "loss": 2.2688, "step": 53008 }, { "epoch": 0.66, "learning_rate": 6.664716477822747e-05, "loss": 2.2851, "step": 53016 }, { "epoch": 0.66, "learning_rate": 6.662218928093656e-05, "loss": 2.2589, "step": 53024 }, { "epoch": 0.66, "learning_rate": 6.65972181341943e-05, "loss": 2.2824, "step": 53032 }, { "epoch": 0.66, "learning_rate": 6.65722513405051e-05, "loss": 2.2812, "step": 53040 }, { "epoch": 0.66, "learning_rate": 6.654728890237302e-05, "loss": 2.2744, "step": 53048 }, { "epoch": 0.66, "learning_rate": 6.652233082230167e-05, "loss": 2.2756, "step": 53056 }, { "epoch": 0.66, "learning_rate": 6.649737710279415e-05, "loss": 2.2789, "step": 53064 }, { "epoch": 0.66, "learning_rate": 6.647242774635323e-05, "loss": 2.2598, "step": 53072 }, { "epoch": 0.66, "learning_rate": 6.644748275548113e-05, "loss": 2.2871, "step": 53080 }, { "epoch": 0.66, "learning_rate": 6.642254213267978e-05, "loss": 2.2648, "step": 53088 }, { "epoch": 0.66, "learning_rate": 6.63976058804505e-05, "loss": 2.2792, "step": 53096 }, { "epoch": 0.66, "learning_rate": 6.637267400129428e-05, "loss": 2.2696, "step": 53104 }, { "epoch": 0.66, "learning_rate": 6.634774649771166e-05, "loss": 2.2694, "step": 53112 }, { "epoch": 0.66, "learning_rate": 6.632282337220273e-05, "loss": 2.2551, "step": 53120 }, { "epoch": 0.66, "learning_rate": 6.629790462726712e-05, "loss": 2.2857, "step": 53128 }, { "epoch": 0.66, "learning_rate": 6.627299026540404e-05, "loss": 2.2881, "step": 53136 }, { "epoch": 0.66, "learning_rate": 6.624808028911227e-05, "loss": 2.2535, "step": 53144 }, { "epoch": 0.66, "learning_rate": 6.622317470089013e-05, "loss": 2.2861, "step": 53152 }, { "epoch": 0.66, "learning_rate": 6.619827350323551e-05, "loss": 2.2669, "step": 53160 }, { "epoch": 0.66, "learning_rate": 6.617337669864585e-05, "loss": 2.2894, "step": 53168 }, { "epoch": 0.66, "learning_rate": 6.614848428961822e-05, "loss": 2.2506, "step": 53176 }, { "epoch": 0.66, "learning_rate": 6.612359627864911e-05, "loss": 2.2699, "step": 53184 }, { "epoch": 0.66, "learning_rate": 6.609871266823469e-05, "loss": 2.2736, "step": 53192 }, { "epoch": 0.67, "learning_rate": 6.607383346087062e-05, "loss": 2.2744, "step": 53200 }, { "epoch": 0.67, "learning_rate": 6.604895865905211e-05, "loss": 2.2612, "step": 53208 }, { "epoch": 0.67, "learning_rate": 6.602408826527408e-05, "loss": 2.2646, "step": 53216 }, { "epoch": 0.67, "learning_rate": 6.599922228203076e-05, "loss": 2.2841, "step": 53224 }, { "epoch": 0.67, "learning_rate": 6.597436071181616e-05, "loss": 2.2816, "step": 53232 }, { "epoch": 0.67, "learning_rate": 6.594950355712372e-05, "loss": 2.2712, "step": 53240 }, { "epoch": 0.67, "learning_rate": 6.592465082044642e-05, "loss": 2.2515, "step": 53248 }, { "epoch": 0.67, "learning_rate": 6.589980250427697e-05, "loss": 2.2737, "step": 53256 }, { "epoch": 0.67, "learning_rate": 6.587495861110738e-05, "loss": 2.2694, "step": 53264 }, { "epoch": 0.67, "learning_rate": 6.585011914342944e-05, "loss": 2.2542, "step": 53272 }, { "epoch": 0.67, "learning_rate": 6.582528410373441e-05, "loss": 2.2778, "step": 53280 }, { "epoch": 0.67, "learning_rate": 6.580045349451302e-05, "loss": 2.2696, "step": 53288 }, { "epoch": 0.67, "learning_rate": 6.577562731825573e-05, "loss": 2.2844, "step": 53296 }, { "epoch": 0.67, "learning_rate": 6.575080557745244e-05, "loss": 2.2577, "step": 53304 }, { "epoch": 0.67, "learning_rate": 6.57259882745926e-05, "loss": 2.272, "step": 53312 }, { "epoch": 0.67, "learning_rate": 6.570117541216532e-05, "loss": 2.2651, "step": 53320 }, { "epoch": 0.67, "learning_rate": 6.567636699265904e-05, "loss": 2.2732, "step": 53328 }, { "epoch": 0.67, "learning_rate": 6.565156301856206e-05, "loss": 2.2705, "step": 53336 }, { "epoch": 0.67, "learning_rate": 6.562676349236201e-05, "loss": 2.2632, "step": 53344 }, { "epoch": 0.67, "learning_rate": 6.560196841654613e-05, "loss": 2.2637, "step": 53352 }, { "epoch": 0.67, "learning_rate": 6.557717779360127e-05, "loss": 2.2885, "step": 53360 }, { "epoch": 0.67, "learning_rate": 6.555239162601375e-05, "loss": 2.302, "step": 53368 }, { "epoch": 0.67, "learning_rate": 6.552760991626949e-05, "loss": 2.2661, "step": 53376 }, { "epoch": 0.67, "learning_rate": 6.550283266685399e-05, "loss": 2.2732, "step": 53384 }, { "epoch": 0.67, "learning_rate": 6.547805988025222e-05, "loss": 2.2884, "step": 53392 }, { "epoch": 0.67, "learning_rate": 6.545329155894872e-05, "loss": 2.2969, "step": 53400 }, { "epoch": 0.67, "learning_rate": 6.542852770542775e-05, "loss": 2.2764, "step": 53408 }, { "epoch": 0.67, "learning_rate": 6.540376832217285e-05, "loss": 2.2663, "step": 53416 }, { "epoch": 0.67, "learning_rate": 6.53790134116673e-05, "loss": 2.2682, "step": 53424 }, { "epoch": 0.67, "learning_rate": 6.535426297639386e-05, "loss": 2.2653, "step": 53432 }, { "epoch": 0.67, "learning_rate": 6.532951701883483e-05, "loss": 2.2732, "step": 53440 }, { "epoch": 0.67, "learning_rate": 6.530477554147221e-05, "loss": 2.2731, "step": 53448 }, { "epoch": 0.67, "learning_rate": 6.52800385467873e-05, "loss": 2.2818, "step": 53456 }, { "epoch": 0.67, "learning_rate": 6.525530603726108e-05, "loss": 2.2946, "step": 53464 }, { "epoch": 0.67, "learning_rate": 6.523057801537422e-05, "loss": 2.2812, "step": 53472 }, { "epoch": 0.67, "learning_rate": 6.520585448360664e-05, "loss": 2.2719, "step": 53480 }, { "epoch": 0.67, "learning_rate": 6.51811354444381e-05, "loss": 2.2912, "step": 53488 }, { "epoch": 0.67, "learning_rate": 6.515642090034768e-05, "loss": 2.2606, "step": 53496 }, { "epoch": 0.67, "learning_rate": 6.51317108538141e-05, "loss": 2.2778, "step": 53504 }, { "epoch": 0.67, "learning_rate": 6.510700530731577e-05, "loss": 2.2814, "step": 53512 }, { "epoch": 0.67, "learning_rate": 6.508230426333035e-05, "loss": 2.2885, "step": 53520 }, { "epoch": 0.67, "learning_rate": 6.505760772433533e-05, "loss": 2.2791, "step": 53528 }, { "epoch": 0.67, "learning_rate": 6.503291569280763e-05, "loss": 2.2717, "step": 53536 }, { "epoch": 0.67, "learning_rate": 6.500822817122363e-05, "loss": 2.2665, "step": 53544 }, { "epoch": 0.67, "learning_rate": 6.498354516205947e-05, "loss": 2.27, "step": 53552 }, { "epoch": 0.67, "learning_rate": 6.495886666779059e-05, "loss": 2.279, "step": 53560 }, { "epoch": 0.67, "learning_rate": 6.49341926908922e-05, "loss": 2.2633, "step": 53568 }, { "epoch": 0.67, "learning_rate": 6.490952323383892e-05, "loss": 2.2409, "step": 53576 }, { "epoch": 0.67, "learning_rate": 6.488485829910495e-05, "loss": 2.2768, "step": 53584 }, { "epoch": 0.67, "learning_rate": 6.486019788916409e-05, "loss": 2.2809, "step": 53592 }, { "epoch": 0.67, "learning_rate": 6.483554200648957e-05, "loss": 2.2848, "step": 53600 }, { "epoch": 0.67, "learning_rate": 6.481089065355428e-05, "loss": 2.2872, "step": 53608 }, { "epoch": 0.67, "learning_rate": 6.478624383283062e-05, "loss": 2.2808, "step": 53616 }, { "epoch": 0.67, "learning_rate": 6.47616015467905e-05, "loss": 2.2836, "step": 53624 }, { "epoch": 0.67, "learning_rate": 6.473696379790541e-05, "loss": 2.2655, "step": 53632 }, { "epoch": 0.67, "learning_rate": 6.471233058864637e-05, "loss": 2.2716, "step": 53640 }, { "epoch": 0.67, "learning_rate": 6.468770192148396e-05, "loss": 2.2783, "step": 53648 }, { "epoch": 0.67, "learning_rate": 6.466307779888829e-05, "loss": 2.2704, "step": 53656 }, { "epoch": 0.67, "learning_rate": 6.463845822332903e-05, "loss": 2.2637, "step": 53664 }, { "epoch": 0.67, "learning_rate": 6.461384319727537e-05, "loss": 2.2746, "step": 53672 }, { "epoch": 0.67, "learning_rate": 6.458923272319608e-05, "loss": 2.2786, "step": 53680 }, { "epoch": 0.67, "learning_rate": 6.456462680355944e-05, "loss": 2.2658, "step": 53688 }, { "epoch": 0.67, "learning_rate": 6.454002544083327e-05, "loss": 2.2716, "step": 53696 }, { "epoch": 0.67, "learning_rate": 6.451542863748494e-05, "loss": 2.2689, "step": 53704 }, { "epoch": 0.67, "learning_rate": 6.449083639598142e-05, "loss": 2.2737, "step": 53712 }, { "epoch": 0.67, "learning_rate": 6.44662487187891e-05, "loss": 2.2613, "step": 53720 }, { "epoch": 0.67, "learning_rate": 6.444166560837406e-05, "loss": 2.2867, "step": 53728 }, { "epoch": 0.67, "learning_rate": 6.441708706720177e-05, "loss": 2.2574, "step": 53736 }, { "epoch": 0.67, "learning_rate": 6.439251309773742e-05, "loss": 2.2724, "step": 53744 }, { "epoch": 0.67, "learning_rate": 6.436794370244552e-05, "loss": 2.2693, "step": 53752 }, { "epoch": 0.67, "learning_rate": 6.434337888379037e-05, "loss": 2.2665, "step": 53760 }, { "epoch": 0.67, "learning_rate": 6.431881864423557e-05, "loss": 2.269, "step": 53768 }, { "epoch": 0.67, "learning_rate": 6.429426298624439e-05, "loss": 2.2772, "step": 53776 }, { "epoch": 0.67, "learning_rate": 6.42697119122797e-05, "loss": 2.2908, "step": 53784 }, { "epoch": 0.67, "learning_rate": 6.424516542480374e-05, "loss": 2.2569, "step": 53792 }, { "epoch": 0.67, "learning_rate": 6.422062352627844e-05, "loss": 2.2412, "step": 53800 }, { "epoch": 0.67, "learning_rate": 6.419608621916526e-05, "loss": 2.2548, "step": 53808 }, { "epoch": 0.67, "learning_rate": 6.4171553505925e-05, "loss": 2.2814, "step": 53816 }, { "epoch": 0.67, "learning_rate": 6.414702538901833e-05, "loss": 2.2739, "step": 53824 }, { "epoch": 0.67, "learning_rate": 6.412250187090511e-05, "loss": 2.2709, "step": 53832 }, { "epoch": 0.67, "learning_rate": 6.409798295404506e-05, "loss": 2.2543, "step": 53840 }, { "epoch": 0.67, "learning_rate": 6.407346864089724e-05, "loss": 2.2834, "step": 53848 }, { "epoch": 0.67, "learning_rate": 6.40489589339202e-05, "loss": 2.286, "step": 53856 }, { "epoch": 0.67, "learning_rate": 6.402445383557225e-05, "loss": 2.2441, "step": 53864 }, { "epoch": 0.67, "learning_rate": 6.399995334831108e-05, "loss": 2.265, "step": 53872 }, { "epoch": 0.67, "learning_rate": 6.397545747459393e-05, "loss": 2.2759, "step": 53880 }, { "epoch": 0.67, "learning_rate": 6.395096621687761e-05, "loss": 2.2908, "step": 53888 }, { "epoch": 0.67, "learning_rate": 6.392647957761846e-05, "loss": 2.2623, "step": 53896 }, { "epoch": 0.67, "learning_rate": 6.390199755927231e-05, "loss": 2.2807, "step": 53904 }, { "epoch": 0.67, "learning_rate": 6.387752016429462e-05, "loss": 2.2465, "step": 53912 }, { "epoch": 0.67, "learning_rate": 6.38530473951403e-05, "loss": 2.276, "step": 53920 }, { "epoch": 0.67, "learning_rate": 6.382857925426387e-05, "loss": 2.2514, "step": 53928 }, { "epoch": 0.67, "learning_rate": 6.380411574411931e-05, "loss": 2.2681, "step": 53936 }, { "epoch": 0.67, "learning_rate": 6.377965686716017e-05, "loss": 2.2814, "step": 53944 }, { "epoch": 0.67, "learning_rate": 6.375520262583954e-05, "loss": 2.2729, "step": 53952 }, { "epoch": 0.67, "learning_rate": 6.373075302261006e-05, "loss": 2.2882, "step": 53960 }, { "epoch": 0.67, "learning_rate": 6.370630805992387e-05, "loss": 2.2634, "step": 53968 }, { "epoch": 0.67, "learning_rate": 6.368186774023268e-05, "loss": 2.2844, "step": 53976 }, { "epoch": 0.67, "learning_rate": 6.36574320659877e-05, "loss": 2.2724, "step": 53984 }, { "epoch": 0.67, "learning_rate": 6.363300103963967e-05, "loss": 2.26, "step": 53992 }, { "epoch": 0.68, "learning_rate": 6.360857466363893e-05, "loss": 2.2622, "step": 54000 }, { "epoch": 0.68, "learning_rate": 6.358415294043525e-05, "loss": 2.2565, "step": 54008 }, { "epoch": 0.68, "learning_rate": 6.355973587247807e-05, "loss": 2.2832, "step": 54016 }, { "epoch": 0.68, "learning_rate": 6.353532346221622e-05, "loss": 2.2691, "step": 54024 }, { "epoch": 0.68, "learning_rate": 6.351091571209816e-05, "loss": 2.2593, "step": 54032 }, { "epoch": 0.68, "learning_rate": 6.348651262457179e-05, "loss": 2.2622, "step": 54040 }, { "epoch": 0.68, "learning_rate": 6.346211420208463e-05, "loss": 2.2536, "step": 54048 }, { "epoch": 0.68, "learning_rate": 6.343772044708381e-05, "loss": 2.2908, "step": 54056 }, { "epoch": 0.68, "learning_rate": 6.341333136201568e-05, "loss": 2.2839, "step": 54064 }, { "epoch": 0.68, "learning_rate": 6.338894694932651e-05, "loss": 2.2628, "step": 54072 }, { "epoch": 0.68, "learning_rate": 6.336456721146185e-05, "loss": 2.273, "step": 54080 }, { "epoch": 0.68, "learning_rate": 6.334019215086682e-05, "loss": 2.2552, "step": 54088 }, { "epoch": 0.68, "learning_rate": 6.331582176998616e-05, "loss": 2.2683, "step": 54096 }, { "epoch": 0.68, "learning_rate": 6.3291456071264e-05, "loss": 2.2824, "step": 54104 }, { "epoch": 0.68, "learning_rate": 6.326709505714417e-05, "loss": 2.2882, "step": 54112 }, { "epoch": 0.68, "learning_rate": 6.324273873006992e-05, "loss": 2.2738, "step": 54120 }, { "epoch": 0.68, "learning_rate": 6.321838709248397e-05, "loss": 2.2767, "step": 54128 }, { "epoch": 0.68, "learning_rate": 6.319404014682875e-05, "loss": 2.2539, "step": 54136 }, { "epoch": 0.68, "learning_rate": 6.316969789554607e-05, "loss": 2.2655, "step": 54144 }, { "epoch": 0.68, "learning_rate": 6.314536034107736e-05, "loss": 2.2856, "step": 54152 }, { "epoch": 0.68, "learning_rate": 6.312102748586355e-05, "loss": 2.2747, "step": 54160 }, { "epoch": 0.68, "learning_rate": 6.309669933234498e-05, "loss": 2.2792, "step": 54168 }, { "epoch": 0.68, "learning_rate": 6.307237588296173e-05, "loss": 2.2684, "step": 54176 }, { "epoch": 0.68, "learning_rate": 6.304805714015327e-05, "loss": 2.2682, "step": 54184 }, { "epoch": 0.68, "learning_rate": 6.302374310635863e-05, "loss": 2.2747, "step": 54192 }, { "epoch": 0.68, "learning_rate": 6.29994337840164e-05, "loss": 2.2831, "step": 54200 }, { "epoch": 0.68, "learning_rate": 6.297512917556461e-05, "loss": 2.2631, "step": 54208 }, { "epoch": 0.68, "learning_rate": 6.295082928344092e-05, "loss": 2.2917, "step": 54216 }, { "epoch": 0.68, "learning_rate": 6.292653411008246e-05, "loss": 2.281, "step": 54224 }, { "epoch": 0.68, "learning_rate": 6.290224365792588e-05, "loss": 2.2734, "step": 54232 }, { "epoch": 0.68, "learning_rate": 6.287795792940737e-05, "loss": 2.2574, "step": 54240 }, { "epoch": 0.68, "learning_rate": 6.285367692696273e-05, "loss": 2.2587, "step": 54248 }, { "epoch": 0.68, "learning_rate": 6.282940065302714e-05, "loss": 2.2796, "step": 54256 }, { "epoch": 0.68, "learning_rate": 6.280512911003536e-05, "loss": 2.264, "step": 54264 }, { "epoch": 0.68, "learning_rate": 6.278086230042172e-05, "loss": 2.2584, "step": 54272 }, { "epoch": 0.68, "learning_rate": 6.275660022661999e-05, "loss": 2.2865, "step": 54280 }, { "epoch": 0.68, "learning_rate": 6.273234289106363e-05, "loss": 2.274, "step": 54288 }, { "epoch": 0.68, "learning_rate": 6.27080902961854e-05, "loss": 2.2589, "step": 54296 }, { "epoch": 0.68, "learning_rate": 6.268384244441773e-05, "loss": 2.2627, "step": 54304 }, { "epoch": 0.68, "learning_rate": 6.265959933819261e-05, "loss": 2.2744, "step": 54312 }, { "epoch": 0.68, "learning_rate": 6.263536097994136e-05, "loss": 2.2822, "step": 54320 }, { "epoch": 0.68, "learning_rate": 6.26111273720951e-05, "loss": 2.2866, "step": 54328 }, { "epoch": 0.68, "learning_rate": 6.258689851708421e-05, "loss": 2.2814, "step": 54336 }, { "epoch": 0.68, "learning_rate": 6.25626744173387e-05, "loss": 2.2806, "step": 54344 }, { "epoch": 0.68, "learning_rate": 6.253845507528822e-05, "loss": 2.2825, "step": 54352 }, { "epoch": 0.68, "learning_rate": 6.25142404933617e-05, "loss": 2.2819, "step": 54360 }, { "epoch": 0.68, "learning_rate": 6.249003067398782e-05, "loss": 2.2882, "step": 54368 }, { "epoch": 0.68, "learning_rate": 6.246582561959468e-05, "loss": 2.2593, "step": 54376 }, { "epoch": 0.68, "learning_rate": 6.244162533260984e-05, "loss": 2.2862, "step": 54384 }, { "epoch": 0.68, "learning_rate": 6.241742981546058e-05, "loss": 2.2794, "step": 54392 }, { "epoch": 0.68, "learning_rate": 6.239323907057337e-05, "loss": 2.2554, "step": 54400 }, { "epoch": 0.68, "learning_rate": 6.23690531003746e-05, "loss": 2.2451, "step": 54408 }, { "epoch": 0.68, "learning_rate": 6.234487190728991e-05, "loss": 2.2504, "step": 54416 }, { "epoch": 0.68, "learning_rate": 6.232069549374453e-05, "loss": 2.2822, "step": 54424 }, { "epoch": 0.68, "learning_rate": 6.229652386216323e-05, "loss": 2.2772, "step": 54432 }, { "epoch": 0.68, "learning_rate": 6.227235701497027e-05, "loss": 2.2761, "step": 54440 }, { "epoch": 0.68, "learning_rate": 6.224819495458949e-05, "loss": 2.2802, "step": 54448 }, { "epoch": 0.68, "learning_rate": 6.222403768344415e-05, "loss": 2.2857, "step": 54456 }, { "epoch": 0.68, "learning_rate": 6.219988520395714e-05, "loss": 2.2694, "step": 54464 }, { "epoch": 0.68, "learning_rate": 6.21757375185508e-05, "loss": 2.2837, "step": 54472 }, { "epoch": 0.68, "learning_rate": 6.215159462964698e-05, "loss": 2.2831, "step": 54480 }, { "epoch": 0.68, "learning_rate": 6.21274565396671e-05, "loss": 2.2381, "step": 54488 }, { "epoch": 0.68, "learning_rate": 6.210332325103206e-05, "loss": 2.2809, "step": 54496 }, { "epoch": 0.68, "learning_rate": 6.20791947661623e-05, "loss": 2.272, "step": 54504 }, { "epoch": 0.68, "learning_rate": 6.205507108747778e-05, "loss": 2.2464, "step": 54512 }, { "epoch": 0.68, "learning_rate": 6.203095221739795e-05, "loss": 2.2502, "step": 54520 }, { "epoch": 0.68, "learning_rate": 6.200683815834182e-05, "loss": 2.2613, "step": 54528 }, { "epoch": 0.68, "learning_rate": 6.198272891272787e-05, "loss": 2.2576, "step": 54536 }, { "epoch": 0.68, "learning_rate": 6.195862448297411e-05, "loss": 2.2672, "step": 54544 }, { "epoch": 0.68, "learning_rate": 6.193452487149813e-05, "loss": 2.2606, "step": 54552 }, { "epoch": 0.68, "learning_rate": 6.191043008071693e-05, "loss": 2.2686, "step": 54560 }, { "epoch": 0.68, "learning_rate": 6.188634011304712e-05, "loss": 2.2691, "step": 54568 }, { "epoch": 0.68, "learning_rate": 6.186225497090473e-05, "loss": 2.2628, "step": 54576 }, { "epoch": 0.68, "learning_rate": 6.183817465670547e-05, "loss": 2.2769, "step": 54584 }, { "epoch": 0.68, "learning_rate": 6.181409917286431e-05, "loss": 2.2716, "step": 54592 }, { "epoch": 0.68, "learning_rate": 6.179002852179605e-05, "loss": 2.2835, "step": 54600 }, { "epoch": 0.68, "learning_rate": 6.176596270591473e-05, "loss": 2.2653, "step": 54608 }, { "epoch": 0.68, "learning_rate": 6.174190172763397e-05, "loss": 2.2832, "step": 54616 }, { "epoch": 0.68, "learning_rate": 6.171784558936713e-05, "loss": 2.2436, "step": 54624 }, { "epoch": 0.68, "learning_rate": 6.169379429352671e-05, "loss": 2.2732, "step": 54632 }, { "epoch": 0.68, "learning_rate": 6.166974784252504e-05, "loss": 2.261, "step": 54640 }, { "epoch": 0.68, "learning_rate": 6.164570623877384e-05, "loss": 2.2606, "step": 54648 }, { "epoch": 0.68, "learning_rate": 6.162166948468425e-05, "loss": 2.257, "step": 54656 }, { "epoch": 0.68, "learning_rate": 6.159763758266715e-05, "loss": 2.2697, "step": 54664 }, { "epoch": 0.68, "learning_rate": 6.157361053513266e-05, "loss": 2.2682, "step": 54672 }, { "epoch": 0.68, "learning_rate": 6.154958834449068e-05, "loss": 2.268, "step": 54680 }, { "epoch": 0.68, "learning_rate": 6.152557101315049e-05, "loss": 2.2837, "step": 54688 }, { "epoch": 0.68, "learning_rate": 6.15015585435208e-05, "loss": 2.2711, "step": 54696 }, { "epoch": 0.68, "learning_rate": 6.147755093800997e-05, "loss": 2.2931, "step": 54704 }, { "epoch": 0.68, "learning_rate": 6.145354819902587e-05, "loss": 2.2788, "step": 54712 }, { "epoch": 0.68, "learning_rate": 6.142955032897581e-05, "loss": 2.2638, "step": 54720 }, { "epoch": 0.68, "learning_rate": 6.140555733026667e-05, "loss": 2.2666, "step": 54728 }, { "epoch": 0.68, "learning_rate": 6.138156920530469e-05, "loss": 2.2791, "step": 54736 }, { "epoch": 0.68, "learning_rate": 6.135758595649588e-05, "loss": 2.2696, "step": 54744 }, { "epoch": 0.68, "learning_rate": 6.133360758624557e-05, "loss": 2.2699, "step": 54752 }, { "epoch": 0.68, "learning_rate": 6.130963409695866e-05, "loss": 2.2608, "step": 54760 }, { "epoch": 0.68, "learning_rate": 6.128566549103957e-05, "loss": 2.2895, "step": 54768 }, { "epoch": 0.68, "learning_rate": 6.126170177089219e-05, "loss": 2.2695, "step": 54776 }, { "epoch": 0.68, "learning_rate": 6.123774293891995e-05, "loss": 2.2903, "step": 54784 }, { "epoch": 0.68, "learning_rate": 6.12137889975258e-05, "loss": 2.2801, "step": 54792 }, { "epoch": 0.69, "learning_rate": 6.118983994911218e-05, "loss": 2.2504, "step": 54800 }, { "epoch": 0.69, "learning_rate": 6.116589579608103e-05, "loss": 2.2872, "step": 54808 }, { "epoch": 0.69, "learning_rate": 6.114195654083382e-05, "loss": 2.2883, "step": 54816 }, { "epoch": 0.69, "learning_rate": 6.111802218577154e-05, "loss": 2.2679, "step": 54824 }, { "epoch": 0.69, "learning_rate": 6.109409273329463e-05, "loss": 2.2644, "step": 54832 }, { "epoch": 0.69, "learning_rate": 6.107016818580312e-05, "loss": 2.2748, "step": 54840 }, { "epoch": 0.69, "learning_rate": 6.104624854569645e-05, "loss": 2.2744, "step": 54848 }, { "epoch": 0.69, "learning_rate": 6.1022333815373746e-05, "loss": 2.2944, "step": 54856 }, { "epoch": 0.69, "learning_rate": 6.099842399723338e-05, "loss": 2.2649, "step": 54864 }, { "epoch": 0.69, "learning_rate": 6.097451909367343e-05, "loss": 2.2415, "step": 54872 }, { "epoch": 0.69, "learning_rate": 6.095061910709143e-05, "loss": 2.2486, "step": 54880 }, { "epoch": 0.69, "learning_rate": 6.0926724039884376e-05, "loss": 2.2646, "step": 54888 }, { "epoch": 0.69, "learning_rate": 6.090283389444891e-05, "loss": 2.2895, "step": 54896 }, { "epoch": 0.69, "learning_rate": 6.0878948673180935e-05, "loss": 2.2561, "step": 54904 }, { "epoch": 0.69, "learning_rate": 6.085506837847608e-05, "loss": 2.2644, "step": 54912 }, { "epoch": 0.69, "learning_rate": 6.083119301272944e-05, "loss": 2.27, "step": 54920 }, { "epoch": 0.69, "learning_rate": 6.080732257833548e-05, "loss": 2.2816, "step": 54928 }, { "epoch": 0.69, "learning_rate": 6.078345707768838e-05, "loss": 2.2742, "step": 54936 }, { "epoch": 0.69, "learning_rate": 6.0759596513181595e-05, "loss": 2.286, "step": 54944 }, { "epoch": 0.69, "learning_rate": 6.07357408872083e-05, "loss": 2.2715, "step": 54952 }, { "epoch": 0.69, "learning_rate": 6.071189020216109e-05, "loss": 2.2711, "step": 54960 }, { "epoch": 0.69, "learning_rate": 6.0688044460431944e-05, "loss": 2.2957, "step": 54968 }, { "epoch": 0.69, "learning_rate": 6.0664203664412545e-05, "loss": 2.275, "step": 54976 }, { "epoch": 0.69, "learning_rate": 6.064036781649397e-05, "loss": 2.2658, "step": 54984 }, { "epoch": 0.69, "learning_rate": 6.0616536919066814e-05, "loss": 2.2451, "step": 54992 }, { "epoch": 0.69, "learning_rate": 6.059271097452124e-05, "loss": 2.2754, "step": 55000 }, { "epoch": 0.69, "learning_rate": 6.05688899852467e-05, "loss": 2.2712, "step": 55008 }, { "epoch": 0.69, "learning_rate": 6.054507395363245e-05, "loss": 2.2475, "step": 55016 }, { "epoch": 0.69, "learning_rate": 6.052126288206705e-05, "loss": 2.2858, "step": 55024 }, { "epoch": 0.69, "learning_rate": 6.049745677293863e-05, "loss": 2.2794, "step": 55032 }, { "epoch": 0.69, "learning_rate": 6.0473655628634786e-05, "loss": 2.2723, "step": 55040 }, { "epoch": 0.69, "learning_rate": 6.0449859451542666e-05, "loss": 2.2859, "step": 55048 }, { "epoch": 0.69, "learning_rate": 6.042606824404886e-05, "loss": 2.2635, "step": 55056 }, { "epoch": 0.69, "learning_rate": 6.04022820085395e-05, "loss": 2.2732, "step": 55064 }, { "epoch": 0.69, "learning_rate": 6.037850074740025e-05, "loss": 2.2564, "step": 55072 }, { "epoch": 0.69, "learning_rate": 6.0354724463016174e-05, "loss": 2.2786, "step": 55080 }, { "epoch": 0.69, "learning_rate": 6.0330953157771955e-05, "loss": 2.2669, "step": 55088 }, { "epoch": 0.69, "learning_rate": 6.030718683405168e-05, "loss": 2.2575, "step": 55096 }, { "epoch": 0.69, "learning_rate": 6.0283425494238996e-05, "loss": 2.2893, "step": 55104 }, { "epoch": 0.69, "learning_rate": 6.025966914071701e-05, "loss": 2.2761, "step": 55112 }, { "epoch": 0.69, "learning_rate": 6.0235917775868346e-05, "loss": 2.278, "step": 55120 }, { "epoch": 0.69, "learning_rate": 6.0212171402075224e-05, "loss": 2.2733, "step": 55128 }, { "epoch": 0.69, "learning_rate": 6.018843002171914e-05, "loss": 2.2978, "step": 55136 }, { "epoch": 0.69, "learning_rate": 6.016469363718127e-05, "loss": 2.2715, "step": 55144 }, { "epoch": 0.69, "learning_rate": 6.014096225084229e-05, "loss": 2.2603, "step": 55152 }, { "epoch": 0.69, "learning_rate": 6.011723586508222e-05, "loss": 2.2685, "step": 55160 }, { "epoch": 0.69, "learning_rate": 6.009351448228081e-05, "loss": 2.2771, "step": 55168 }, { "epoch": 0.69, "learning_rate": 6.0069798104817075e-05, "loss": 2.266, "step": 55176 }, { "epoch": 0.69, "learning_rate": 6.004608673506965e-05, "loss": 2.2639, "step": 55184 }, { "epoch": 0.69, "learning_rate": 6.002238037541672e-05, "loss": 2.2898, "step": 55192 }, { "epoch": 0.69, "learning_rate": 5.999867902823579e-05, "loss": 2.2684, "step": 55200 }, { "epoch": 0.69, "learning_rate": 5.997498269590407e-05, "loss": 2.2887, "step": 55208 }, { "epoch": 0.69, "learning_rate": 5.995129138079816e-05, "loss": 2.289, "step": 55216 }, { "epoch": 0.69, "learning_rate": 5.992760508529405e-05, "loss": 2.2609, "step": 55224 }, { "epoch": 0.69, "learning_rate": 5.990392381176751e-05, "loss": 2.2702, "step": 55232 }, { "epoch": 0.69, "learning_rate": 5.988024756259348e-05, "loss": 2.2953, "step": 55240 }, { "epoch": 0.69, "learning_rate": 5.985657634014665e-05, "loss": 2.2795, "step": 55248 }, { "epoch": 0.69, "learning_rate": 5.9832910146801125e-05, "loss": 2.2674, "step": 55256 }, { "epoch": 0.69, "learning_rate": 5.980924898493039e-05, "loss": 2.2614, "step": 55264 }, { "epoch": 0.69, "learning_rate": 5.9785592856907614e-05, "loss": 2.2792, "step": 55272 }, { "epoch": 0.69, "learning_rate": 5.976194176510533e-05, "loss": 2.2681, "step": 55280 }, { "epoch": 0.69, "learning_rate": 5.973829571189564e-05, "loss": 2.2708, "step": 55288 }, { "epoch": 0.69, "learning_rate": 5.9714654699650075e-05, "loss": 2.2622, "step": 55296 }, { "epoch": 0.69, "learning_rate": 5.9691018730739726e-05, "loss": 2.2725, "step": 55304 }, { "epoch": 0.69, "learning_rate": 5.966738780753514e-05, "loss": 2.2564, "step": 55312 }, { "epoch": 0.69, "learning_rate": 5.964376193240634e-05, "loss": 2.276, "step": 55320 }, { "epoch": 0.69, "learning_rate": 5.962014110772289e-05, "loss": 2.2865, "step": 55328 }, { "epoch": 0.69, "learning_rate": 5.9596525335853815e-05, "loss": 2.2658, "step": 55336 }, { "epoch": 0.69, "learning_rate": 5.957291461916765e-05, "loss": 2.2823, "step": 55344 }, { "epoch": 0.69, "learning_rate": 5.95493089600324e-05, "loss": 2.2641, "step": 55352 }, { "epoch": 0.69, "learning_rate": 5.952570836081561e-05, "loss": 2.2554, "step": 55360 }, { "epoch": 0.69, "learning_rate": 5.950211282388427e-05, "loss": 2.2621, "step": 55368 }, { "epoch": 0.69, "learning_rate": 5.947852235160486e-05, "loss": 2.2807, "step": 55376 }, { "epoch": 0.69, "learning_rate": 5.945493694634341e-05, "loss": 2.2777, "step": 55384 }, { "epoch": 0.69, "learning_rate": 5.943135661046536e-05, "loss": 2.2646, "step": 55392 }, { "epoch": 0.69, "learning_rate": 5.940778134633571e-05, "loss": 2.2526, "step": 55400 }, { "epoch": 0.69, "learning_rate": 5.938421115631892e-05, "loss": 2.2508, "step": 55408 }, { "epoch": 0.69, "learning_rate": 5.936064604277891e-05, "loss": 2.2786, "step": 55416 }, { "epoch": 0.69, "learning_rate": 5.933708600807924e-05, "loss": 2.2653, "step": 55424 }, { "epoch": 0.69, "learning_rate": 5.931353105458273e-05, "loss": 2.2778, "step": 55432 }, { "epoch": 0.69, "learning_rate": 5.928998118465185e-05, "loss": 2.2677, "step": 55440 }, { "epoch": 0.69, "learning_rate": 5.926643640064852e-05, "loss": 2.2546, "step": 55448 }, { "epoch": 0.69, "learning_rate": 5.924289670493413e-05, "loss": 2.2786, "step": 55456 }, { "epoch": 0.69, "learning_rate": 5.921936209986962e-05, "loss": 2.2825, "step": 55464 }, { "epoch": 0.69, "learning_rate": 5.919583258781531e-05, "loss": 2.2567, "step": 55472 }, { "epoch": 0.69, "learning_rate": 5.9172308171131173e-05, "loss": 2.2801, "step": 55480 }, { "epoch": 0.69, "learning_rate": 5.914878885217653e-05, "loss": 2.2859, "step": 55488 }, { "epoch": 0.69, "learning_rate": 5.912527463331016e-05, "loss": 2.2617, "step": 55496 }, { "epoch": 0.69, "learning_rate": 5.910176551689055e-05, "loss": 2.2625, "step": 55504 }, { "epoch": 0.69, "learning_rate": 5.907826150527538e-05, "loss": 2.2537, "step": 55512 }, { "epoch": 0.69, "learning_rate": 5.905476260082208e-05, "loss": 2.2667, "step": 55520 }, { "epoch": 0.69, "learning_rate": 5.903126880588744e-05, "loss": 2.2586, "step": 55528 }, { "epoch": 0.69, "learning_rate": 5.900778012282767e-05, "loss": 2.2778, "step": 55536 }, { "epoch": 0.69, "learning_rate": 5.8984296553998666e-05, "loss": 2.2604, "step": 55544 }, { "epoch": 0.69, "learning_rate": 5.8960818101755636e-05, "loss": 2.2686, "step": 55552 }, { "epoch": 0.69, "learning_rate": 5.893734476845334e-05, "loss": 2.2647, "step": 55560 }, { "epoch": 0.69, "learning_rate": 5.891387655644607e-05, "loss": 2.2729, "step": 55568 }, { "epoch": 0.69, "learning_rate": 5.889041346808743e-05, "loss": 2.2707, "step": 55576 }, { "epoch": 0.69, "learning_rate": 5.886695550573076e-05, "loss": 2.2921, "step": 55584 }, { "epoch": 0.69, "learning_rate": 5.884350267172874e-05, "loss": 2.2302, "step": 55592 }, { "epoch": 0.69, "learning_rate": 5.88200549684335e-05, "loss": 2.282, "step": 55600 }, { "epoch": 0.7, "learning_rate": 5.879661239819676e-05, "loss": 2.2733, "step": 55608 }, { "epoch": 0.7, "learning_rate": 5.877317496336965e-05, "loss": 2.2822, "step": 55616 }, { "epoch": 0.7, "learning_rate": 5.874974266630284e-05, "loss": 2.2679, "step": 55624 }, { "epoch": 0.7, "learning_rate": 5.872631550934643e-05, "loss": 2.262, "step": 55632 }, { "epoch": 0.7, "learning_rate": 5.870289349485004e-05, "loss": 2.2876, "step": 55640 }, { "epoch": 0.7, "learning_rate": 5.867947662516278e-05, "loss": 2.2759, "step": 55648 }, { "epoch": 0.7, "learning_rate": 5.8656064902633204e-05, "loss": 2.258, "step": 55656 }, { "epoch": 0.7, "learning_rate": 5.863265832960939e-05, "loss": 2.265, "step": 55664 }, { "epoch": 0.7, "learning_rate": 5.860925690843888e-05, "loss": 2.2727, "step": 55672 }, { "epoch": 0.7, "learning_rate": 5.858586064146872e-05, "loss": 2.2719, "step": 55680 }, { "epoch": 0.7, "learning_rate": 5.8562469531045364e-05, "loss": 2.2517, "step": 55688 }, { "epoch": 0.7, "learning_rate": 5.853908357951492e-05, "loss": 2.2744, "step": 55696 }, { "epoch": 0.7, "learning_rate": 5.851570278922276e-05, "loss": 2.2578, "step": 55704 }, { "epoch": 0.7, "learning_rate": 5.849232716251389e-05, "loss": 2.2551, "step": 55712 }, { "epoch": 0.7, "learning_rate": 5.846895670173276e-05, "loss": 2.277, "step": 55720 }, { "epoch": 0.7, "learning_rate": 5.844559140922323e-05, "loss": 2.282, "step": 55728 }, { "epoch": 0.7, "learning_rate": 5.842223128732882e-05, "loss": 2.2623, "step": 55736 }, { "epoch": 0.7, "learning_rate": 5.839887633839234e-05, "loss": 2.2765, "step": 55744 }, { "epoch": 0.7, "learning_rate": 5.837552656475614e-05, "loss": 2.2713, "step": 55752 }, { "epoch": 0.7, "learning_rate": 5.835218196876217e-05, "loss": 2.2692, "step": 55760 }, { "epoch": 0.7, "learning_rate": 5.832884255275163e-05, "loss": 2.2497, "step": 55768 }, { "epoch": 0.7, "learning_rate": 5.830550831906546e-05, "loss": 2.2845, "step": 55776 }, { "epoch": 0.7, "learning_rate": 5.828217927004386e-05, "loss": 2.2795, "step": 55784 }, { "epoch": 0.7, "learning_rate": 5.825885540802658e-05, "loss": 2.2622, "step": 55792 }, { "epoch": 0.7, "learning_rate": 5.8235536735353e-05, "loss": 2.2656, "step": 55800 }, { "epoch": 0.7, "learning_rate": 5.821222325436172e-05, "loss": 2.2807, "step": 55808 }, { "epoch": 0.7, "learning_rate": 5.8188914967391016e-05, "loss": 2.2577, "step": 55816 }, { "epoch": 0.7, "learning_rate": 5.816561187677856e-05, "loss": 2.2703, "step": 55824 }, { "epoch": 0.7, "learning_rate": 5.814231398486154e-05, "loss": 2.2639, "step": 55832 }, { "epoch": 0.7, "learning_rate": 5.8119021293976596e-05, "loss": 2.2767, "step": 55840 }, { "epoch": 0.7, "learning_rate": 5.809573380645981e-05, "loss": 2.2713, "step": 55848 }, { "epoch": 0.7, "learning_rate": 5.807245152464682e-05, "loss": 2.2572, "step": 55856 }, { "epoch": 0.7, "learning_rate": 5.8049174450872726e-05, "loss": 2.2706, "step": 55864 }, { "epoch": 0.7, "learning_rate": 5.802590258747205e-05, "loss": 2.2631, "step": 55872 }, { "epoch": 0.7, "learning_rate": 5.8002635936778834e-05, "loss": 2.271, "step": 55880 }, { "epoch": 0.7, "learning_rate": 5.7979374501126624e-05, "loss": 2.266, "step": 55888 }, { "epoch": 0.7, "learning_rate": 5.795611828284837e-05, "loss": 2.2911, "step": 55896 }, { "epoch": 0.7, "learning_rate": 5.793286728427656e-05, "loss": 2.2669, "step": 55904 }, { "epoch": 0.7, "learning_rate": 5.790962150774313e-05, "loss": 2.2657, "step": 55912 }, { "epoch": 0.7, "learning_rate": 5.78863809555795e-05, "loss": 2.2661, "step": 55920 }, { "epoch": 0.7, "learning_rate": 5.786314563011658e-05, "loss": 2.2503, "step": 55928 }, { "epoch": 0.7, "learning_rate": 5.783991553368473e-05, "loss": 2.2751, "step": 55936 }, { "epoch": 0.7, "learning_rate": 5.781669066861378e-05, "loss": 2.2949, "step": 55944 }, { "epoch": 0.7, "learning_rate": 5.7793471037233084e-05, "loss": 2.2709, "step": 55952 }, { "epoch": 0.7, "learning_rate": 5.7770256641871414e-05, "loss": 2.2662, "step": 55960 }, { "epoch": 0.7, "learning_rate": 5.7747047484857065e-05, "loss": 2.2744, "step": 55968 }, { "epoch": 0.7, "learning_rate": 5.772384356851777e-05, "loss": 2.2479, "step": 55976 }, { "epoch": 0.7, "learning_rate": 5.7700644895180714e-05, "loss": 2.2681, "step": 55984 }, { "epoch": 0.7, "learning_rate": 5.767745146717269e-05, "loss": 2.2463, "step": 55992 }, { "epoch": 0.7, "learning_rate": 5.7654263286819756e-05, "loss": 2.2881, "step": 56000 }, { "epoch": 0.7, "learning_rate": 5.763108035644766e-05, "loss": 2.2432, "step": 56008 }, { "epoch": 0.7, "learning_rate": 5.760790267838143e-05, "loss": 2.2554, "step": 56016 }, { "epoch": 0.7, "learning_rate": 5.7584730254945675e-05, "loss": 2.2619, "step": 56024 }, { "epoch": 0.7, "learning_rate": 5.756156308846452e-05, "loss": 2.28, "step": 56032 }, { "epoch": 0.7, "learning_rate": 5.753840118126141e-05, "loss": 2.2596, "step": 56040 }, { "epoch": 0.7, "learning_rate": 5.7515244535659416e-05, "loss": 2.239, "step": 56048 }, { "epoch": 0.7, "learning_rate": 5.749209315398103e-05, "loss": 2.2789, "step": 56056 }, { "epoch": 0.7, "learning_rate": 5.746894703854813e-05, "loss": 2.2553, "step": 56064 }, { "epoch": 0.7, "learning_rate": 5.744580619168223e-05, "loss": 2.2766, "step": 56072 }, { "epoch": 0.7, "learning_rate": 5.742267061570412e-05, "loss": 2.2847, "step": 56080 }, { "epoch": 0.7, "learning_rate": 5.739954031293428e-05, "loss": 2.2683, "step": 56088 }, { "epoch": 0.7, "learning_rate": 5.7376415285692507e-05, "loss": 2.2767, "step": 56096 }, { "epoch": 0.7, "learning_rate": 5.735329553629802e-05, "loss": 2.2476, "step": 56104 }, { "epoch": 0.7, "learning_rate": 5.7330181067069746e-05, "loss": 2.2882, "step": 56112 }, { "epoch": 0.7, "learning_rate": 5.730707188032585e-05, "loss": 2.2634, "step": 56120 }, { "epoch": 0.7, "learning_rate": 5.7283967978384066e-05, "loss": 2.2764, "step": 56128 }, { "epoch": 0.7, "learning_rate": 5.726086936356162e-05, "loss": 2.2598, "step": 56136 }, { "epoch": 0.7, "learning_rate": 5.723777603817508e-05, "loss": 2.2751, "step": 56144 }, { "epoch": 0.7, "learning_rate": 5.721468800454067e-05, "loss": 2.2564, "step": 56152 }, { "epoch": 0.7, "learning_rate": 5.719160526497396e-05, "loss": 2.2599, "step": 56160 }, { "epoch": 0.7, "learning_rate": 5.716852782179001e-05, "loss": 2.2691, "step": 56168 }, { "epoch": 0.7, "learning_rate": 5.714545567730334e-05, "loss": 2.2672, "step": 56176 }, { "epoch": 0.7, "learning_rate": 5.7122388833828e-05, "loss": 2.2682, "step": 56184 }, { "epoch": 0.7, "learning_rate": 5.709932729367744e-05, "loss": 2.2751, "step": 56192 }, { "epoch": 0.7, "learning_rate": 5.707627105916459e-05, "loss": 2.2817, "step": 56200 }, { "epoch": 0.7, "learning_rate": 5.705322013260186e-05, "loss": 2.2707, "step": 56208 }, { "epoch": 0.7, "learning_rate": 5.703017451630115e-05, "loss": 2.2448, "step": 56216 }, { "epoch": 0.7, "learning_rate": 5.70071342125738e-05, "loss": 2.2641, "step": 56224 }, { "epoch": 0.7, "learning_rate": 5.69840992237306e-05, "loss": 2.2874, "step": 56232 }, { "epoch": 0.7, "learning_rate": 5.6961069552081846e-05, "loss": 2.2596, "step": 56240 }, { "epoch": 0.7, "learning_rate": 5.693804519993728e-05, "loss": 2.2775, "step": 56248 }, { "epoch": 0.7, "learning_rate": 5.69150261696061e-05, "loss": 2.2741, "step": 56256 }, { "epoch": 0.7, "learning_rate": 5.689201246339705e-05, "loss": 2.294, "step": 56264 }, { "epoch": 0.7, "learning_rate": 5.6869004083618196e-05, "loss": 2.2568, "step": 56272 }, { "epoch": 0.7, "learning_rate": 5.684600103257716e-05, "loss": 2.2354, "step": 56280 }, { "epoch": 0.7, "learning_rate": 5.682300331258104e-05, "loss": 2.2833, "step": 56288 }, { "epoch": 0.7, "learning_rate": 5.680001092593634e-05, "loss": 2.2695, "step": 56296 }, { "epoch": 0.7, "learning_rate": 5.6777023874949166e-05, "loss": 2.2639, "step": 56304 }, { "epoch": 0.7, "learning_rate": 5.675404216192489e-05, "loss": 2.2588, "step": 56312 }, { "epoch": 0.7, "learning_rate": 5.673106578916845e-05, "loss": 2.2589, "step": 56320 }, { "epoch": 0.7, "learning_rate": 5.670809475898432e-05, "loss": 2.2599, "step": 56328 }, { "epoch": 0.7, "learning_rate": 5.668512907367626e-05, "loss": 2.2749, "step": 56336 }, { "epoch": 0.7, "learning_rate": 5.6662168735547704e-05, "loss": 2.2416, "step": 56344 }, { "epoch": 0.7, "learning_rate": 5.6639213746901354e-05, "loss": 2.2671, "step": 56352 }, { "epoch": 0.7, "learning_rate": 5.661626411003953e-05, "loss": 2.2778, "step": 56360 }, { "epoch": 0.7, "learning_rate": 5.6593319827263955e-05, "loss": 2.261, "step": 56368 }, { "epoch": 0.7, "learning_rate": 5.6570380900875716e-05, "loss": 2.2711, "step": 56376 }, { "epoch": 0.7, "learning_rate": 5.6547447333175574e-05, "loss": 2.2877, "step": 56384 }, { "epoch": 0.7, "learning_rate": 5.6524519126463573e-05, "loss": 2.2705, "step": 56392 }, { "epoch": 0.7, "learning_rate": 5.65015962830393e-05, "loss": 2.2777, "step": 56400 }, { "epoch": 0.71, "learning_rate": 5.647867880520181e-05, "loss": 2.2828, "step": 56408 }, { "epoch": 0.71, "learning_rate": 5.6455766695249505e-05, "loss": 2.2532, "step": 56416 }, { "epoch": 0.71, "learning_rate": 5.643285995548042e-05, "loss": 2.2847, "step": 56424 }, { "epoch": 0.71, "learning_rate": 5.640995858819196e-05, "loss": 2.2827, "step": 56432 }, { "epoch": 0.71, "learning_rate": 5.6387062595681006e-05, "loss": 2.2645, "step": 56440 }, { "epoch": 0.71, "learning_rate": 5.6364171980243886e-05, "loss": 2.2786, "step": 56448 }, { "epoch": 0.71, "learning_rate": 5.634128674417638e-05, "loss": 2.281, "step": 56456 }, { "epoch": 0.71, "learning_rate": 5.631840688977379e-05, "loss": 2.245, "step": 56464 }, { "epoch": 0.71, "learning_rate": 5.629553241933079e-05, "loss": 2.2676, "step": 56472 }, { "epoch": 0.71, "learning_rate": 5.627266333514161e-05, "loss": 2.2848, "step": 56480 }, { "epoch": 0.71, "learning_rate": 5.6249799639499835e-05, "loss": 2.2738, "step": 56488 }, { "epoch": 0.71, "learning_rate": 5.622694133469861e-05, "loss": 2.2708, "step": 56496 }, { "epoch": 0.71, "learning_rate": 5.6204088423030466e-05, "loss": 2.259, "step": 56504 }, { "epoch": 0.71, "learning_rate": 5.618124090678742e-05, "loss": 2.2692, "step": 56512 }, { "epoch": 0.71, "learning_rate": 5.6158398788260965e-05, "loss": 2.2709, "step": 56520 }, { "epoch": 0.71, "learning_rate": 5.6135562069742e-05, "loss": 2.2678, "step": 56528 }, { "epoch": 0.71, "learning_rate": 5.6112730753521e-05, "loss": 2.2614, "step": 56536 }, { "epoch": 0.71, "learning_rate": 5.608990484188774e-05, "loss": 2.2572, "step": 56544 }, { "epoch": 0.71, "learning_rate": 5.606708433713155e-05, "loss": 2.2752, "step": 56552 }, { "epoch": 0.71, "learning_rate": 5.6044269241541206e-05, "loss": 2.2738, "step": 56560 }, { "epoch": 0.71, "learning_rate": 5.60214595574049e-05, "loss": 2.2668, "step": 56568 }, { "epoch": 0.71, "learning_rate": 5.5998655287010385e-05, "loss": 2.2562, "step": 56576 }, { "epoch": 0.71, "learning_rate": 5.597585643264474e-05, "loss": 2.2596, "step": 56584 }, { "epoch": 0.71, "learning_rate": 5.595306299659454e-05, "loss": 2.2523, "step": 56592 }, { "epoch": 0.71, "learning_rate": 5.5930274981145935e-05, "loss": 2.2567, "step": 56600 }, { "epoch": 0.71, "learning_rate": 5.590749238858432e-05, "loss": 2.2804, "step": 56608 }, { "epoch": 0.71, "learning_rate": 5.588471522119476e-05, "loss": 2.2616, "step": 56616 }, { "epoch": 0.71, "learning_rate": 5.5861943481261616e-05, "loss": 2.2752, "step": 56624 }, { "epoch": 0.71, "learning_rate": 5.5839177171068735e-05, "loss": 2.2702, "step": 56632 }, { "epoch": 0.71, "learning_rate": 5.581641629289956e-05, "loss": 2.2637, "step": 56640 }, { "epoch": 0.71, "learning_rate": 5.579366084903675e-05, "loss": 2.2654, "step": 56648 }, { "epoch": 0.71, "learning_rate": 5.5770910841762626e-05, "loss": 2.2566, "step": 56656 }, { "epoch": 0.71, "learning_rate": 5.57481662733589e-05, "loss": 2.2758, "step": 56664 }, { "epoch": 0.71, "learning_rate": 5.5725427146106625e-05, "loss": 2.2694, "step": 56672 }, { "epoch": 0.71, "learning_rate": 5.5702693462286546e-05, "loss": 2.2783, "step": 56680 }, { "epoch": 0.71, "learning_rate": 5.567996522417858e-05, "loss": 2.2866, "step": 56688 }, { "epoch": 0.71, "learning_rate": 5.565724243406234e-05, "loss": 2.2718, "step": 56696 }, { "epoch": 0.71, "learning_rate": 5.563452509421674e-05, "loss": 2.2679, "step": 56704 }, { "epoch": 0.71, "learning_rate": 5.5611813206920246e-05, "loss": 2.2636, "step": 56712 }, { "epoch": 0.71, "learning_rate": 5.5589106774450697e-05, "loss": 2.2554, "step": 56720 }, { "epoch": 0.71, "learning_rate": 5.556640579908543e-05, "loss": 2.2621, "step": 56728 }, { "epoch": 0.71, "learning_rate": 5.554371028310122e-05, "loss": 2.2629, "step": 56736 }, { "epoch": 0.71, "learning_rate": 5.552102022877431e-05, "loss": 2.2645, "step": 56744 }, { "epoch": 0.71, "learning_rate": 5.549833563838037e-05, "loss": 2.2709, "step": 56752 }, { "epoch": 0.71, "learning_rate": 5.547565651419455e-05, "loss": 2.2756, "step": 56760 }, { "epoch": 0.71, "learning_rate": 5.545298285849143e-05, "loss": 2.2616, "step": 56768 }, { "epoch": 0.71, "learning_rate": 5.543031467354505e-05, "loss": 2.2743, "step": 56776 }, { "epoch": 0.71, "learning_rate": 5.540765196162888e-05, "loss": 2.2647, "step": 56784 }, { "epoch": 0.71, "learning_rate": 5.5384994725015896e-05, "loss": 2.2598, "step": 56792 }, { "epoch": 0.71, "learning_rate": 5.536234296597846e-05, "loss": 2.2608, "step": 56800 }, { "epoch": 0.71, "learning_rate": 5.5339696686788466e-05, "loss": 2.2827, "step": 56808 }, { "epoch": 0.71, "learning_rate": 5.531705588971714e-05, "loss": 2.2723, "step": 56816 }, { "epoch": 0.71, "learning_rate": 5.5294420577035244e-05, "loss": 2.2785, "step": 56824 }, { "epoch": 0.71, "learning_rate": 5.527179075101303e-05, "loss": 2.2646, "step": 56832 }, { "epoch": 0.71, "learning_rate": 5.5249166413920085e-05, "loss": 2.2802, "step": 56840 }, { "epoch": 0.71, "learning_rate": 5.52265475680255e-05, "loss": 2.2693, "step": 56848 }, { "epoch": 0.71, "learning_rate": 5.520393421559783e-05, "loss": 2.2755, "step": 56856 }, { "epoch": 0.71, "learning_rate": 5.518132635890504e-05, "loss": 2.26, "step": 56864 }, { "epoch": 0.71, "learning_rate": 5.5158724000214655e-05, "loss": 2.2723, "step": 56872 }, { "epoch": 0.71, "learning_rate": 5.513612714179345e-05, "loss": 2.2801, "step": 56880 }, { "epoch": 0.71, "learning_rate": 5.511353578590785e-05, "loss": 2.2602, "step": 56888 }, { "epoch": 0.71, "learning_rate": 5.509094993482362e-05, "loss": 2.2683, "step": 56896 }, { "epoch": 0.71, "learning_rate": 5.506836959080593e-05, "loss": 2.2729, "step": 56904 }, { "epoch": 0.71, "learning_rate": 5.504579475611957e-05, "loss": 2.2713, "step": 56912 }, { "epoch": 0.71, "learning_rate": 5.502322543302856e-05, "loss": 2.258, "step": 56920 }, { "epoch": 0.71, "learning_rate": 5.5000661623796537e-05, "loss": 2.2705, "step": 56928 }, { "epoch": 0.71, "learning_rate": 5.497810333068654e-05, "loss": 2.2685, "step": 56936 }, { "epoch": 0.71, "learning_rate": 5.4955550555960954e-05, "loss": 2.2703, "step": 56944 }, { "epoch": 0.71, "learning_rate": 5.493300330188178e-05, "loss": 2.2767, "step": 56952 }, { "epoch": 0.71, "learning_rate": 5.491046157071034e-05, "loss": 2.2705, "step": 56960 }, { "epoch": 0.71, "learning_rate": 5.488792536470746e-05, "loss": 2.2525, "step": 56968 }, { "epoch": 0.71, "learning_rate": 5.486539468613341e-05, "loss": 2.2978, "step": 56976 }, { "epoch": 0.71, "learning_rate": 5.4842869537247796e-05, "loss": 2.2742, "step": 56984 }, { "epoch": 0.71, "learning_rate": 5.4820349920309864e-05, "loss": 2.2796, "step": 56992 }, { "epoch": 0.71, "learning_rate": 5.4797835837578184e-05, "loss": 2.2635, "step": 57000 }, { "epoch": 0.71, "learning_rate": 5.477532729131076e-05, "loss": 2.2512, "step": 57008 }, { "epoch": 0.71, "learning_rate": 5.475282428376509e-05, "loss": 2.2744, "step": 57016 }, { "epoch": 0.71, "learning_rate": 5.473032681719809e-05, "loss": 2.2679, "step": 57024 }, { "epoch": 0.71, "learning_rate": 5.470783489386615e-05, "loss": 2.2667, "step": 57032 }, { "epoch": 0.71, "learning_rate": 5.468534851602507e-05, "loss": 2.2784, "step": 57040 }, { "epoch": 0.71, "learning_rate": 5.46628676859301e-05, "loss": 2.2628, "step": 57048 }, { "epoch": 0.71, "learning_rate": 5.464039240583594e-05, "loss": 2.2626, "step": 57056 }, { "epoch": 0.71, "learning_rate": 5.4617922677996726e-05, "loss": 2.2883, "step": 57064 }, { "epoch": 0.71, "learning_rate": 5.459545850466607e-05, "loss": 2.2652, "step": 57072 }, { "epoch": 0.71, "learning_rate": 5.4572999888096974e-05, "loss": 2.255, "step": 57080 }, { "epoch": 0.71, "learning_rate": 5.455054683054194e-05, "loss": 2.2658, "step": 57088 }, { "epoch": 0.71, "learning_rate": 5.452809933425282e-05, "loss": 2.266, "step": 57096 }, { "epoch": 0.71, "learning_rate": 5.450565740148108e-05, "loss": 2.2655, "step": 57104 }, { "epoch": 0.71, "learning_rate": 5.448322103447743e-05, "loss": 2.2552, "step": 57112 }, { "epoch": 0.71, "learning_rate": 5.446079023549212e-05, "loss": 2.262, "step": 57120 }, { "epoch": 0.71, "learning_rate": 5.443836500677486e-05, "loss": 2.2891, "step": 57128 }, { "epoch": 0.71, "learning_rate": 5.4415945350574724e-05, "loss": 2.2806, "step": 57136 }, { "epoch": 0.71, "learning_rate": 5.4393531269140374e-05, "loss": 2.2686, "step": 57144 }, { "epoch": 0.71, "learning_rate": 5.437112276471974e-05, "loss": 2.2849, "step": 57152 }, { "epoch": 0.71, "learning_rate": 5.4348719839560235e-05, "loss": 2.2605, "step": 57160 }, { "epoch": 0.71, "learning_rate": 5.432632249590885e-05, "loss": 2.269, "step": 57168 }, { "epoch": 0.71, "learning_rate": 5.430393073601181e-05, "loss": 2.2482, "step": 57176 }, { "epoch": 0.71, "learning_rate": 5.428154456211496e-05, "loss": 2.2798, "step": 57184 }, { "epoch": 0.71, "learning_rate": 5.425916397646347e-05, "loss": 2.264, "step": 57192 }, { "epoch": 0.71, "learning_rate": 5.423678898130194e-05, "loss": 2.2343, "step": 57200 }, { "epoch": 0.72, "learning_rate": 5.421441957887457e-05, "loss": 2.2502, "step": 57208 }, { "epoch": 0.72, "learning_rate": 5.419205577142476e-05, "loss": 2.2836, "step": 57216 }, { "epoch": 0.72, "learning_rate": 5.416969756119556e-05, "loss": 2.2618, "step": 57224 }, { "epoch": 0.72, "learning_rate": 5.414734495042935e-05, "loss": 2.2657, "step": 57232 }, { "epoch": 0.72, "learning_rate": 5.412499794136794e-05, "loss": 2.2765, "step": 57240 }, { "epoch": 0.72, "learning_rate": 5.410265653625268e-05, "loss": 2.2722, "step": 57248 }, { "epoch": 0.72, "learning_rate": 5.408032073732416e-05, "loss": 2.2637, "step": 57256 }, { "epoch": 0.72, "learning_rate": 5.4057990546822654e-05, "loss": 2.2567, "step": 57264 }, { "epoch": 0.72, "learning_rate": 5.4035665966987726e-05, "loss": 2.2322, "step": 57272 }, { "epoch": 0.72, "learning_rate": 5.4013347000058366e-05, "loss": 2.2844, "step": 57280 }, { "epoch": 0.72, "learning_rate": 5.399103364827307e-05, "loss": 2.272, "step": 57288 }, { "epoch": 0.72, "learning_rate": 5.396872591386974e-05, "loss": 2.2665, "step": 57296 }, { "epoch": 0.72, "learning_rate": 5.3946423799085724e-05, "loss": 2.2653, "step": 57304 }, { "epoch": 0.72, "learning_rate": 5.392412730615777e-05, "loss": 2.2621, "step": 57312 }, { "epoch": 0.72, "learning_rate": 5.390183643732209e-05, "loss": 2.2858, "step": 57320 }, { "epoch": 0.72, "learning_rate": 5.387955119481436e-05, "loss": 2.2604, "step": 57328 }, { "epoch": 0.72, "learning_rate": 5.385727158086965e-05, "loss": 2.2699, "step": 57336 }, { "epoch": 0.72, "learning_rate": 5.383499759772248e-05, "loss": 2.2819, "step": 57344 }, { "epoch": 0.72, "learning_rate": 5.3812729247606785e-05, "loss": 2.2717, "step": 57352 }, { "epoch": 0.72, "learning_rate": 5.379046653275599e-05, "loss": 2.2726, "step": 57360 }, { "epoch": 0.72, "learning_rate": 5.3768209455402896e-05, "loss": 2.2539, "step": 57368 }, { "epoch": 0.72, "learning_rate": 5.374595801777977e-05, "loss": 2.2691, "step": 57376 }, { "epoch": 0.72, "learning_rate": 5.372371222211829e-05, "loss": 2.2676, "step": 57384 }, { "epoch": 0.72, "learning_rate": 5.3701472070649606e-05, "loss": 2.2384, "step": 57392 }, { "epoch": 0.72, "learning_rate": 5.3679237565604266e-05, "loss": 2.2666, "step": 57400 }, { "epoch": 0.72, "learning_rate": 5.3657008709212243e-05, "loss": 2.2604, "step": 57408 }, { "epoch": 0.72, "learning_rate": 5.3634785503703046e-05, "loss": 2.2726, "step": 57416 }, { "epoch": 0.72, "learning_rate": 5.361256795130544e-05, "loss": 2.2547, "step": 57424 }, { "epoch": 0.72, "learning_rate": 5.359035605424774e-05, "loss": 2.2619, "step": 57432 }, { "epoch": 0.72, "learning_rate": 5.356814981475774e-05, "loss": 2.2696, "step": 57440 }, { "epoch": 0.72, "learning_rate": 5.354594923506251e-05, "loss": 2.2559, "step": 57448 }, { "epoch": 0.72, "learning_rate": 5.352375431738874e-05, "loss": 2.2776, "step": 57456 }, { "epoch": 0.72, "learning_rate": 5.350156506396236e-05, "loss": 2.2533, "step": 57464 }, { "epoch": 0.72, "learning_rate": 5.347938147700885e-05, "loss": 2.2783, "step": 57472 }, { "epoch": 0.72, "learning_rate": 5.3457203558753166e-05, "loss": 2.259, "step": 57480 }, { "epoch": 0.72, "learning_rate": 5.3435031311419514e-05, "loss": 2.2464, "step": 57488 }, { "epoch": 0.72, "learning_rate": 5.341286473723175e-05, "loss": 2.2748, "step": 57496 }, { "epoch": 0.72, "learning_rate": 5.339070383841304e-05, "loss": 2.2657, "step": 57504 }, { "epoch": 0.72, "learning_rate": 5.3368548617185895e-05, "loss": 2.265, "step": 57512 }, { "epoch": 0.72, "learning_rate": 5.33463990757725e-05, "loss": 2.2693, "step": 57520 }, { "epoch": 0.72, "learning_rate": 5.3324255216394194e-05, "loss": 2.2854, "step": 57528 }, { "epoch": 0.72, "learning_rate": 5.330211704127199e-05, "loss": 2.2615, "step": 57536 }, { "epoch": 0.72, "learning_rate": 5.3279984552626203e-05, "loss": 2.2776, "step": 57544 }, { "epoch": 0.72, "learning_rate": 5.325785775267652e-05, "loss": 2.2665, "step": 57552 }, { "epoch": 0.72, "learning_rate": 5.323573664364221e-05, "loss": 2.2507, "step": 57560 }, { "epoch": 0.72, "learning_rate": 5.321362122774186e-05, "loss": 2.2547, "step": 57568 }, { "epoch": 0.72, "learning_rate": 5.319151150719355e-05, "loss": 2.2663, "step": 57576 }, { "epoch": 0.72, "learning_rate": 5.316940748421473e-05, "loss": 2.2796, "step": 57584 }, { "epoch": 0.72, "learning_rate": 5.314730916102231e-05, "loss": 2.2959, "step": 57592 }, { "epoch": 0.72, "learning_rate": 5.3125216539832645e-05, "loss": 2.2668, "step": 57600 }, { "epoch": 0.72, "learning_rate": 5.31031296228615e-05, "loss": 2.2696, "step": 57608 }, { "epoch": 0.72, "learning_rate": 5.3081048412324045e-05, "loss": 2.2499, "step": 57616 }, { "epoch": 0.72, "learning_rate": 5.305897291043492e-05, "loss": 2.2821, "step": 57624 }, { "epoch": 0.72, "learning_rate": 5.303690311940817e-05, "loss": 2.2699, "step": 57632 }, { "epoch": 0.72, "learning_rate": 5.3014839041457254e-05, "loss": 2.2495, "step": 57640 }, { "epoch": 0.72, "learning_rate": 5.2992780678795105e-05, "loss": 2.2517, "step": 57648 }, { "epoch": 0.72, "learning_rate": 5.297072803363402e-05, "loss": 2.261, "step": 57656 }, { "epoch": 0.72, "learning_rate": 5.2948681108185763e-05, "loss": 2.256, "step": 57664 }, { "epoch": 0.72, "learning_rate": 5.2926639904661534e-05, "loss": 2.2452, "step": 57672 }, { "epoch": 0.72, "learning_rate": 5.290460442527192e-05, "loss": 2.2529, "step": 57680 }, { "epoch": 0.72, "learning_rate": 5.288257467222697e-05, "loss": 2.2699, "step": 57688 }, { "epoch": 0.72, "learning_rate": 5.286055064773613e-05, "loss": 2.2599, "step": 57696 }, { "epoch": 0.72, "learning_rate": 5.283853235400825e-05, "loss": 2.2443, "step": 57704 }, { "epoch": 0.72, "learning_rate": 5.281651979325175e-05, "loss": 2.2547, "step": 57712 }, { "epoch": 0.72, "learning_rate": 5.279451296767426e-05, "loss": 2.27, "step": 57720 }, { "epoch": 0.72, "learning_rate": 5.2772511879482976e-05, "loss": 2.2542, "step": 57728 }, { "epoch": 0.72, "learning_rate": 5.27505165308845e-05, "loss": 2.2607, "step": 57736 }, { "epoch": 0.72, "learning_rate": 5.272852692408476e-05, "loss": 2.2777, "step": 57744 }, { "epoch": 0.72, "learning_rate": 5.270654306128934e-05, "loss": 2.2735, "step": 57752 }, { "epoch": 0.72, "learning_rate": 5.268456494470293e-05, "loss": 2.2563, "step": 57760 }, { "epoch": 0.72, "learning_rate": 5.2662592576529924e-05, "loss": 2.2809, "step": 57768 }, { "epoch": 0.72, "learning_rate": 5.264062595897403e-05, "loss": 2.2711, "step": 57776 }, { "epoch": 0.72, "learning_rate": 5.261866509423827e-05, "loss": 2.2724, "step": 57784 }, { "epoch": 0.72, "learning_rate": 5.259670998452533e-05, "loss": 2.2523, "step": 57792 }, { "epoch": 0.72, "learning_rate": 5.257476063203703e-05, "loss": 2.2774, "step": 57800 }, { "epoch": 0.72, "learning_rate": 5.255281703897489e-05, "loss": 2.2759, "step": 57808 }, { "epoch": 0.72, "learning_rate": 5.253087920753972e-05, "loss": 2.2686, "step": 57816 }, { "epoch": 0.72, "learning_rate": 5.250894713993166e-05, "loss": 2.2651, "step": 57824 }, { "epoch": 0.72, "learning_rate": 5.248702083835049e-05, "loss": 2.2669, "step": 57832 }, { "epoch": 0.72, "learning_rate": 5.246510030499522e-05, "loss": 2.2789, "step": 57840 }, { "epoch": 0.72, "learning_rate": 5.244318554206439e-05, "loss": 2.267, "step": 57848 }, { "epoch": 0.72, "learning_rate": 5.242127655175595e-05, "loss": 2.2503, "step": 57856 }, { "epoch": 0.72, "learning_rate": 5.2399373336267145e-05, "loss": 2.2873, "step": 57864 }, { "epoch": 0.72, "learning_rate": 5.2377475897794835e-05, "loss": 2.2617, "step": 57872 }, { "epoch": 0.72, "learning_rate": 5.235558423853519e-05, "loss": 2.2638, "step": 57880 }, { "epoch": 0.72, "learning_rate": 5.2333698360683825e-05, "loss": 2.2769, "step": 57888 }, { "epoch": 0.72, "learning_rate": 5.2311818266435744e-05, "loss": 2.2754, "step": 57896 }, { "epoch": 0.72, "learning_rate": 5.228994395798542e-05, "loss": 2.2696, "step": 57904 }, { "epoch": 0.72, "learning_rate": 5.226807543752672e-05, "loss": 2.2594, "step": 57912 }, { "epoch": 0.72, "learning_rate": 5.2246212707252915e-05, "loss": 2.25, "step": 57920 }, { "epoch": 0.72, "learning_rate": 5.222435576935674e-05, "loss": 2.2746, "step": 57928 }, { "epoch": 0.72, "learning_rate": 5.220250462603026e-05, "loss": 2.2557, "step": 57936 }, { "epoch": 0.72, "learning_rate": 5.218065927946514e-05, "loss": 2.2697, "step": 57944 }, { "epoch": 0.72, "learning_rate": 5.2158819731852226e-05, "loss": 2.2683, "step": 57952 }, { "epoch": 0.72, "learning_rate": 5.213698598538195e-05, "loss": 2.2706, "step": 57960 }, { "epoch": 0.72, "learning_rate": 5.2115158042244125e-05, "loss": 2.2706, "step": 57968 }, { "epoch": 0.72, "learning_rate": 5.2093335904627915e-05, "loss": 2.2562, "step": 57976 }, { "epoch": 0.72, "learning_rate": 5.207151957472205e-05, "loss": 2.2473, "step": 57984 }, { "epoch": 0.72, "learning_rate": 5.2049709054714515e-05, "loss": 2.2694, "step": 57992 }, { "epoch": 0.72, "learning_rate": 5.2027904346792766e-05, "loss": 2.2525, "step": 58000 }, { "epoch": 0.73, "learning_rate": 5.200610545314377e-05, "loss": 2.2458, "step": 58008 }, { "epoch": 0.73, "learning_rate": 5.198431237595374e-05, "loss": 2.2497, "step": 58016 }, { "epoch": 0.73, "learning_rate": 5.196252511740849e-05, "loss": 2.2732, "step": 58024 }, { "epoch": 0.73, "learning_rate": 5.1940743679693084e-05, "loss": 2.2718, "step": 58032 }, { "epoch": 0.73, "learning_rate": 5.191896806499208e-05, "loss": 2.2768, "step": 58040 }, { "epoch": 0.73, "learning_rate": 5.1897198275489534e-05, "loss": 2.2617, "step": 58048 }, { "epoch": 0.73, "learning_rate": 5.187543431336871e-05, "loss": 2.2784, "step": 58056 }, { "epoch": 0.73, "learning_rate": 5.1853676180812493e-05, "loss": 2.2603, "step": 58064 }, { "epoch": 0.73, "learning_rate": 5.1831923880003106e-05, "loss": 2.2429, "step": 58072 }, { "epoch": 0.73, "learning_rate": 5.1810177413122144e-05, "loss": 2.2496, "step": 58080 }, { "epoch": 0.73, "learning_rate": 5.178843678235068e-05, "loss": 2.2738, "step": 58088 }, { "epoch": 0.73, "learning_rate": 5.1766701989869106e-05, "loss": 2.273, "step": 58096 }, { "epoch": 0.73, "learning_rate": 5.1744973037857405e-05, "loss": 2.2488, "step": 58104 }, { "epoch": 0.73, "learning_rate": 5.1723249928494796e-05, "loss": 2.2882, "step": 58112 }, { "epoch": 0.73, "learning_rate": 5.170153266396003e-05, "loss": 2.2522, "step": 58120 }, { "epoch": 0.73, "learning_rate": 5.167982124643118e-05, "loss": 2.2537, "step": 58128 }, { "epoch": 0.73, "learning_rate": 5.165811567808578e-05, "loss": 2.2554, "step": 58136 }, { "epoch": 0.73, "learning_rate": 5.163641596110083e-05, "loss": 2.2703, "step": 58144 }, { "epoch": 0.73, "learning_rate": 5.161472209765263e-05, "loss": 2.2505, "step": 58152 }, { "epoch": 0.73, "learning_rate": 5.159303408991699e-05, "loss": 2.2432, "step": 58160 }, { "epoch": 0.73, "learning_rate": 5.157135194006908e-05, "loss": 2.2623, "step": 58168 }, { "epoch": 0.73, "learning_rate": 5.154967565028348e-05, "loss": 2.2529, "step": 58176 }, { "epoch": 0.73, "learning_rate": 5.1528005222734224e-05, "loss": 2.2724, "step": 58184 }, { "epoch": 0.73, "learning_rate": 5.150634065959472e-05, "loss": 2.2669, "step": 58192 }, { "epoch": 0.73, "learning_rate": 5.148468196303781e-05, "loss": 2.2745, "step": 58200 }, { "epoch": 0.73, "learning_rate": 5.1463029135235726e-05, "loss": 2.2594, "step": 58208 }, { "epoch": 0.73, "learning_rate": 5.1441382178360144e-05, "loss": 2.2645, "step": 58216 }, { "epoch": 0.73, "learning_rate": 5.1419741094582095e-05, "loss": 2.2529, "step": 58224 }, { "epoch": 0.73, "learning_rate": 5.13981058860721e-05, "loss": 2.2685, "step": 58232 }, { "epoch": 0.73, "learning_rate": 5.137647655500002e-05, "loss": 2.2719, "step": 58240 }, { "epoch": 0.73, "learning_rate": 5.135485310353513e-05, "loss": 2.2649, "step": 58248 }, { "epoch": 0.73, "learning_rate": 5.1333235533846236e-05, "loss": 2.2593, "step": 58256 }, { "epoch": 0.73, "learning_rate": 5.1311623848101355e-05, "loss": 2.2612, "step": 58264 }, { "epoch": 0.73, "learning_rate": 5.1290018048468046e-05, "loss": 2.2477, "step": 58272 }, { "epoch": 0.73, "learning_rate": 5.1268418137113304e-05, "loss": 2.2554, "step": 58280 }, { "epoch": 0.73, "learning_rate": 5.1246824116203384e-05, "loss": 2.2758, "step": 58288 }, { "epoch": 0.73, "learning_rate": 5.122523598790413e-05, "loss": 2.2683, "step": 58296 }, { "epoch": 0.73, "learning_rate": 5.120365375438065e-05, "loss": 2.2543, "step": 58304 }, { "epoch": 0.73, "learning_rate": 5.11820774177975e-05, "loss": 2.2582, "step": 58312 }, { "epoch": 0.73, "learning_rate": 5.116050698031878e-05, "loss": 2.2769, "step": 58320 }, { "epoch": 0.73, "learning_rate": 5.113894244410775e-05, "loss": 2.2634, "step": 58328 }, { "epoch": 0.73, "learning_rate": 5.111738381132728e-05, "loss": 2.2719, "step": 58336 }, { "epoch": 0.73, "learning_rate": 5.109583108413962e-05, "loss": 2.259, "step": 58344 }, { "epoch": 0.73, "learning_rate": 5.107428426470625e-05, "loss": 2.2601, "step": 58352 }, { "epoch": 0.73, "learning_rate": 5.105274335518835e-05, "loss": 2.2699, "step": 58360 }, { "epoch": 0.73, "learning_rate": 5.10312083577462e-05, "loss": 2.2618, "step": 58368 }, { "epoch": 0.73, "learning_rate": 5.1009679274539766e-05, "loss": 2.2558, "step": 58376 }, { "epoch": 0.73, "learning_rate": 5.0988156107728266e-05, "loss": 2.258, "step": 58384 }, { "epoch": 0.73, "learning_rate": 5.096663885947026e-05, "loss": 2.2656, "step": 58392 }, { "epoch": 0.73, "learning_rate": 5.094512753192393e-05, "loss": 2.2553, "step": 58400 }, { "epoch": 0.73, "learning_rate": 5.0923622127246665e-05, "loss": 2.2579, "step": 58408 }, { "epoch": 0.73, "learning_rate": 5.090212264759536e-05, "loss": 2.2642, "step": 58416 }, { "epoch": 0.73, "learning_rate": 5.08806290951263e-05, "loss": 2.2649, "step": 58424 }, { "epoch": 0.73, "learning_rate": 5.085914147199513e-05, "loss": 2.2518, "step": 58432 }, { "epoch": 0.73, "learning_rate": 5.083765978035697e-05, "loss": 2.2428, "step": 58440 }, { "epoch": 0.73, "learning_rate": 5.08161840223663e-05, "loss": 2.2589, "step": 58448 }, { "epoch": 0.73, "learning_rate": 5.079471420017701e-05, "loss": 2.2557, "step": 58456 }, { "epoch": 0.73, "learning_rate": 5.077325031594242e-05, "loss": 2.2665, "step": 58464 }, { "epoch": 0.73, "learning_rate": 5.075179237181523e-05, "loss": 2.26, "step": 58472 }, { "epoch": 0.73, "learning_rate": 5.073034036994755e-05, "loss": 2.251, "step": 58480 }, { "epoch": 0.73, "learning_rate": 5.070889431249087e-05, "loss": 2.2564, "step": 58488 }, { "epoch": 0.73, "learning_rate": 5.068745420159615e-05, "loss": 2.2553, "step": 58496 }, { "epoch": 0.73, "learning_rate": 5.066602003941368e-05, "loss": 2.2559, "step": 58504 }, { "epoch": 0.73, "learning_rate": 5.064459182809319e-05, "loss": 2.2671, "step": 58512 }, { "epoch": 0.73, "learning_rate": 5.062316956978381e-05, "loss": 2.2548, "step": 58520 }, { "epoch": 0.73, "learning_rate": 5.06017532666341e-05, "loss": 2.2666, "step": 58528 }, { "epoch": 0.73, "learning_rate": 5.058034292079195e-05, "loss": 2.2443, "step": 58536 }, { "epoch": 0.73, "learning_rate": 5.055893853440468e-05, "loss": 2.2851, "step": 58544 }, { "epoch": 0.73, "learning_rate": 5.053754010961913e-05, "loss": 2.264, "step": 58552 }, { "epoch": 0.73, "learning_rate": 5.0516147648581345e-05, "loss": 2.2671, "step": 58560 }, { "epoch": 0.73, "learning_rate": 5.04947611534369e-05, "loss": 2.2406, "step": 58568 }, { "epoch": 0.73, "learning_rate": 5.0473380626330736e-05, "loss": 2.2823, "step": 58576 }, { "epoch": 0.73, "learning_rate": 5.045200606940717e-05, "loss": 2.2757, "step": 58584 }, { "epoch": 0.73, "learning_rate": 5.0430637484810027e-05, "loss": 2.2609, "step": 58592 }, { "epoch": 0.73, "learning_rate": 5.0409274874682346e-05, "loss": 2.2437, "step": 58600 }, { "epoch": 0.73, "learning_rate": 5.0387918241166775e-05, "loss": 2.2704, "step": 58608 }, { "epoch": 0.73, "learning_rate": 5.036656758640524e-05, "loss": 2.2557, "step": 58616 }, { "epoch": 0.73, "learning_rate": 5.034522291253903e-05, "loss": 2.2417, "step": 58624 }, { "epoch": 0.73, "learning_rate": 5.0323884221708994e-05, "loss": 2.2608, "step": 58632 }, { "epoch": 0.73, "learning_rate": 5.030255151605516e-05, "loss": 2.2723, "step": 58640 }, { "epoch": 0.73, "learning_rate": 5.02812247977172e-05, "loss": 2.2558, "step": 58648 }, { "epoch": 0.73, "learning_rate": 5.0259904068834004e-05, "loss": 2.2481, "step": 58656 }, { "epoch": 0.73, "learning_rate": 5.023858933154388e-05, "loss": 2.2676, "step": 58664 }, { "epoch": 0.73, "learning_rate": 5.021728058798465e-05, "loss": 2.2517, "step": 58672 }, { "epoch": 0.73, "learning_rate": 5.019597784029342e-05, "loss": 2.2712, "step": 58680 }, { "epoch": 0.73, "learning_rate": 5.017468109060674e-05, "loss": 2.254, "step": 58688 }, { "epoch": 0.73, "learning_rate": 5.0153390341060614e-05, "loss": 2.2729, "step": 58696 }, { "epoch": 0.73, "learning_rate": 5.0132105593790256e-05, "loss": 2.2615, "step": 58704 }, { "epoch": 0.73, "learning_rate": 5.0110826850930504e-05, "loss": 2.279, "step": 58712 }, { "epoch": 0.73, "learning_rate": 5.008955411461547e-05, "loss": 2.2556, "step": 58720 }, { "epoch": 0.73, "learning_rate": 5.0068287386978685e-05, "loss": 2.2685, "step": 58728 }, { "epoch": 0.73, "learning_rate": 5.0047026670153076e-05, "loss": 2.2605, "step": 58736 }, { "epoch": 0.73, "learning_rate": 5.002577196627099e-05, "loss": 2.2489, "step": 58744 }, { "epoch": 0.73, "learning_rate": 5.000452327746413e-05, "loss": 2.2541, "step": 58752 }, { "epoch": 0.73, "learning_rate": 4.9983280605863644e-05, "loss": 2.2741, "step": 58760 }, { "epoch": 0.73, "learning_rate": 4.996204395360004e-05, "loss": 2.2745, "step": 58768 }, { "epoch": 0.73, "learning_rate": 4.9940813322803196e-05, "loss": 2.2645, "step": 58776 }, { "epoch": 0.73, "learning_rate": 4.9919588715602534e-05, "loss": 2.2517, "step": 58784 }, { "epoch": 0.73, "learning_rate": 4.989837013412665e-05, "loss": 2.2707, "step": 58792 }, { "epoch": 0.73, "learning_rate": 4.987715758050368e-05, "loss": 2.2534, "step": 58800 }, { "epoch": 0.74, "learning_rate": 4.985595105686114e-05, "loss": 2.2723, "step": 58808 }, { "epoch": 0.74, "learning_rate": 4.9834750565325885e-05, "loss": 2.2646, "step": 58816 }, { "epoch": 0.74, "learning_rate": 4.981355610802429e-05, "loss": 2.2831, "step": 58824 }, { "epoch": 0.74, "learning_rate": 4.9792367687081954e-05, "loss": 2.2833, "step": 58832 }, { "epoch": 0.74, "learning_rate": 4.977118530462395e-05, "loss": 2.254, "step": 58840 }, { "epoch": 0.74, "learning_rate": 4.9750008962774855e-05, "loss": 2.2512, "step": 58848 }, { "epoch": 0.74, "learning_rate": 4.972883866365839e-05, "loss": 2.2677, "step": 58856 }, { "epoch": 0.74, "learning_rate": 4.9707674409397967e-05, "loss": 2.2542, "step": 58864 }, { "epoch": 0.74, "learning_rate": 4.9686516202116125e-05, "loss": 2.2701, "step": 58872 }, { "epoch": 0.74, "learning_rate": 4.966536404393493e-05, "loss": 2.2454, "step": 58880 }, { "epoch": 0.74, "learning_rate": 4.96442179369759e-05, "loss": 2.264, "step": 58888 }, { "epoch": 0.74, "learning_rate": 4.962307788335976e-05, "loss": 2.2557, "step": 58896 }, { "epoch": 0.74, "learning_rate": 4.9601943885206826e-05, "loss": 2.2735, "step": 58904 }, { "epoch": 0.74, "learning_rate": 4.958081594463671e-05, "loss": 2.2647, "step": 58912 }, { "epoch": 0.74, "learning_rate": 4.955969406376835e-05, "loss": 2.264, "step": 58920 }, { "epoch": 0.74, "learning_rate": 4.9538578244720246e-05, "loss": 2.267, "step": 58928 }, { "epoch": 0.74, "learning_rate": 4.951746848961011e-05, "loss": 2.2647, "step": 58936 }, { "epoch": 0.74, "learning_rate": 4.949636480055519e-05, "loss": 2.2571, "step": 58944 }, { "epoch": 0.74, "learning_rate": 4.947526717967204e-05, "loss": 2.2709, "step": 58952 }, { "epoch": 0.74, "learning_rate": 4.945417562907665e-05, "loss": 2.2724, "step": 58960 }, { "epoch": 0.74, "learning_rate": 4.9433090150884376e-05, "loss": 2.254, "step": 58968 }, { "epoch": 0.74, "learning_rate": 4.941201074720997e-05, "loss": 2.26, "step": 58976 }, { "epoch": 0.74, "learning_rate": 4.939093742016757e-05, "loss": 2.2725, "step": 58984 }, { "epoch": 0.74, "learning_rate": 4.936987017187072e-05, "loss": 2.2711, "step": 58992 }, { "epoch": 0.74, "learning_rate": 4.9348809004432336e-05, "loss": 2.2531, "step": 59000 }, { "epoch": 0.74, "learning_rate": 4.9327753919964744e-05, "loss": 2.2927, "step": 59008 }, { "epoch": 0.74, "learning_rate": 4.9306704920579643e-05, "loss": 2.2562, "step": 59016 }, { "epoch": 0.74, "learning_rate": 4.928566200838814e-05, "loss": 2.2695, "step": 59024 }, { "epoch": 0.74, "learning_rate": 4.92646251855007e-05, "loss": 2.2561, "step": 59032 }, { "epoch": 0.74, "learning_rate": 4.924359445402722e-05, "loss": 2.2558, "step": 59040 }, { "epoch": 0.74, "learning_rate": 4.922256981607694e-05, "loss": 2.257, "step": 59048 }, { "epoch": 0.74, "learning_rate": 4.9201551273758534e-05, "loss": 2.266, "step": 59056 }, { "epoch": 0.74, "learning_rate": 4.9180538829180025e-05, "loss": 2.2699, "step": 59064 }, { "epoch": 0.74, "learning_rate": 4.9159532484448856e-05, "loss": 2.256, "step": 59072 }, { "epoch": 0.74, "learning_rate": 4.9138532241671834e-05, "loss": 2.2541, "step": 59080 }, { "epoch": 0.74, "learning_rate": 4.911753810295516e-05, "loss": 2.2645, "step": 59088 }, { "epoch": 0.74, "learning_rate": 4.909655007040445e-05, "loss": 2.2523, "step": 59096 }, { "epoch": 0.74, "learning_rate": 4.907556814612466e-05, "loss": 2.2626, "step": 59104 }, { "epoch": 0.74, "learning_rate": 4.905459233222014e-05, "loss": 2.2592, "step": 59112 }, { "epoch": 0.74, "learning_rate": 4.903362263079474e-05, "loss": 2.2509, "step": 59120 }, { "epoch": 0.74, "learning_rate": 4.901265904395147e-05, "loss": 2.2672, "step": 59128 }, { "epoch": 0.74, "learning_rate": 4.899170157379298e-05, "loss": 2.2619, "step": 59136 }, { "epoch": 0.74, "learning_rate": 4.89707502224211e-05, "loss": 2.2566, "step": 59144 }, { "epoch": 0.74, "learning_rate": 4.894980499193715e-05, "loss": 2.2711, "step": 59152 }, { "epoch": 0.74, "learning_rate": 4.892886588444187e-05, "loss": 2.2482, "step": 59160 }, { "epoch": 0.74, "learning_rate": 4.890793290203524e-05, "loss": 2.2656, "step": 59168 }, { "epoch": 0.74, "learning_rate": 4.8887006046816796e-05, "loss": 2.268, "step": 59176 }, { "epoch": 0.74, "learning_rate": 4.88660853208854e-05, "loss": 2.2701, "step": 59184 }, { "epoch": 0.74, "learning_rate": 4.884517072633918e-05, "loss": 2.2545, "step": 59192 }, { "epoch": 0.74, "learning_rate": 4.8824262265275874e-05, "loss": 2.2785, "step": 59200 }, { "epoch": 0.74, "learning_rate": 4.880335993979236e-05, "loss": 2.2756, "step": 59208 }, { "epoch": 0.74, "learning_rate": 4.8782463751985125e-05, "loss": 2.27, "step": 59216 }, { "epoch": 0.74, "learning_rate": 4.876157370394991e-05, "loss": 2.2473, "step": 59224 }, { "epoch": 0.74, "learning_rate": 4.874068979778181e-05, "loss": 2.2614, "step": 59232 }, { "epoch": 0.74, "learning_rate": 4.871981203557544e-05, "loss": 2.2744, "step": 59240 }, { "epoch": 0.74, "learning_rate": 4.869894041942468e-05, "loss": 2.2613, "step": 59248 }, { "epoch": 0.74, "learning_rate": 4.8678074951422846e-05, "loss": 2.2461, "step": 59256 }, { "epoch": 0.74, "learning_rate": 4.865721563366266e-05, "loss": 2.2814, "step": 59264 }, { "epoch": 0.74, "learning_rate": 4.86363624682361e-05, "loss": 2.2585, "step": 59272 }, { "epoch": 0.74, "learning_rate": 4.8615515457234704e-05, "loss": 2.2589, "step": 59280 }, { "epoch": 0.74, "learning_rate": 4.859467460274929e-05, "loss": 2.2708, "step": 59288 }, { "epoch": 0.74, "learning_rate": 4.8573839906870064e-05, "loss": 2.252, "step": 59296 }, { "epoch": 0.74, "learning_rate": 4.855301137168664e-05, "loss": 2.2657, "step": 59304 }, { "epoch": 0.74, "learning_rate": 4.8532188999288004e-05, "loss": 2.2588, "step": 59312 }, { "epoch": 0.74, "learning_rate": 4.8511372791762504e-05, "loss": 2.2502, "step": 59320 }, { "epoch": 0.74, "learning_rate": 4.849056275119791e-05, "loss": 2.2678, "step": 59328 }, { "epoch": 0.74, "learning_rate": 4.8469758879681324e-05, "loss": 2.2414, "step": 59336 }, { "epoch": 0.74, "learning_rate": 4.844896117929929e-05, "loss": 2.2691, "step": 59344 }, { "epoch": 0.74, "learning_rate": 4.8428169652137666e-05, "loss": 2.2592, "step": 59352 }, { "epoch": 0.74, "learning_rate": 4.840738430028176e-05, "loss": 2.245, "step": 59360 }, { "epoch": 0.74, "learning_rate": 4.838660512581619e-05, "loss": 2.2691, "step": 59368 }, { "epoch": 0.74, "learning_rate": 4.836583213082501e-05, "loss": 2.261, "step": 59376 }, { "epoch": 0.74, "learning_rate": 4.8345065317391604e-05, "loss": 2.2605, "step": 59384 }, { "epoch": 0.74, "learning_rate": 4.832430468759885e-05, "loss": 2.246, "step": 59392 }, { "epoch": 0.74, "learning_rate": 4.830355024352882e-05, "loss": 2.2747, "step": 59400 }, { "epoch": 0.74, "learning_rate": 4.828280198726312e-05, "loss": 2.2543, "step": 59408 }, { "epoch": 0.74, "learning_rate": 4.826205992088267e-05, "loss": 2.2804, "step": 59416 }, { "epoch": 0.74, "learning_rate": 4.8241324046467754e-05, "loss": 2.2683, "step": 59424 }, { "epoch": 0.74, "learning_rate": 4.822059436609815e-05, "loss": 2.2423, "step": 59432 }, { "epoch": 0.74, "learning_rate": 4.819987088185284e-05, "loss": 2.2525, "step": 59440 }, { "epoch": 0.74, "learning_rate": 4.817915359581028e-05, "loss": 2.2587, "step": 59448 }, { "epoch": 0.74, "learning_rate": 4.815844251004836e-05, "loss": 2.2466, "step": 59456 }, { "epoch": 0.74, "learning_rate": 4.8137737626644196e-05, "loss": 2.2624, "step": 59464 }, { "epoch": 0.74, "learning_rate": 4.811703894767447e-05, "loss": 2.2626, "step": 59472 }, { "epoch": 0.74, "learning_rate": 4.809634647521504e-05, "loss": 2.2623, "step": 59480 }, { "epoch": 0.74, "learning_rate": 4.807566021134131e-05, "loss": 2.2652, "step": 59488 }, { "epoch": 0.74, "learning_rate": 4.805498015812802e-05, "loss": 2.2524, "step": 59496 }, { "epoch": 0.74, "learning_rate": 4.803430631764915e-05, "loss": 2.2492, "step": 59504 }, { "epoch": 0.74, "learning_rate": 4.801363869197829e-05, "loss": 2.25, "step": 59512 }, { "epoch": 0.74, "learning_rate": 4.79929772831882e-05, "loss": 2.2514, "step": 59520 }, { "epoch": 0.74, "learning_rate": 4.797232209335117e-05, "loss": 2.2737, "step": 59528 }, { "epoch": 0.74, "learning_rate": 4.795167312453878e-05, "loss": 2.2604, "step": 59536 }, { "epoch": 0.74, "learning_rate": 4.793103037882193e-05, "loss": 2.2621, "step": 59544 }, { "epoch": 0.74, "learning_rate": 4.791039385827108e-05, "loss": 2.2785, "step": 59552 }, { "epoch": 0.74, "learning_rate": 4.788976356495588e-05, "loss": 2.2312, "step": 59560 }, { "epoch": 0.74, "learning_rate": 4.786913950094547e-05, "loss": 2.2622, "step": 59568 }, { "epoch": 0.74, "learning_rate": 4.784852166830831e-05, "loss": 2.2517, "step": 59576 }, { "epoch": 0.74, "learning_rate": 4.782791006911227e-05, "loss": 2.2701, "step": 59584 }, { "epoch": 0.74, "learning_rate": 4.780730470542455e-05, "loss": 2.2509, "step": 59592 }, { "epoch": 0.74, "learning_rate": 4.778670557931177e-05, "loss": 2.2628, "step": 59600 }, { "epoch": 0.75, "learning_rate": 4.77661126928399e-05, "loss": 2.2622, "step": 59608 }, { "epoch": 0.75, "learning_rate": 4.7745526048074293e-05, "loss": 2.2653, "step": 59616 }, { "epoch": 0.75, "learning_rate": 4.7724945647079664e-05, "loss": 2.2535, "step": 59624 }, { "epoch": 0.75, "learning_rate": 4.770437149192012e-05, "loss": 2.2442, "step": 59632 }, { "epoch": 0.75, "learning_rate": 4.768380358465913e-05, "loss": 2.2534, "step": 59640 }, { "epoch": 0.75, "learning_rate": 4.766324192735954e-05, "loss": 2.2732, "step": 59648 }, { "epoch": 0.75, "learning_rate": 4.764268652208353e-05, "loss": 2.2776, "step": 59656 }, { "epoch": 0.75, "learning_rate": 4.762213737089279e-05, "loss": 2.2534, "step": 59664 }, { "epoch": 0.75, "learning_rate": 4.760159447584819e-05, "loss": 2.2387, "step": 59672 }, { "epoch": 0.75, "learning_rate": 4.7581057839010054e-05, "loss": 2.2604, "step": 59680 }, { "epoch": 0.75, "learning_rate": 4.756052746243821e-05, "loss": 2.261, "step": 59688 }, { "epoch": 0.75, "learning_rate": 4.754000334819158e-05, "loss": 2.2597, "step": 59696 }, { "epoch": 0.75, "learning_rate": 4.751948549832877e-05, "loss": 2.2471, "step": 59704 }, { "epoch": 0.75, "learning_rate": 4.74989739149075e-05, "loss": 2.2674, "step": 59712 }, { "epoch": 0.75, "learning_rate": 4.747846859998496e-05, "loss": 2.2687, "step": 59720 }, { "epoch": 0.75, "learning_rate": 4.7457969555617815e-05, "loss": 2.2469, "step": 59728 }, { "epoch": 0.75, "learning_rate": 4.743747678386188e-05, "loss": 2.2625, "step": 59736 }, { "epoch": 0.75, "learning_rate": 4.741699028677256e-05, "loss": 2.2473, "step": 59744 }, { "epoch": 0.75, "learning_rate": 4.7396510066404523e-05, "loss": 2.2488, "step": 59752 }, { "epoch": 0.75, "learning_rate": 4.7376036124811735e-05, "loss": 2.256, "step": 59760 }, { "epoch": 0.75, "learning_rate": 4.735556846404774e-05, "loss": 2.2509, "step": 59768 }, { "epoch": 0.75, "learning_rate": 4.733510708616521e-05, "loss": 2.2807, "step": 59776 }, { "epoch": 0.75, "learning_rate": 4.731465199321638e-05, "loss": 2.2686, "step": 59784 }, { "epoch": 0.75, "learning_rate": 4.72942031872528e-05, "loss": 2.2668, "step": 59792 }, { "epoch": 0.75, "learning_rate": 4.727376067032527e-05, "loss": 2.258, "step": 59800 }, { "epoch": 0.75, "learning_rate": 4.725332444448414e-05, "loss": 2.2759, "step": 59808 }, { "epoch": 0.75, "learning_rate": 4.723289451177903e-05, "loss": 2.249, "step": 59816 }, { "epoch": 0.75, "learning_rate": 4.721247087425894e-05, "loss": 2.2611, "step": 59824 }, { "epoch": 0.75, "learning_rate": 4.719205353397224e-05, "loss": 2.2587, "step": 59832 }, { "epoch": 0.75, "learning_rate": 4.71716424929667e-05, "loss": 2.2451, "step": 59840 }, { "epoch": 0.75, "learning_rate": 4.71512377532894e-05, "loss": 2.2624, "step": 59848 }, { "epoch": 0.75, "learning_rate": 4.713083931698683e-05, "loss": 2.2421, "step": 59856 }, { "epoch": 0.75, "learning_rate": 4.711044718610486e-05, "loss": 2.2491, "step": 59864 }, { "epoch": 0.75, "learning_rate": 4.709006136268866e-05, "loss": 2.2604, "step": 59872 }, { "epoch": 0.75, "learning_rate": 4.706968184878285e-05, "loss": 2.2763, "step": 59880 }, { "epoch": 0.75, "learning_rate": 4.704930864643137e-05, "loss": 2.23, "step": 59888 }, { "epoch": 0.75, "learning_rate": 4.7028941757677536e-05, "loss": 2.2531, "step": 59896 }, { "epoch": 0.75, "learning_rate": 4.7008581184564024e-05, "loss": 2.2575, "step": 59904 }, { "epoch": 0.75, "learning_rate": 4.6988226929132886e-05, "loss": 2.2693, "step": 59912 }, { "epoch": 0.75, "learning_rate": 4.6967878993425544e-05, "loss": 2.2584, "step": 59920 }, { "epoch": 0.75, "learning_rate": 4.6947537379482794e-05, "loss": 2.2517, "step": 59928 }, { "epoch": 0.75, "learning_rate": 4.6927202089344756e-05, "loss": 2.2583, "step": 59936 }, { "epoch": 0.75, "learning_rate": 4.690687312505096e-05, "loss": 2.2711, "step": 59944 }, { "epoch": 0.75, "learning_rate": 4.6886550488640266e-05, "loss": 2.2534, "step": 59952 }, { "epoch": 0.75, "learning_rate": 4.686623418215098e-05, "loss": 2.2674, "step": 59960 }, { "epoch": 0.75, "learning_rate": 4.684592420762065e-05, "loss": 2.2434, "step": 59968 }, { "epoch": 0.75, "learning_rate": 4.682562056708627e-05, "loss": 2.2703, "step": 59976 }, { "epoch": 0.75, "learning_rate": 4.6805323262584185e-05, "loss": 2.2588, "step": 59984 }, { "epoch": 0.75, "learning_rate": 4.6785032296150055e-05, "loss": 2.2544, "step": 59992 }, { "epoch": 0.75, "learning_rate": 4.676474766981906e-05, "loss": 2.2517, "step": 60000 }, { "epoch": 0.75, "learning_rate": 4.67444693856255e-05, "loss": 2.2716, "step": 60008 }, { "epoch": 0.75, "learning_rate": 4.672419744560326e-05, "loss": 2.2362, "step": 60016 }, { "epoch": 0.75, "learning_rate": 4.6703931851785503e-05, "loss": 2.2652, "step": 60024 }, { "epoch": 0.75, "learning_rate": 4.6683672606204674e-05, "loss": 2.26, "step": 60032 }, { "epoch": 0.75, "learning_rate": 4.666341971089277e-05, "loss": 2.2544, "step": 60040 }, { "epoch": 0.75, "learning_rate": 4.6643173167880934e-05, "loss": 2.2547, "step": 60048 }, { "epoch": 0.75, "learning_rate": 4.6622932979199846e-05, "loss": 2.2591, "step": 60056 }, { "epoch": 0.75, "learning_rate": 4.6602699146879495e-05, "loss": 2.2613, "step": 60064 }, { "epoch": 0.75, "learning_rate": 4.658247167294915e-05, "loss": 2.259, "step": 60072 }, { "epoch": 0.75, "learning_rate": 4.656225055943756e-05, "loss": 2.2496, "step": 60080 }, { "epoch": 0.75, "learning_rate": 4.654203580837279e-05, "loss": 2.2542, "step": 60088 }, { "epoch": 0.75, "learning_rate": 4.652182742178226e-05, "loss": 2.2591, "step": 60096 }, { "epoch": 0.75, "learning_rate": 4.6501625401692775e-05, "loss": 2.2519, "step": 60104 }, { "epoch": 0.75, "learning_rate": 4.6481429750130404e-05, "loss": 2.2558, "step": 60112 }, { "epoch": 0.75, "learning_rate": 4.6461240469120746e-05, "loss": 2.2639, "step": 60120 }, { "epoch": 0.75, "learning_rate": 4.644105756068864e-05, "loss": 2.2614, "step": 60128 }, { "epoch": 0.75, "learning_rate": 4.6420881026858306e-05, "loss": 2.2494, "step": 60136 }, { "epoch": 0.75, "learning_rate": 4.640071086965335e-05, "loss": 2.2375, "step": 60144 }, { "epoch": 0.75, "learning_rate": 4.638054709109672e-05, "loss": 2.2415, "step": 60152 }, { "epoch": 0.75, "learning_rate": 4.6360389693210735e-05, "loss": 2.238, "step": 60160 }, { "epoch": 0.75, "learning_rate": 4.634023867801705e-05, "loss": 2.2491, "step": 60168 }, { "epoch": 0.75, "learning_rate": 4.6320094047536716e-05, "loss": 2.2502, "step": 60176 }, { "epoch": 0.75, "learning_rate": 4.629995580379013e-05, "loss": 2.2501, "step": 60184 }, { "epoch": 0.75, "learning_rate": 4.6279823948797024e-05, "loss": 2.2437, "step": 60192 }, { "epoch": 0.75, "learning_rate": 4.6259698484576505e-05, "loss": 2.2367, "step": 60200 }, { "epoch": 0.75, "learning_rate": 4.623957941314707e-05, "loss": 2.2303, "step": 60208 }, { "epoch": 0.75, "learning_rate": 4.6219466736526536e-05, "loss": 2.2475, "step": 60216 }, { "epoch": 0.75, "learning_rate": 4.619936045673205e-05, "loss": 2.2527, "step": 60224 }, { "epoch": 0.75, "learning_rate": 4.617926057578026e-05, "loss": 2.2613, "step": 60232 }, { "epoch": 0.75, "learning_rate": 4.6159167095686974e-05, "loss": 2.268, "step": 60240 }, { "epoch": 0.75, "learning_rate": 4.613908001846747e-05, "loss": 2.2523, "step": 60248 }, { "epoch": 0.75, "learning_rate": 4.611899934613641e-05, "loss": 2.2471, "step": 60256 }, { "epoch": 0.75, "learning_rate": 4.609892508070771e-05, "loss": 2.2448, "step": 60264 }, { "epoch": 0.75, "learning_rate": 4.6078857224194794e-05, "loss": 2.2537, "step": 60272 }, { "epoch": 0.75, "learning_rate": 4.605879577861027e-05, "loss": 2.2655, "step": 60280 }, { "epoch": 0.75, "learning_rate": 4.6038740745966195e-05, "loss": 2.2713, "step": 60288 }, { "epoch": 0.75, "learning_rate": 4.601869212827405e-05, "loss": 2.2501, "step": 60296 }, { "epoch": 0.75, "learning_rate": 4.5998649927544504e-05, "loss": 2.2539, "step": 60304 }, { "epoch": 0.75, "learning_rate": 4.5978614145787766e-05, "loss": 2.2493, "step": 60312 }, { "epoch": 0.75, "learning_rate": 4.595858478501323e-05, "loss": 2.2695, "step": 60320 }, { "epoch": 0.75, "learning_rate": 4.593856184722974e-05, "loss": 2.2677, "step": 60328 }, { "epoch": 0.75, "learning_rate": 4.591854533444556e-05, "loss": 2.2654, "step": 60336 }, { "epoch": 0.75, "learning_rate": 4.589853524866812e-05, "loss": 2.2458, "step": 60344 }, { "epoch": 0.75, "learning_rate": 4.5878531591904404e-05, "loss": 2.2535, "step": 60352 }, { "epoch": 0.75, "learning_rate": 4.585853436616064e-05, "loss": 2.2374, "step": 60360 }, { "epoch": 0.75, "learning_rate": 4.5838543573442426e-05, "loss": 2.2734, "step": 60368 }, { "epoch": 0.75, "learning_rate": 4.581855921575477e-05, "loss": 2.2392, "step": 60376 }, { "epoch": 0.75, "learning_rate": 4.579858129510189e-05, "loss": 2.25, "step": 60384 }, { "epoch": 0.75, "learning_rate": 4.5778609813487556e-05, "loss": 2.2607, "step": 60392 }, { "epoch": 0.76, "learning_rate": 4.5758644772914745e-05, "loss": 2.2629, "step": 60400 }, { "epoch": 0.76, "learning_rate": 4.573868617538587e-05, "loss": 2.228, "step": 60408 }, { "epoch": 0.76, "learning_rate": 4.571873402290263e-05, "loss": 2.239, "step": 60416 }, { "epoch": 0.76, "learning_rate": 4.569878831746614e-05, "loss": 2.2614, "step": 60424 }, { "epoch": 0.76, "learning_rate": 4.567884906107683e-05, "loss": 2.2629, "step": 60432 }, { "epoch": 0.76, "learning_rate": 4.5658916255734495e-05, "loss": 2.2453, "step": 60440 }, { "epoch": 0.76, "learning_rate": 4.563898990343828e-05, "loss": 2.2656, "step": 60448 }, { "epoch": 0.76, "learning_rate": 4.561907000618669e-05, "loss": 2.2579, "step": 60456 }, { "epoch": 0.76, "learning_rate": 4.559915656597757e-05, "loss": 2.2475, "step": 60464 }, { "epoch": 0.76, "learning_rate": 4.557924958480814e-05, "loss": 2.2645, "step": 60472 }, { "epoch": 0.76, "learning_rate": 4.555934906467495e-05, "loss": 2.2303, "step": 60480 }, { "epoch": 0.76, "learning_rate": 4.553945500757391e-05, "loss": 2.2486, "step": 60488 }, { "epoch": 0.76, "learning_rate": 4.551956741550026e-05, "loss": 2.2518, "step": 60496 }, { "epoch": 0.76, "learning_rate": 4.5499686290448644e-05, "loss": 2.2583, "step": 60504 }, { "epoch": 0.76, "learning_rate": 4.547981163441302e-05, "loss": 2.2638, "step": 60512 }, { "epoch": 0.76, "learning_rate": 4.545994344938667e-05, "loss": 2.2542, "step": 60520 }, { "epoch": 0.76, "learning_rate": 4.544008173736234e-05, "loss": 2.2595, "step": 60528 }, { "epoch": 0.76, "learning_rate": 4.5420226500331934e-05, "loss": 2.2627, "step": 60536 }, { "epoch": 0.76, "learning_rate": 4.540037774028694e-05, "loss": 2.2492, "step": 60544 }, { "epoch": 0.76, "learning_rate": 4.538053545921799e-05, "loss": 2.2411, "step": 60552 }, { "epoch": 0.76, "learning_rate": 4.5360699659115156e-05, "loss": 2.2633, "step": 60560 }, { "epoch": 0.76, "learning_rate": 4.5340870341967925e-05, "loss": 2.2557, "step": 60568 }, { "epoch": 0.76, "learning_rate": 4.5321047509764964e-05, "loss": 2.2639, "step": 60576 }, { "epoch": 0.76, "learning_rate": 4.530123116449449e-05, "loss": 2.2273, "step": 60584 }, { "epoch": 0.76, "learning_rate": 4.528142130814394e-05, "loss": 2.2538, "step": 60592 }, { "epoch": 0.76, "learning_rate": 4.526161794270007e-05, "loss": 2.2556, "step": 60600 }, { "epoch": 0.76, "learning_rate": 4.5241821070149136e-05, "loss": 2.2631, "step": 60608 }, { "epoch": 0.76, "learning_rate": 4.5222030692476564e-05, "loss": 2.257, "step": 60616 }, { "epoch": 0.76, "learning_rate": 4.520224681166728e-05, "loss": 2.2344, "step": 60624 }, { "epoch": 0.76, "learning_rate": 4.518246942970552e-05, "loss": 2.2627, "step": 60632 }, { "epoch": 0.76, "learning_rate": 4.516269854857473e-05, "loss": 2.2613, "step": 60640 }, { "epoch": 0.76, "learning_rate": 4.5142934170257916e-05, "loss": 2.2417, "step": 60648 }, { "epoch": 0.76, "learning_rate": 4.5123176296737315e-05, "loss": 2.2636, "step": 60656 }, { "epoch": 0.76, "learning_rate": 4.510342492999452e-05, "loss": 2.2659, "step": 60664 }, { "epoch": 0.76, "learning_rate": 4.508368007201049e-05, "loss": 2.2497, "step": 60672 }, { "epoch": 0.76, "learning_rate": 4.506394172476547e-05, "loss": 2.2507, "step": 60680 }, { "epoch": 0.76, "learning_rate": 4.5044209890239166e-05, "loss": 2.2528, "step": 60688 }, { "epoch": 0.76, "learning_rate": 4.502448457041056e-05, "loss": 2.2663, "step": 60696 }, { "epoch": 0.76, "learning_rate": 4.500476576725798e-05, "loss": 2.2527, "step": 60704 }, { "epoch": 0.76, "learning_rate": 4.49850534827591e-05, "loss": 2.2556, "step": 60712 }, { "epoch": 0.76, "learning_rate": 4.496534771889097e-05, "loss": 2.2288, "step": 60720 }, { "epoch": 0.76, "learning_rate": 4.494564847762995e-05, "loss": 2.2357, "step": 60728 }, { "epoch": 0.76, "learning_rate": 4.4925955760951774e-05, "loss": 2.2741, "step": 60736 }, { "epoch": 0.76, "learning_rate": 4.4906269570831504e-05, "loss": 2.2596, "step": 60744 }, { "epoch": 0.76, "learning_rate": 4.488658990924356e-05, "loss": 2.2427, "step": 60752 }, { "epoch": 0.76, "learning_rate": 4.4866916778161694e-05, "loss": 2.2482, "step": 60760 }, { "epoch": 0.76, "learning_rate": 4.4847250179558994e-05, "loss": 2.2484, "step": 60768 }, { "epoch": 0.76, "learning_rate": 4.4827590115407944e-05, "loss": 2.2587, "step": 60776 }, { "epoch": 0.76, "learning_rate": 4.480793658768031e-05, "loss": 2.2521, "step": 60784 }, { "epoch": 0.76, "learning_rate": 4.478828959834722e-05, "loss": 2.2588, "step": 60792 }, { "epoch": 0.76, "learning_rate": 4.4768649149379225e-05, "loss": 2.2583, "step": 60800 }, { "epoch": 0.76, "learning_rate": 4.474901524274606e-05, "loss": 2.2471, "step": 60808 }, { "epoch": 0.76, "learning_rate": 4.472938788041694e-05, "loss": 2.2439, "step": 60816 }, { "epoch": 0.76, "learning_rate": 4.4709767064360375e-05, "loss": 2.2672, "step": 60824 }, { "epoch": 0.76, "learning_rate": 4.4690152796544196e-05, "loss": 2.26, "step": 60832 }, { "epoch": 0.76, "learning_rate": 4.4670545078935666e-05, "loss": 2.2484, "step": 60840 }, { "epoch": 0.76, "learning_rate": 4.465094391350128e-05, "loss": 2.2262, "step": 60848 }, { "epoch": 0.76, "learning_rate": 4.463134930220688e-05, "loss": 2.2514, "step": 60856 }, { "epoch": 0.76, "learning_rate": 4.461176124701781e-05, "loss": 2.2684, "step": 60864 }, { "epoch": 0.76, "learning_rate": 4.4592179749898535e-05, "loss": 2.2466, "step": 60872 }, { "epoch": 0.76, "learning_rate": 4.457260481281305e-05, "loss": 2.2603, "step": 60880 }, { "epoch": 0.76, "learning_rate": 4.455303643772452e-05, "loss": 2.2565, "step": 60888 }, { "epoch": 0.76, "learning_rate": 4.4533474626595616e-05, "loss": 2.2402, "step": 60896 }, { "epoch": 0.76, "learning_rate": 4.451391938138829e-05, "loss": 2.2803, "step": 60904 }, { "epoch": 0.76, "learning_rate": 4.449437070406372e-05, "loss": 2.2539, "step": 60912 }, { "epoch": 0.76, "learning_rate": 4.447482859658263e-05, "loss": 2.2601, "step": 60920 }, { "epoch": 0.76, "learning_rate": 4.4455293060904944e-05, "loss": 2.2669, "step": 60928 }, { "epoch": 0.76, "learning_rate": 4.443576409898996e-05, "loss": 2.2602, "step": 60936 }, { "epoch": 0.76, "learning_rate": 4.441624171279636e-05, "loss": 2.2494, "step": 60944 }, { "epoch": 0.76, "learning_rate": 4.439672590428205e-05, "loss": 2.2534, "step": 60952 }, { "epoch": 0.76, "learning_rate": 4.437721667540442e-05, "loss": 2.2476, "step": 60960 }, { "epoch": 0.76, "learning_rate": 4.435771402812013e-05, "loss": 2.2561, "step": 60968 }, { "epoch": 0.76, "learning_rate": 4.433821796438516e-05, "loss": 2.2428, "step": 60976 }, { "epoch": 0.76, "learning_rate": 4.431872848615487e-05, "loss": 2.2378, "step": 60984 }, { "epoch": 0.76, "learning_rate": 4.429924559538396e-05, "loss": 2.2493, "step": 60992 }, { "epoch": 0.76, "learning_rate": 4.427976929402642e-05, "loss": 2.2729, "step": 61000 }, { "epoch": 0.76, "learning_rate": 4.4260299584035625e-05, "loss": 2.2669, "step": 61008 }, { "epoch": 0.76, "learning_rate": 4.424083646736429e-05, "loss": 2.2665, "step": 61016 }, { "epoch": 0.76, "learning_rate": 4.4221379945964436e-05, "loss": 2.2701, "step": 61024 }, { "epoch": 0.76, "learning_rate": 4.420193002178746e-05, "loss": 2.2682, "step": 61032 }, { "epoch": 0.76, "learning_rate": 4.418248669678406e-05, "loss": 2.2474, "step": 61040 }, { "epoch": 0.76, "learning_rate": 4.416304997290431e-05, "loss": 2.2605, "step": 61048 }, { "epoch": 0.76, "learning_rate": 4.4143619852097595e-05, "loss": 2.2618, "step": 61056 }, { "epoch": 0.76, "learning_rate": 4.412419633631262e-05, "loss": 2.2452, "step": 61064 }, { "epoch": 0.76, "learning_rate": 4.4104779427497536e-05, "loss": 2.2538, "step": 61072 }, { "epoch": 0.76, "learning_rate": 4.4085369127599664e-05, "loss": 2.251, "step": 61080 }, { "epoch": 0.76, "learning_rate": 4.406596543856577e-05, "loss": 2.256, "step": 61088 }, { "epoch": 0.76, "learning_rate": 4.4046568362341943e-05, "loss": 2.2561, "step": 61096 }, { "epoch": 0.76, "learning_rate": 4.402717790087357e-05, "loss": 2.2566, "step": 61104 }, { "epoch": 0.76, "learning_rate": 4.400779405610547e-05, "loss": 2.2852, "step": 61112 }, { "epoch": 0.76, "learning_rate": 4.398841682998169e-05, "loss": 2.2717, "step": 61120 }, { "epoch": 0.76, "learning_rate": 4.396904622444562e-05, "loss": 2.2525, "step": 61128 }, { "epoch": 0.76, "learning_rate": 4.3949682241440116e-05, "loss": 2.2632, "step": 61136 }, { "epoch": 0.76, "learning_rate": 4.393032488290718e-05, "loss": 2.2408, "step": 61144 }, { "epoch": 0.76, "learning_rate": 4.391097415078832e-05, "loss": 2.2476, "step": 61152 }, { "epoch": 0.76, "learning_rate": 4.3891630047024254e-05, "loss": 2.2431, "step": 61160 }, { "epoch": 0.76, "learning_rate": 4.387229257355509e-05, "loss": 2.2537, "step": 61168 }, { "epoch": 0.76, "learning_rate": 4.385296173232032e-05, "loss": 2.2551, "step": 61176 }, { "epoch": 0.76, "learning_rate": 4.383363752525863e-05, "loss": 2.2322, "step": 61184 }, { "epoch": 0.76, "learning_rate": 4.3814319954308196e-05, "loss": 2.259, "step": 61192 }, { "epoch": 0.77, "learning_rate": 4.3795009021406475e-05, "loss": 2.2675, "step": 61200 }, { "epoch": 0.77, "learning_rate": 4.377570472849016e-05, "loss": 2.2385, "step": 61208 }, { "epoch": 0.77, "learning_rate": 4.3756407077495464e-05, "loss": 2.2284, "step": 61216 }, { "epoch": 0.77, "learning_rate": 4.3737116070357717e-05, "loss": 2.2472, "step": 61224 }, { "epoch": 0.77, "learning_rate": 4.37178317090118e-05, "loss": 2.2594, "step": 61232 }, { "epoch": 0.77, "learning_rate": 4.369855399539179e-05, "loss": 2.2747, "step": 61240 }, { "epoch": 0.77, "learning_rate": 4.367928293143112e-05, "loss": 2.2641, "step": 61248 }, { "epoch": 0.77, "learning_rate": 4.3660018519062584e-05, "loss": 2.2514, "step": 61256 }, { "epoch": 0.77, "learning_rate": 4.364076076021829e-05, "loss": 2.2627, "step": 61264 }, { "epoch": 0.77, "learning_rate": 4.362150965682967e-05, "loss": 2.2475, "step": 61272 }, { "epoch": 0.77, "learning_rate": 4.360226521082752e-05, "loss": 2.274, "step": 61280 }, { "epoch": 0.77, "learning_rate": 4.358302742414193e-05, "loss": 2.2716, "step": 61288 }, { "epoch": 0.77, "learning_rate": 4.356379629870236e-05, "loss": 2.2662, "step": 61296 }, { "epoch": 0.77, "learning_rate": 4.354457183643757e-05, "loss": 2.2446, "step": 61304 }, { "epoch": 0.77, "learning_rate": 4.352535403927567e-05, "loss": 2.2795, "step": 61312 }, { "epoch": 0.77, "learning_rate": 4.3506142909144086e-05, "loss": 2.2645, "step": 61320 }, { "epoch": 0.77, "learning_rate": 4.348693844796959e-05, "loss": 2.2676, "step": 61328 }, { "epoch": 0.77, "learning_rate": 4.3467740657678305e-05, "loss": 2.2703, "step": 61336 }, { "epoch": 0.77, "learning_rate": 4.344854954019562e-05, "loss": 2.2447, "step": 61344 }, { "epoch": 0.77, "learning_rate": 4.3429365097446315e-05, "loss": 2.2623, "step": 61352 }, { "epoch": 0.77, "learning_rate": 4.3410187331354455e-05, "loss": 2.2598, "step": 61360 }, { "epoch": 0.77, "learning_rate": 4.339101624384355e-05, "loss": 2.2485, "step": 61368 }, { "epoch": 0.77, "learning_rate": 4.3371851836836266e-05, "loss": 2.2627, "step": 61376 }, { "epoch": 0.77, "learning_rate": 4.3352694112254694e-05, "loss": 2.2402, "step": 61384 }, { "epoch": 0.77, "learning_rate": 4.3333543072020256e-05, "loss": 2.2408, "step": 61392 }, { "epoch": 0.77, "learning_rate": 4.331439871805367e-05, "loss": 2.2396, "step": 61400 }, { "epoch": 0.77, "learning_rate": 4.329526105227509e-05, "loss": 2.2648, "step": 61408 }, { "epoch": 0.77, "learning_rate": 4.32761300766038e-05, "loss": 2.257, "step": 61416 }, { "epoch": 0.77, "learning_rate": 4.325700579295862e-05, "loss": 2.2448, "step": 61424 }, { "epoch": 0.77, "learning_rate": 4.323788820325759e-05, "loss": 2.2746, "step": 61432 }, { "epoch": 0.77, "learning_rate": 4.321877730941802e-05, "loss": 2.2679, "step": 61440 }, { "epoch": 0.77, "learning_rate": 4.319967311335675e-05, "loss": 2.2715, "step": 61448 }, { "epoch": 0.77, "learning_rate": 4.318057561698969e-05, "loss": 2.2654, "step": 61456 }, { "epoch": 0.77, "learning_rate": 4.316148482223231e-05, "loss": 2.2483, "step": 61464 }, { "epoch": 0.77, "learning_rate": 4.31424007309993e-05, "loss": 2.2534, "step": 61472 }, { "epoch": 0.77, "learning_rate": 4.31233233452046e-05, "loss": 2.255, "step": 61480 }, { "epoch": 0.77, "learning_rate": 4.310425266676166e-05, "loss": 2.2609, "step": 61488 }, { "epoch": 0.77, "learning_rate": 4.308518869758312e-05, "loss": 2.2645, "step": 61496 }, { "epoch": 0.77, "learning_rate": 4.306613143958099e-05, "loss": 2.2465, "step": 61504 }, { "epoch": 0.77, "learning_rate": 4.3047080894666647e-05, "loss": 2.2491, "step": 61512 }, { "epoch": 0.77, "learning_rate": 4.302803706475065e-05, "loss": 2.2558, "step": 61520 }, { "epoch": 0.77, "learning_rate": 4.300899995174308e-05, "loss": 2.2417, "step": 61528 }, { "epoch": 0.77, "learning_rate": 4.298996955755323e-05, "loss": 2.2382, "step": 61536 }, { "epoch": 0.77, "learning_rate": 4.297094588408973e-05, "loss": 2.2476, "step": 61544 }, { "epoch": 0.77, "learning_rate": 4.295192893326056e-05, "loss": 2.2636, "step": 61552 }, { "epoch": 0.77, "learning_rate": 4.293291870697298e-05, "loss": 2.2615, "step": 61560 }, { "epoch": 0.77, "learning_rate": 4.291391520713364e-05, "loss": 2.2768, "step": 61568 }, { "epoch": 0.77, "learning_rate": 4.2894918435648477e-05, "loss": 2.2409, "step": 61576 }, { "epoch": 0.77, "learning_rate": 4.287592839442276e-05, "loss": 2.2491, "step": 61584 }, { "epoch": 0.77, "learning_rate": 4.2856945085361076e-05, "loss": 2.2573, "step": 61592 }, { "epoch": 0.77, "learning_rate": 4.283796851036735e-05, "loss": 2.2635, "step": 61600 }, { "epoch": 0.77, "learning_rate": 4.2818998671344815e-05, "loss": 2.2631, "step": 61608 }, { "epoch": 0.77, "learning_rate": 4.280003557019604e-05, "loss": 2.2411, "step": 61616 }, { "epoch": 0.77, "learning_rate": 4.278107920882293e-05, "loss": 2.2463, "step": 61624 }, { "epoch": 0.77, "learning_rate": 4.276212958912666e-05, "loss": 2.2527, "step": 61632 }, { "epoch": 0.77, "learning_rate": 4.274318671300787e-05, "loss": 2.268, "step": 61640 }, { "epoch": 0.77, "learning_rate": 4.272425058236631e-05, "loss": 2.2371, "step": 61648 }, { "epoch": 0.77, "learning_rate": 4.270532119910121e-05, "loss": 2.2382, "step": 61656 }, { "epoch": 0.77, "learning_rate": 4.268639856511109e-05, "loss": 2.2368, "step": 61664 }, { "epoch": 0.77, "learning_rate": 4.266748268229375e-05, "loss": 2.2512, "step": 61672 }, { "epoch": 0.77, "learning_rate": 4.264857355254641e-05, "loss": 2.2751, "step": 61680 }, { "epoch": 0.77, "learning_rate": 4.2629671177765494e-05, "loss": 2.2638, "step": 61688 }, { "epoch": 0.77, "learning_rate": 4.2610775559846786e-05, "loss": 2.2448, "step": 61696 }, { "epoch": 0.77, "learning_rate": 4.25918867006855e-05, "loss": 2.2577, "step": 61704 }, { "epoch": 0.77, "learning_rate": 4.257300460217596e-05, "loss": 2.2378, "step": 61712 }, { "epoch": 0.77, "learning_rate": 4.255412926621205e-05, "loss": 2.2751, "step": 61720 }, { "epoch": 0.77, "learning_rate": 4.253526069468679e-05, "loss": 2.2744, "step": 61728 }, { "epoch": 0.77, "learning_rate": 4.2516398889492574e-05, "loss": 2.265, "step": 61736 }, { "epoch": 0.77, "learning_rate": 4.2497543852521214e-05, "loss": 2.2636, "step": 61744 }, { "epoch": 0.77, "learning_rate": 4.247869558566366e-05, "loss": 2.2524, "step": 61752 }, { "epoch": 0.77, "learning_rate": 4.245985409081038e-05, "loss": 2.2532, "step": 61760 }, { "epoch": 0.77, "learning_rate": 4.244101936985103e-05, "loss": 2.2553, "step": 61768 }, { "epoch": 0.77, "learning_rate": 4.242219142467462e-05, "loss": 2.2419, "step": 61776 }, { "epoch": 0.77, "learning_rate": 4.240337025716952e-05, "loss": 2.2575, "step": 61784 }, { "epoch": 0.77, "learning_rate": 4.238455586922331e-05, "loss": 2.2563, "step": 61792 }, { "epoch": 0.77, "learning_rate": 4.2365748262723035e-05, "loss": 2.2603, "step": 61800 }, { "epoch": 0.77, "learning_rate": 4.234694743955498e-05, "loss": 2.2439, "step": 61808 }, { "epoch": 0.77, "learning_rate": 4.232815340160475e-05, "loss": 2.2588, "step": 61816 }, { "epoch": 0.77, "learning_rate": 4.2309366150757294e-05, "loss": 2.2829, "step": 61824 }, { "epoch": 0.77, "learning_rate": 4.2290585688896846e-05, "loss": 2.2771, "step": 61832 }, { "epoch": 0.77, "learning_rate": 4.2271812017907e-05, "loss": 2.2627, "step": 61840 }, { "epoch": 0.77, "learning_rate": 4.2253045139670624e-05, "loss": 2.251, "step": 61848 }, { "epoch": 0.77, "learning_rate": 4.223428505606996e-05, "loss": 2.2435, "step": 61856 }, { "epoch": 0.77, "learning_rate": 4.221553176898652e-05, "loss": 2.2613, "step": 61864 }, { "epoch": 0.77, "learning_rate": 4.219678528030114e-05, "loss": 2.2647, "step": 61872 }, { "epoch": 0.77, "learning_rate": 4.2178045591894025e-05, "loss": 2.2575, "step": 61880 }, { "epoch": 0.77, "learning_rate": 4.215931270564463e-05, "loss": 2.2672, "step": 61888 }, { "epoch": 0.77, "learning_rate": 4.2140586623431756e-05, "loss": 2.2533, "step": 61896 }, { "epoch": 0.77, "learning_rate": 4.212186734713354e-05, "loss": 2.2622, "step": 61904 }, { "epoch": 0.77, "learning_rate": 4.2103154878627406e-05, "loss": 2.2585, "step": 61912 }, { "epoch": 0.77, "learning_rate": 4.208444921979011e-05, "loss": 2.2471, "step": 61920 }, { "epoch": 0.77, "learning_rate": 4.2065750372497724e-05, "loss": 2.2636, "step": 61928 }, { "epoch": 0.77, "learning_rate": 4.204705833862566e-05, "loss": 2.2277, "step": 61936 }, { "epoch": 0.77, "learning_rate": 4.202837312004856e-05, "loss": 2.2741, "step": 61944 }, { "epoch": 0.77, "learning_rate": 4.2009694718640536e-05, "loss": 2.2535, "step": 61952 }, { "epoch": 0.77, "learning_rate": 4.1991023136274856e-05, "loss": 2.2434, "step": 61960 }, { "epoch": 0.77, "learning_rate": 4.197235837482417e-05, "loss": 2.2567, "step": 61968 }, { "epoch": 0.77, "learning_rate": 4.195370043616052e-05, "loss": 2.2599, "step": 61976 }, { "epoch": 0.77, "learning_rate": 4.1935049322155095e-05, "loss": 2.2515, "step": 61984 }, { "epoch": 0.77, "learning_rate": 4.1916405034678604e-05, "loss": 2.2617, "step": 61992 }, { "epoch": 0.78, "learning_rate": 4.1897767575600874e-05, "loss": 2.2603, "step": 62000 }, { "epoch": 0.78, "learning_rate": 4.1879136946791143e-05, "loss": 2.2503, "step": 62008 }, { "epoch": 0.78, "learning_rate": 4.1860513150118035e-05, "loss": 2.2586, "step": 62016 }, { "epoch": 0.78, "learning_rate": 4.1841896187449305e-05, "loss": 2.2535, "step": 62024 }, { "epoch": 0.78, "learning_rate": 4.182328606065221e-05, "loss": 2.2472, "step": 62032 }, { "epoch": 0.78, "learning_rate": 4.180468277159323e-05, "loss": 2.2621, "step": 62040 }, { "epoch": 0.78, "learning_rate": 4.178608632213811e-05, "loss": 2.2315, "step": 62048 }, { "epoch": 0.78, "learning_rate": 4.1767496714152064e-05, "loss": 2.2545, "step": 62056 }, { "epoch": 0.78, "learning_rate": 4.1748913949499416e-05, "loss": 2.2742, "step": 62064 }, { "epoch": 0.78, "learning_rate": 4.1730338030043994e-05, "loss": 2.2555, "step": 62072 }, { "epoch": 0.78, "learning_rate": 4.1711768957648845e-05, "loss": 2.2598, "step": 62080 }, { "epoch": 0.78, "learning_rate": 4.1693206734176296e-05, "loss": 2.2478, "step": 62088 }, { "epoch": 0.78, "learning_rate": 4.167465136148806e-05, "loss": 2.2551, "step": 62096 }, { "epoch": 0.78, "learning_rate": 4.165610284144517e-05, "loss": 2.2649, "step": 62104 }, { "epoch": 0.78, "learning_rate": 4.163756117590789e-05, "loss": 2.2677, "step": 62112 }, { "epoch": 0.78, "learning_rate": 4.161902636673586e-05, "loss": 2.2593, "step": 62120 }, { "epoch": 0.78, "learning_rate": 4.1600498415788034e-05, "loss": 2.2702, "step": 62128 }, { "epoch": 0.78, "learning_rate": 4.1581977324922624e-05, "loss": 2.2607, "step": 62136 }, { "epoch": 0.78, "learning_rate": 4.156346309599723e-05, "loss": 2.2665, "step": 62144 }, { "epoch": 0.78, "learning_rate": 4.1544955730868694e-05, "loss": 2.2388, "step": 62152 }, { "epoch": 0.78, "learning_rate": 4.152645523139321e-05, "loss": 2.2649, "step": 62160 }, { "epoch": 0.78, "learning_rate": 4.150796159942627e-05, "loss": 2.263, "step": 62168 }, { "epoch": 0.78, "learning_rate": 4.148947483682268e-05, "loss": 2.2682, "step": 62176 }, { "epoch": 0.78, "learning_rate": 4.147099494543658e-05, "loss": 2.252, "step": 62184 }, { "epoch": 0.78, "learning_rate": 4.145252192712138e-05, "loss": 2.2785, "step": 62192 }, { "epoch": 0.78, "learning_rate": 4.14340557837298e-05, "loss": 2.2498, "step": 62200 }, { "epoch": 0.78, "learning_rate": 4.1415596517113925e-05, "loss": 2.2553, "step": 62208 }, { "epoch": 0.78, "learning_rate": 4.139714412912509e-05, "loss": 2.2561, "step": 62216 }, { "epoch": 0.78, "learning_rate": 4.137869862161398e-05, "loss": 2.2609, "step": 62224 }, { "epoch": 0.78, "learning_rate": 4.1360259996430564e-05, "loss": 2.245, "step": 62232 }, { "epoch": 0.78, "learning_rate": 4.134182825542411e-05, "loss": 2.2614, "step": 62240 }, { "epoch": 0.78, "learning_rate": 4.1323403400443296e-05, "loss": 2.2846, "step": 62248 }, { "epoch": 0.78, "learning_rate": 4.130498543333593e-05, "loss": 2.2513, "step": 62256 }, { "epoch": 0.78, "learning_rate": 4.1286574355949314e-05, "loss": 2.2461, "step": 62264 }, { "epoch": 0.78, "learning_rate": 4.126817017012993e-05, "loss": 2.2721, "step": 62272 }, { "epoch": 0.78, "learning_rate": 4.124977287772359e-05, "loss": 2.2653, "step": 62280 }, { "epoch": 0.78, "learning_rate": 4.1231382480575524e-05, "loss": 2.2457, "step": 62288 }, { "epoch": 0.78, "learning_rate": 4.121299898053008e-05, "loss": 2.2585, "step": 62296 }, { "epoch": 0.78, "learning_rate": 4.119462237943108e-05, "loss": 2.2635, "step": 62304 }, { "epoch": 0.78, "learning_rate": 4.117625267912163e-05, "loss": 2.2699, "step": 62312 }, { "epoch": 0.78, "learning_rate": 4.1157889881444004e-05, "loss": 2.2559, "step": 62320 }, { "epoch": 0.78, "learning_rate": 4.1139533988239985e-05, "loss": 2.2532, "step": 62328 }, { "epoch": 0.78, "learning_rate": 4.112118500135047e-05, "loss": 2.2463, "step": 62336 }, { "epoch": 0.78, "learning_rate": 4.110284292261585e-05, "loss": 2.2604, "step": 62344 }, { "epoch": 0.78, "learning_rate": 4.1084507753875696e-05, "loss": 2.2707, "step": 62352 }, { "epoch": 0.78, "learning_rate": 4.106617949696888e-05, "loss": 2.2383, "step": 62360 }, { "epoch": 0.78, "learning_rate": 4.1047858153733684e-05, "loss": 2.2677, "step": 62368 }, { "epoch": 0.78, "learning_rate": 4.102954372600761e-05, "loss": 2.2536, "step": 62376 }, { "epoch": 0.78, "learning_rate": 4.10112362156275e-05, "loss": 2.2531, "step": 62384 }, { "epoch": 0.78, "learning_rate": 4.09929356244295e-05, "loss": 2.2628, "step": 62392 }, { "epoch": 0.78, "learning_rate": 4.097464195424899e-05, "loss": 2.2542, "step": 62400 }, { "epoch": 0.78, "learning_rate": 4.09563552069208e-05, "loss": 2.2359, "step": 62408 }, { "epoch": 0.78, "learning_rate": 4.093807538427897e-05, "loss": 2.2563, "step": 62416 }, { "epoch": 0.78, "learning_rate": 4.0919802488156844e-05, "loss": 2.2642, "step": 62424 }, { "epoch": 0.78, "learning_rate": 4.09015365203871e-05, "loss": 2.2693, "step": 62432 }, { "epoch": 0.78, "learning_rate": 4.0883277482801705e-05, "loss": 2.2307, "step": 62440 }, { "epoch": 0.78, "learning_rate": 4.086502537723195e-05, "loss": 2.2605, "step": 62448 }, { "epoch": 0.78, "learning_rate": 4.0846780205508396e-05, "loss": 2.2482, "step": 62456 }, { "epoch": 0.78, "learning_rate": 4.0828541969460964e-05, "loss": 2.2555, "step": 62464 }, { "epoch": 0.78, "learning_rate": 4.0810310670918784e-05, "loss": 2.2676, "step": 62472 }, { "epoch": 0.78, "learning_rate": 4.079208631171044e-05, "loss": 2.2492, "step": 62480 }, { "epoch": 0.78, "learning_rate": 4.077386889366367e-05, "loss": 2.2502, "step": 62488 }, { "epoch": 0.78, "learning_rate": 4.0755658418605606e-05, "loss": 2.2556, "step": 62496 }, { "epoch": 0.78, "learning_rate": 4.073745488836263e-05, "loss": 2.2733, "step": 62504 }, { "epoch": 0.78, "learning_rate": 4.071925830476043e-05, "loss": 2.2669, "step": 62512 }, { "epoch": 0.78, "learning_rate": 4.070106866962411e-05, "loss": 2.2576, "step": 62520 }, { "epoch": 0.78, "learning_rate": 4.068288598477792e-05, "loss": 2.2472, "step": 62528 }, { "epoch": 0.78, "learning_rate": 4.066471025204546e-05, "loss": 2.2684, "step": 62536 }, { "epoch": 0.78, "learning_rate": 4.0646541473249725e-05, "loss": 2.2563, "step": 62544 }, { "epoch": 0.78, "learning_rate": 4.062837965021287e-05, "loss": 2.2587, "step": 62552 }, { "epoch": 0.78, "learning_rate": 4.06102247847565e-05, "loss": 2.2531, "step": 62560 }, { "epoch": 0.78, "learning_rate": 4.059207687870137e-05, "loss": 2.2544, "step": 62568 }, { "epoch": 0.78, "learning_rate": 4.057393593386761e-05, "loss": 2.2436, "step": 62576 }, { "epoch": 0.78, "learning_rate": 4.0555801952074755e-05, "loss": 2.2714, "step": 62584 }, { "epoch": 0.78, "learning_rate": 4.053767493514142e-05, "loss": 2.2368, "step": 62592 }, { "epoch": 0.78, "learning_rate": 4.05195548848857e-05, "loss": 2.2374, "step": 62600 }, { "epoch": 0.78, "learning_rate": 4.050144180312494e-05, "loss": 2.2551, "step": 62608 }, { "epoch": 0.78, "learning_rate": 4.048333569167577e-05, "loss": 2.2436, "step": 62616 }, { "epoch": 0.78, "learning_rate": 4.046523655235415e-05, "loss": 2.2603, "step": 62624 }, { "epoch": 0.78, "learning_rate": 4.044714438697525e-05, "loss": 2.251, "step": 62632 }, { "epoch": 0.78, "learning_rate": 4.042905919735367e-05, "loss": 2.247, "step": 62640 }, { "epoch": 0.78, "learning_rate": 4.041098098530326e-05, "loss": 2.2539, "step": 62648 }, { "epoch": 0.78, "learning_rate": 4.039290975263714e-05, "loss": 2.2494, "step": 62656 }, { "epoch": 0.78, "learning_rate": 4.0374845501167746e-05, "loss": 2.2513, "step": 62664 }, { "epoch": 0.78, "learning_rate": 4.0356788232706846e-05, "loss": 2.249, "step": 62672 }, { "epoch": 0.78, "learning_rate": 4.0338737949065454e-05, "loss": 2.246, "step": 62680 }, { "epoch": 0.78, "learning_rate": 4.032069465205392e-05, "loss": 2.2685, "step": 62688 }, { "epoch": 0.78, "learning_rate": 4.0302658343481904e-05, "loss": 2.2632, "step": 62696 }, { "epoch": 0.78, "learning_rate": 4.028462902515832e-05, "loss": 2.2604, "step": 62704 }, { "epoch": 0.78, "learning_rate": 4.026660669889141e-05, "loss": 2.2596, "step": 62712 }, { "epoch": 0.78, "learning_rate": 4.024859136648872e-05, "loss": 2.243, "step": 62720 }, { "epoch": 0.78, "learning_rate": 4.023058302975709e-05, "loss": 2.2712, "step": 62728 }, { "epoch": 0.78, "learning_rate": 4.021258169050264e-05, "loss": 2.2811, "step": 62736 }, { "epoch": 0.78, "learning_rate": 4.019458735053081e-05, "loss": 2.2775, "step": 62744 }, { "epoch": 0.78, "learning_rate": 4.017660001164633e-05, "loss": 2.2655, "step": 62752 }, { "epoch": 0.78, "learning_rate": 4.015861967565323e-05, "loss": 2.2531, "step": 62760 }, { "epoch": 0.78, "learning_rate": 4.0140646344354827e-05, "loss": 2.2252, "step": 62768 }, { "epoch": 0.78, "learning_rate": 4.012268001955375e-05, "loss": 2.2527, "step": 62776 }, { "epoch": 0.78, "learning_rate": 4.01047207030519e-05, "loss": 2.2531, "step": 62784 }, { "epoch": 0.78, "learning_rate": 4.008676839665058e-05, "loss": 2.2658, "step": 62792 }, { "epoch": 0.79, "learning_rate": 4.006882310215019e-05, "loss": 2.2371, "step": 62800 }, { "epoch": 0.79, "learning_rate": 4.005088482135058e-05, "loss": 2.2492, "step": 62808 }, { "epoch": 0.79, "learning_rate": 4.003295355605091e-05, "loss": 2.2739, "step": 62816 }, { "epoch": 0.79, "learning_rate": 4.00150293080495e-05, "loss": 2.2658, "step": 62824 }, { "epoch": 0.79, "learning_rate": 3.999711207914414e-05, "loss": 2.2545, "step": 62832 }, { "epoch": 0.79, "learning_rate": 3.9979201871131754e-05, "loss": 2.2576, "step": 62840 }, { "epoch": 0.79, "learning_rate": 3.996129868580864e-05, "loss": 2.2336, "step": 62848 }, { "epoch": 0.79, "learning_rate": 3.9943402524970455e-05, "loss": 2.2617, "step": 62856 }, { "epoch": 0.79, "learning_rate": 3.9925513390411985e-05, "loss": 2.2664, "step": 62864 }, { "epoch": 0.79, "learning_rate": 3.9907631283927486e-05, "loss": 2.2651, "step": 62872 }, { "epoch": 0.79, "learning_rate": 3.9889756207310425e-05, "loss": 2.2607, "step": 62880 }, { "epoch": 0.79, "learning_rate": 3.9871888162353496e-05, "loss": 2.2457, "step": 62888 }, { "epoch": 0.79, "learning_rate": 3.985402715084887e-05, "loss": 2.2694, "step": 62896 }, { "epoch": 0.79, "learning_rate": 3.983617317458781e-05, "loss": 2.2461, "step": 62904 }, { "epoch": 0.79, "learning_rate": 3.981832623536102e-05, "loss": 2.2657, "step": 62912 }, { "epoch": 0.79, "learning_rate": 3.9800486334958475e-05, "loss": 2.2515, "step": 62920 }, { "epoch": 0.79, "learning_rate": 3.978265347516932e-05, "loss": 2.2507, "step": 62928 }, { "epoch": 0.79, "learning_rate": 3.9764827657782175e-05, "loss": 2.2752, "step": 62936 }, { "epoch": 0.79, "learning_rate": 3.974700888458484e-05, "loss": 2.2514, "step": 62944 }, { "epoch": 0.79, "learning_rate": 3.972919715736445e-05, "loss": 2.2614, "step": 62952 }, { "epoch": 0.79, "learning_rate": 3.9711392477907406e-05, "loss": 2.2705, "step": 62960 }, { "epoch": 0.79, "learning_rate": 3.9693594847999404e-05, "loss": 2.2544, "step": 62968 }, { "epoch": 0.79, "learning_rate": 3.967580426942547e-05, "loss": 2.2502, "step": 62976 }, { "epoch": 0.79, "learning_rate": 3.9658020743969895e-05, "loss": 2.2852, "step": 62984 }, { "epoch": 0.79, "learning_rate": 3.964024427341625e-05, "loss": 2.2543, "step": 62992 }, { "epoch": 0.79, "learning_rate": 3.962247485954743e-05, "loss": 2.2518, "step": 63000 }, { "epoch": 0.79, "learning_rate": 3.9604712504145604e-05, "loss": 2.2444, "step": 63008 }, { "epoch": 0.79, "learning_rate": 3.9586957208992215e-05, "loss": 2.2482, "step": 63016 }, { "epoch": 0.79, "learning_rate": 3.956920897586804e-05, "loss": 2.261, "step": 63024 }, { "epoch": 0.79, "learning_rate": 3.9551467806553147e-05, "loss": 2.2724, "step": 63032 }, { "epoch": 0.79, "learning_rate": 3.953373370282682e-05, "loss": 2.261, "step": 63040 }, { "epoch": 0.79, "learning_rate": 3.951600666646774e-05, "loss": 2.2604, "step": 63048 }, { "epoch": 0.79, "learning_rate": 3.949828669925379e-05, "loss": 2.2552, "step": 63056 }, { "epoch": 0.79, "learning_rate": 3.9480573802962205e-05, "loss": 2.257, "step": 63064 }, { "epoch": 0.79, "learning_rate": 3.9462867979369486e-05, "loss": 2.2685, "step": 63072 }, { "epoch": 0.79, "learning_rate": 3.94451692302514e-05, "loss": 2.2647, "step": 63080 }, { "epoch": 0.79, "learning_rate": 3.94274775573831e-05, "loss": 2.248, "step": 63088 }, { "epoch": 0.79, "learning_rate": 3.940979296253889e-05, "loss": 2.2478, "step": 63096 }, { "epoch": 0.79, "learning_rate": 3.939211544749246e-05, "loss": 2.2597, "step": 63104 }, { "epoch": 0.79, "learning_rate": 3.9374445014016766e-05, "loss": 2.2578, "step": 63112 }, { "epoch": 0.79, "learning_rate": 3.9356781663884024e-05, "loss": 2.2628, "step": 63120 }, { "epoch": 0.79, "learning_rate": 3.933912539886585e-05, "loss": 2.2383, "step": 63128 }, { "epoch": 0.79, "learning_rate": 3.9321476220732944e-05, "loss": 2.2429, "step": 63136 }, { "epoch": 0.79, "learning_rate": 3.930383413125553e-05, "loss": 2.2537, "step": 63144 }, { "epoch": 0.79, "learning_rate": 3.9286199132202985e-05, "loss": 2.2699, "step": 63152 }, { "epoch": 0.79, "learning_rate": 3.926857122534394e-05, "loss": 2.2411, "step": 63160 }, { "epoch": 0.79, "learning_rate": 3.9250950412446455e-05, "loss": 2.2642, "step": 63168 }, { "epoch": 0.79, "learning_rate": 3.92333366952777e-05, "loss": 2.2699, "step": 63176 }, { "epoch": 0.79, "learning_rate": 3.921573007560433e-05, "loss": 2.2478, "step": 63184 }, { "epoch": 0.79, "learning_rate": 3.919813055519216e-05, "loss": 2.2579, "step": 63192 }, { "epoch": 0.79, "learning_rate": 3.918053813580627e-05, "loss": 2.2592, "step": 63200 }, { "epoch": 0.79, "learning_rate": 3.916295281921114e-05, "loss": 2.232, "step": 63208 }, { "epoch": 0.79, "learning_rate": 3.914537460717045e-05, "loss": 2.2552, "step": 63216 }, { "epoch": 0.79, "learning_rate": 3.91278035014472e-05, "loss": 2.2382, "step": 63224 }, { "epoch": 0.79, "learning_rate": 3.9110239503803715e-05, "loss": 2.2551, "step": 63232 }, { "epoch": 0.79, "learning_rate": 3.9092682616001475e-05, "loss": 2.2595, "step": 63240 }, { "epoch": 0.79, "learning_rate": 3.9075132839801396e-05, "loss": 2.2453, "step": 63248 }, { "epoch": 0.79, "learning_rate": 3.9057590176963624e-05, "loss": 2.2366, "step": 63256 }, { "epoch": 0.79, "learning_rate": 3.904005462924756e-05, "loss": 2.2633, "step": 63264 }, { "epoch": 0.79, "learning_rate": 3.902252619841196e-05, "loss": 2.2609, "step": 63272 }, { "epoch": 0.79, "learning_rate": 3.900500488621478e-05, "loss": 2.2544, "step": 63280 }, { "epoch": 0.79, "learning_rate": 3.898749069441333e-05, "loss": 2.2483, "step": 63288 }, { "epoch": 0.79, "learning_rate": 3.8969983624764205e-05, "loss": 2.2483, "step": 63296 }, { "epoch": 0.79, "learning_rate": 3.895248367902322e-05, "loss": 2.2599, "step": 63304 }, { "epoch": 0.79, "learning_rate": 3.8934990858945536e-05, "loss": 2.236, "step": 63312 }, { "epoch": 0.79, "learning_rate": 3.8917505166285634e-05, "loss": 2.2378, "step": 63320 }, { "epoch": 0.79, "learning_rate": 3.890002660279717e-05, "loss": 2.2526, "step": 63328 }, { "epoch": 0.79, "learning_rate": 3.888255517023316e-05, "loss": 2.241, "step": 63336 }, { "epoch": 0.79, "learning_rate": 3.886509087034589e-05, "loss": 2.2386, "step": 63344 }, { "epoch": 0.79, "learning_rate": 3.884763370488691e-05, "loss": 2.2412, "step": 63352 }, { "epoch": 0.79, "learning_rate": 3.8830183675607146e-05, "loss": 2.249, "step": 63360 }, { "epoch": 0.79, "learning_rate": 3.8812740784256664e-05, "loss": 2.2372, "step": 63368 }, { "epoch": 0.79, "learning_rate": 3.8795305032584895e-05, "loss": 2.2585, "step": 63376 }, { "epoch": 0.79, "learning_rate": 3.8777876422340597e-05, "loss": 2.2643, "step": 63384 }, { "epoch": 0.79, "learning_rate": 3.8760454955271686e-05, "loss": 2.2563, "step": 63392 }, { "epoch": 0.79, "learning_rate": 3.874304063312554e-05, "loss": 2.2698, "step": 63400 }, { "epoch": 0.79, "learning_rate": 3.8725633457648606e-05, "loss": 2.2651, "step": 63408 }, { "epoch": 0.79, "learning_rate": 3.870823343058676e-05, "loss": 2.2585, "step": 63416 }, { "epoch": 0.79, "learning_rate": 3.869084055368519e-05, "loss": 2.2734, "step": 63424 }, { "epoch": 0.79, "learning_rate": 3.86734548286882e-05, "loss": 2.2171, "step": 63432 }, { "epoch": 0.79, "learning_rate": 3.8656076257339565e-05, "loss": 2.2314, "step": 63440 }, { "epoch": 0.79, "learning_rate": 3.8638704841382246e-05, "loss": 2.2491, "step": 63448 }, { "epoch": 0.79, "learning_rate": 3.862134058255842e-05, "loss": 2.2397, "step": 63456 }, { "epoch": 0.79, "learning_rate": 3.860398348260973e-05, "loss": 2.2586, "step": 63464 }, { "epoch": 0.79, "learning_rate": 3.85866335432769e-05, "loss": 2.2448, "step": 63472 }, { "epoch": 0.79, "learning_rate": 3.85692907663001e-05, "loss": 2.2707, "step": 63480 }, { "epoch": 0.79, "learning_rate": 3.855195515341868e-05, "loss": 2.262, "step": 63488 }, { "epoch": 0.79, "learning_rate": 3.8534626706371315e-05, "loss": 2.2364, "step": 63496 }, { "epoch": 0.79, "learning_rate": 3.851730542689596e-05, "loss": 2.2687, "step": 63504 }, { "epoch": 0.79, "learning_rate": 3.8499991316729806e-05, "loss": 2.255, "step": 63512 }, { "epoch": 0.79, "learning_rate": 3.848268437760939e-05, "loss": 2.2539, "step": 63520 }, { "epoch": 0.79, "learning_rate": 3.84653846112705e-05, "loss": 2.2664, "step": 63528 }, { "epoch": 0.79, "learning_rate": 3.844809201944818e-05, "loss": 2.2718, "step": 63536 }, { "epoch": 0.79, "learning_rate": 3.843080660387681e-05, "loss": 2.2543, "step": 63544 }, { "epoch": 0.79, "learning_rate": 3.841352836629e-05, "loss": 2.2224, "step": 63552 }, { "epoch": 0.79, "learning_rate": 3.839625730842066e-05, "loss": 2.2453, "step": 63560 }, { "epoch": 0.79, "learning_rate": 3.837899343200097e-05, "loss": 2.2485, "step": 63568 }, { "epoch": 0.79, "learning_rate": 3.836173673876243e-05, "loss": 2.2686, "step": 63576 }, { "epoch": 0.79, "learning_rate": 3.834448723043577e-05, "loss": 2.2521, "step": 63584 }, { "epoch": 0.79, "learning_rate": 3.8327244908751015e-05, "loss": 2.2661, "step": 63592 }, { "epoch": 0.8, "learning_rate": 3.831000977543747e-05, "loss": 2.2494, "step": 63600 }, { "epoch": 0.8, "learning_rate": 3.829278183222374e-05, "loss": 2.2559, "step": 63608 }, { "epoch": 0.8, "learning_rate": 3.827556108083766e-05, "loss": 2.2786, "step": 63616 }, { "epoch": 0.8, "learning_rate": 3.8258347523006397e-05, "loss": 2.2652, "step": 63624 }, { "epoch": 0.8, "learning_rate": 3.824114116045637e-05, "loss": 2.2656, "step": 63632 }, { "epoch": 0.8, "learning_rate": 3.822394199491327e-05, "loss": 2.2472, "step": 63640 }, { "epoch": 0.8, "learning_rate": 3.8206750028102064e-05, "loss": 2.2537, "step": 63648 }, { "epoch": 0.8, "learning_rate": 3.818956526174708e-05, "loss": 2.2385, "step": 63656 }, { "epoch": 0.8, "learning_rate": 3.8172387697571746e-05, "loss": 2.2725, "step": 63664 }, { "epoch": 0.8, "learning_rate": 3.815521733729898e-05, "loss": 2.2616, "step": 63672 }, { "epoch": 0.8, "learning_rate": 3.813805418265079e-05, "loss": 2.2306, "step": 63680 }, { "epoch": 0.8, "learning_rate": 3.812089823534854e-05, "loss": 2.2621, "step": 63688 }, { "epoch": 0.8, "learning_rate": 3.810374949711298e-05, "loss": 2.2492, "step": 63696 }, { "epoch": 0.8, "learning_rate": 3.80866079696639e-05, "loss": 2.2443, "step": 63704 }, { "epoch": 0.8, "learning_rate": 3.806947365472058e-05, "loss": 2.2489, "step": 63712 }, { "epoch": 0.8, "learning_rate": 3.805234655400149e-05, "loss": 2.2356, "step": 63720 }, { "epoch": 0.8, "learning_rate": 3.803522666922432e-05, "loss": 2.2473, "step": 63728 }, { "epoch": 0.8, "learning_rate": 3.801811400210619e-05, "loss": 2.264, "step": 63736 }, { "epoch": 0.8, "learning_rate": 3.8001008554363304e-05, "loss": 2.2453, "step": 63744 }, { "epoch": 0.8, "learning_rate": 3.7983910327711316e-05, "loss": 2.2666, "step": 63752 }, { "epoch": 0.8, "learning_rate": 3.7966819323865076e-05, "loss": 2.2603, "step": 63760 }, { "epoch": 0.8, "learning_rate": 3.794973554453865e-05, "loss": 2.2462, "step": 63768 }, { "epoch": 0.8, "learning_rate": 3.7932658991445514e-05, "loss": 2.2478, "step": 63776 }, { "epoch": 0.8, "learning_rate": 3.7915589666298325e-05, "loss": 2.276, "step": 63784 }, { "epoch": 0.8, "learning_rate": 3.789852757080904e-05, "loss": 2.2476, "step": 63792 }, { "epoch": 0.8, "learning_rate": 3.7881472706688915e-05, "loss": 2.2345, "step": 63800 }, { "epoch": 0.8, "learning_rate": 3.786442507564838e-05, "loss": 2.2661, "step": 63808 }, { "epoch": 0.8, "learning_rate": 3.784738467939729e-05, "loss": 2.257, "step": 63816 }, { "epoch": 0.8, "learning_rate": 3.783035151964469e-05, "loss": 2.2543, "step": 63824 }, { "epoch": 0.8, "learning_rate": 3.781332559809889e-05, "loss": 2.2584, "step": 63832 }, { "epoch": 0.8, "learning_rate": 3.7796306916467496e-05, "loss": 2.2477, "step": 63840 }, { "epoch": 0.8, "learning_rate": 3.777929547645739e-05, "loss": 2.2567, "step": 63848 }, { "epoch": 0.8, "learning_rate": 3.776229127977472e-05, "loss": 2.2557, "step": 63856 }, { "epoch": 0.8, "learning_rate": 3.774529432812492e-05, "loss": 2.2505, "step": 63864 }, { "epoch": 0.8, "learning_rate": 3.7728304623212684e-05, "loss": 2.2724, "step": 63872 }, { "epoch": 0.8, "learning_rate": 3.771132216674197e-05, "loss": 2.2566, "step": 63880 }, { "epoch": 0.8, "learning_rate": 3.769434696041604e-05, "loss": 2.2562, "step": 63888 }, { "epoch": 0.8, "learning_rate": 3.76773790059374e-05, "loss": 2.2545, "step": 63896 }, { "epoch": 0.8, "learning_rate": 3.7660418305007835e-05, "loss": 2.2454, "step": 63904 }, { "epoch": 0.8, "learning_rate": 3.7643464859328425e-05, "loss": 2.2442, "step": 63912 }, { "epoch": 0.8, "learning_rate": 3.762651867059947e-05, "loss": 2.2221, "step": 63920 }, { "epoch": 0.8, "learning_rate": 3.760957974052066e-05, "loss": 2.2512, "step": 63928 }, { "epoch": 0.8, "learning_rate": 3.759264807079077e-05, "loss": 2.253, "step": 63936 }, { "epoch": 0.8, "learning_rate": 3.7575723663108006e-05, "loss": 2.2698, "step": 63944 }, { "epoch": 0.8, "learning_rate": 3.755880651916979e-05, "loss": 2.2576, "step": 63952 }, { "epoch": 0.8, "learning_rate": 3.7541896640672766e-05, "loss": 2.2655, "step": 63960 }, { "epoch": 0.8, "learning_rate": 3.7524994029313e-05, "loss": 2.2589, "step": 63968 }, { "epoch": 0.8, "learning_rate": 3.750809868678564e-05, "loss": 2.2304, "step": 63976 }, { "epoch": 0.8, "learning_rate": 3.7491210614785185e-05, "loss": 2.2762, "step": 63984 }, { "epoch": 0.8, "learning_rate": 3.747432981500551e-05, "loss": 2.2409, "step": 63992 }, { "epoch": 0.8, "learning_rate": 3.745745628913954e-05, "loss": 2.2408, "step": 64000 }, { "epoch": 0.8, "learning_rate": 3.7440590038879715e-05, "loss": 2.2466, "step": 64008 }, { "epoch": 0.8, "learning_rate": 3.742373106591751e-05, "loss": 2.247, "step": 64016 }, { "epoch": 0.8, "learning_rate": 3.740687937194387e-05, "loss": 2.2467, "step": 64024 }, { "epoch": 0.8, "learning_rate": 3.7390034958648904e-05, "loss": 2.2718, "step": 64032 }, { "epoch": 0.8, "learning_rate": 3.737319782772196e-05, "loss": 2.2464, "step": 64040 }, { "epoch": 0.8, "learning_rate": 3.735636798085178e-05, "loss": 2.2592, "step": 64048 }, { "epoch": 0.8, "learning_rate": 3.7339545419726266e-05, "loss": 2.2535, "step": 64056 }, { "epoch": 0.8, "learning_rate": 3.732273014603262e-05, "loss": 2.2612, "step": 64064 }, { "epoch": 0.8, "learning_rate": 3.730592216145736e-05, "loss": 2.2463, "step": 64072 }, { "epoch": 0.8, "learning_rate": 3.728912146768616e-05, "loss": 2.2653, "step": 64080 }, { "epoch": 0.8, "learning_rate": 3.7272328066404085e-05, "loss": 2.2714, "step": 64088 }, { "epoch": 0.8, "learning_rate": 3.72555419592954e-05, "loss": 2.2461, "step": 64096 }, { "epoch": 0.8, "learning_rate": 3.723876314804368e-05, "loss": 2.2623, "step": 64104 }, { "epoch": 0.8, "learning_rate": 3.722199163433173e-05, "loss": 2.26, "step": 64112 }, { "epoch": 0.8, "learning_rate": 3.7205227419841626e-05, "loss": 2.2644, "step": 64120 }, { "epoch": 0.8, "learning_rate": 3.718847050625475e-05, "loss": 2.2504, "step": 64128 }, { "epoch": 0.8, "learning_rate": 3.717172089525169e-05, "loss": 2.24, "step": 64136 }, { "epoch": 0.8, "learning_rate": 3.715497858851236e-05, "loss": 2.2622, "step": 64144 }, { "epoch": 0.8, "learning_rate": 3.713824358771592e-05, "loss": 2.2697, "step": 64152 }, { "epoch": 0.8, "learning_rate": 3.712151589454079e-05, "loss": 2.2482, "step": 64160 }, { "epoch": 0.8, "learning_rate": 3.7104795510664655e-05, "loss": 2.247, "step": 64168 }, { "epoch": 0.8, "learning_rate": 3.7088082437764495e-05, "loss": 2.2649, "step": 64176 }, { "epoch": 0.8, "learning_rate": 3.707137667751652e-05, "loss": 2.2513, "step": 64184 }, { "epoch": 0.8, "learning_rate": 3.705467823159621e-05, "loss": 2.2519, "step": 64192 }, { "epoch": 0.8, "learning_rate": 3.703798710167838e-05, "loss": 2.2748, "step": 64200 }, { "epoch": 0.8, "learning_rate": 3.7021303289437005e-05, "loss": 2.2475, "step": 64208 }, { "epoch": 0.8, "learning_rate": 3.700462679654536e-05, "loss": 2.2333, "step": 64216 }, { "epoch": 0.8, "learning_rate": 3.698795762467607e-05, "loss": 2.2512, "step": 64224 }, { "epoch": 0.8, "learning_rate": 3.697129577550089e-05, "loss": 2.2531, "step": 64232 }, { "epoch": 0.8, "learning_rate": 3.695464125069098e-05, "loss": 2.2628, "step": 64240 }, { "epoch": 0.8, "learning_rate": 3.693799405191664e-05, "loss": 2.2456, "step": 64248 }, { "epoch": 0.8, "learning_rate": 3.6921354180847466e-05, "loss": 2.2515, "step": 64256 }, { "epoch": 0.8, "learning_rate": 3.690472163915244e-05, "loss": 2.2638, "step": 64264 }, { "epoch": 0.8, "learning_rate": 3.688809642849961e-05, "loss": 2.2597, "step": 64272 }, { "epoch": 0.8, "learning_rate": 3.6871478550556434e-05, "loss": 2.2344, "step": 64280 }, { "epoch": 0.8, "learning_rate": 3.685486800698963e-05, "loss": 2.2565, "step": 64288 }, { "epoch": 0.8, "learning_rate": 3.683826479946506e-05, "loss": 2.2629, "step": 64296 }, { "epoch": 0.8, "learning_rate": 3.6821668929648014e-05, "loss": 2.2205, "step": 64304 }, { "epoch": 0.8, "learning_rate": 3.680508039920288e-05, "loss": 2.257, "step": 64312 }, { "epoch": 0.8, "learning_rate": 3.6788499209793445e-05, "loss": 2.2642, "step": 64320 }, { "epoch": 0.8, "learning_rate": 3.677192536308274e-05, "loss": 2.2347, "step": 64328 }, { "epoch": 0.8, "learning_rate": 3.6755358860732935e-05, "loss": 2.2588, "step": 64336 }, { "epoch": 0.8, "learning_rate": 3.6738799704405635e-05, "loss": 2.2537, "step": 64344 }, { "epoch": 0.8, "learning_rate": 3.6722247895761595e-05, "loss": 2.2535, "step": 64352 }, { "epoch": 0.8, "learning_rate": 3.670570343646089e-05, "loss": 2.2876, "step": 64360 }, { "epoch": 0.8, "learning_rate": 3.668916632816282e-05, "loss": 2.2425, "step": 64368 }, { "epoch": 0.8, "learning_rate": 3.667263657252595e-05, "loss": 2.2708, "step": 64376 }, { "epoch": 0.8, "learning_rate": 3.6656114171208155e-05, "loss": 2.2679, "step": 64384 }, { "epoch": 0.8, "learning_rate": 3.6639599125866505e-05, "loss": 2.2559, "step": 64392 }, { "epoch": 0.81, "learning_rate": 3.6623091438157384e-05, "loss": 2.2657, "step": 64400 }, { "epoch": 0.81, "learning_rate": 3.660659110973642e-05, "loss": 2.2385, "step": 64408 }, { "epoch": 0.81, "learning_rate": 3.6590098142258494e-05, "loss": 2.2497, "step": 64416 }, { "epoch": 0.81, "learning_rate": 3.6573612537377764e-05, "loss": 2.2447, "step": 64424 }, { "epoch": 0.81, "learning_rate": 3.655713429674764e-05, "loss": 2.2683, "step": 64432 }, { "epoch": 0.81, "learning_rate": 3.6540663422020796e-05, "loss": 2.2629, "step": 64440 }, { "epoch": 0.81, "learning_rate": 3.652419991484916e-05, "loss": 2.2558, "step": 64448 }, { "epoch": 0.81, "learning_rate": 3.650774377688394e-05, "loss": 2.2449, "step": 64456 }, { "epoch": 0.81, "learning_rate": 3.649129500977558e-05, "loss": 2.2561, "step": 64464 }, { "epoch": 0.81, "learning_rate": 3.647485361517383e-05, "loss": 2.2625, "step": 64472 }, { "epoch": 0.81, "learning_rate": 3.645841959472763e-05, "loss": 2.2563, "step": 64480 }, { "epoch": 0.81, "learning_rate": 3.644199295008521e-05, "loss": 2.2601, "step": 64488 }, { "epoch": 0.81, "learning_rate": 3.642557368289414e-05, "loss": 2.2591, "step": 64496 }, { "epoch": 0.81, "learning_rate": 3.6409161794801125e-05, "loss": 2.2672, "step": 64504 }, { "epoch": 0.81, "learning_rate": 3.639275728745218e-05, "loss": 2.2461, "step": 64512 }, { "epoch": 0.81, "learning_rate": 3.63763601624926e-05, "loss": 2.2313, "step": 64520 }, { "epoch": 0.81, "learning_rate": 3.6359970421566904e-05, "loss": 2.259, "step": 64528 }, { "epoch": 0.81, "learning_rate": 3.634358806631895e-05, "loss": 2.2748, "step": 64536 }, { "epoch": 0.81, "learning_rate": 3.63272130983917e-05, "loss": 2.2577, "step": 64544 }, { "epoch": 0.81, "learning_rate": 3.631084551942755e-05, "loss": 2.2318, "step": 64552 }, { "epoch": 0.81, "learning_rate": 3.629448533106808e-05, "loss": 2.2644, "step": 64560 }, { "epoch": 0.81, "learning_rate": 3.627813253495404e-05, "loss": 2.2419, "step": 64568 }, { "epoch": 0.81, "learning_rate": 3.6261787132725614e-05, "loss": 2.2657, "step": 64576 }, { "epoch": 0.81, "learning_rate": 3.624544912602209e-05, "loss": 2.2399, "step": 64584 }, { "epoch": 0.81, "learning_rate": 3.6229118516482105e-05, "loss": 2.2702, "step": 64592 }, { "epoch": 0.81, "learning_rate": 3.6212795305743555e-05, "loss": 2.2537, "step": 64600 }, { "epoch": 0.81, "learning_rate": 3.619647949544349e-05, "loss": 2.2365, "step": 64608 }, { "epoch": 0.81, "learning_rate": 3.618017108721836e-05, "loss": 2.2607, "step": 64616 }, { "epoch": 0.81, "learning_rate": 3.6163870082703774e-05, "loss": 2.2725, "step": 64624 }, { "epoch": 0.81, "learning_rate": 3.6147576483534654e-05, "loss": 2.2457, "step": 64632 }, { "epoch": 0.81, "learning_rate": 3.613129029134516e-05, "loss": 2.2436, "step": 64640 }, { "epoch": 0.81, "learning_rate": 3.611501150776864e-05, "loss": 2.2593, "step": 64648 }, { "epoch": 0.81, "learning_rate": 3.609874013443783e-05, "loss": 2.2728, "step": 64656 }, { "epoch": 0.81, "learning_rate": 3.608247617298464e-05, "loss": 2.2583, "step": 64664 }, { "epoch": 0.81, "learning_rate": 3.606621962504025e-05, "loss": 2.2427, "step": 64672 }, { "epoch": 0.81, "learning_rate": 3.6049970492235105e-05, "loss": 2.2705, "step": 64680 }, { "epoch": 0.81, "learning_rate": 3.6033728776198885e-05, "loss": 2.2494, "step": 64688 }, { "epoch": 0.81, "learning_rate": 3.601749447856055e-05, "loss": 2.251, "step": 64696 }, { "epoch": 0.81, "learning_rate": 3.600126760094832e-05, "loss": 2.2487, "step": 64704 }, { "epoch": 0.81, "learning_rate": 3.598504814498965e-05, "loss": 2.2637, "step": 64712 }, { "epoch": 0.81, "learning_rate": 3.596883611231127e-05, "loss": 2.2462, "step": 64720 }, { "epoch": 0.81, "learning_rate": 3.595263150453912e-05, "loss": 2.2461, "step": 64728 }, { "epoch": 0.81, "learning_rate": 3.593643432329847e-05, "loss": 2.2423, "step": 64736 }, { "epoch": 0.81, "learning_rate": 3.592024457021379e-05, "loss": 2.2682, "step": 64744 }, { "epoch": 0.81, "learning_rate": 3.590406224690881e-05, "loss": 2.2445, "step": 64752 }, { "epoch": 0.81, "learning_rate": 3.5887887355006535e-05, "loss": 2.2356, "step": 64760 }, { "epoch": 0.81, "learning_rate": 3.587171989612924e-05, "loss": 2.2436, "step": 64768 }, { "epoch": 0.81, "learning_rate": 3.585555987189839e-05, "loss": 2.2796, "step": 64776 }, { "epoch": 0.81, "learning_rate": 3.5839407283934755e-05, "loss": 2.2481, "step": 64784 }, { "epoch": 0.81, "learning_rate": 3.582326213385836e-05, "loss": 2.2455, "step": 64792 }, { "epoch": 0.81, "learning_rate": 3.580712442328843e-05, "loss": 2.2446, "step": 64800 }, { "epoch": 0.81, "learning_rate": 3.579099415384358e-05, "loss": 2.2534, "step": 64808 }, { "epoch": 0.81, "learning_rate": 3.577487132714149e-05, "loss": 2.2649, "step": 64816 }, { "epoch": 0.81, "learning_rate": 3.57587559447992e-05, "loss": 2.2531, "step": 64824 }, { "epoch": 0.81, "learning_rate": 3.574264800843308e-05, "loss": 2.2536, "step": 64832 }, { "epoch": 0.81, "learning_rate": 3.5726547519658534e-05, "loss": 2.2644, "step": 64840 }, { "epoch": 0.81, "learning_rate": 3.5710454480090465e-05, "loss": 2.2795, "step": 64848 }, { "epoch": 0.81, "learning_rate": 3.5694368891342854e-05, "loss": 2.234, "step": 64856 }, { "epoch": 0.81, "learning_rate": 3.567829075502897e-05, "loss": 2.253, "step": 64864 }, { "epoch": 0.81, "learning_rate": 3.566222007276143e-05, "loss": 2.2643, "step": 64872 }, { "epoch": 0.81, "learning_rate": 3.564615684615196e-05, "loss": 2.226, "step": 64880 }, { "epoch": 0.81, "learning_rate": 3.563010107681167e-05, "loss": 2.2592, "step": 64888 }, { "epoch": 0.81, "learning_rate": 3.561405276635085e-05, "loss": 2.2527, "step": 64896 }, { "epoch": 0.81, "learning_rate": 3.5598011916379023e-05, "loss": 2.2555, "step": 64904 }, { "epoch": 0.81, "learning_rate": 3.558197852850505e-05, "loss": 2.2412, "step": 64912 }, { "epoch": 0.81, "learning_rate": 3.5565952604336907e-05, "loss": 2.2661, "step": 64920 }, { "epoch": 0.81, "learning_rate": 3.5549934145481964e-05, "loss": 2.2588, "step": 64928 }, { "epoch": 0.81, "learning_rate": 3.553392315354678e-05, "loss": 2.2455, "step": 64936 }, { "epoch": 0.81, "learning_rate": 3.551791963013715e-05, "loss": 2.2435, "step": 64944 }, { "epoch": 0.81, "learning_rate": 3.5501923576858144e-05, "loss": 2.27, "step": 64952 }, { "epoch": 0.81, "learning_rate": 3.5485934995314086e-05, "loss": 2.2567, "step": 64960 }, { "epoch": 0.81, "learning_rate": 3.546995388710852e-05, "loss": 2.2376, "step": 64968 }, { "epoch": 0.81, "learning_rate": 3.5453980253844256e-05, "loss": 2.2438, "step": 64976 }, { "epoch": 0.81, "learning_rate": 3.543801409712339e-05, "loss": 2.2538, "step": 64984 }, { "epoch": 0.81, "learning_rate": 3.542205541854721e-05, "loss": 2.2501, "step": 64992 }, { "epoch": 0.81, "learning_rate": 3.5406104219716285e-05, "loss": 2.2693, "step": 65000 }, { "epoch": 0.81, "learning_rate": 3.539016050223044e-05, "loss": 2.2487, "step": 65008 }, { "epoch": 0.81, "learning_rate": 3.5374224267688734e-05, "loss": 2.2502, "step": 65016 }, { "epoch": 0.81, "learning_rate": 3.535829551768948e-05, "loss": 2.2756, "step": 65024 }, { "epoch": 0.81, "learning_rate": 3.534237425383023e-05, "loss": 2.2657, "step": 65032 }, { "epoch": 0.81, "learning_rate": 3.532646047770784e-05, "loss": 2.2596, "step": 65040 }, { "epoch": 0.81, "learning_rate": 3.531055419091832e-05, "loss": 2.246, "step": 65048 }, { "epoch": 0.81, "learning_rate": 3.529465539505698e-05, "loss": 2.2376, "step": 65056 }, { "epoch": 0.81, "learning_rate": 3.527876409171844e-05, "loss": 2.2415, "step": 65064 }, { "epoch": 0.81, "learning_rate": 3.5262880282496434e-05, "loss": 2.2532, "step": 65072 }, { "epoch": 0.81, "learning_rate": 3.5247003968984094e-05, "loss": 2.254, "step": 65080 }, { "epoch": 0.81, "learning_rate": 3.5231135152773645e-05, "loss": 2.2552, "step": 65088 }, { "epoch": 0.81, "learning_rate": 3.521527383545667e-05, "loss": 2.2534, "step": 65096 }, { "epoch": 0.81, "learning_rate": 3.519942001862402e-05, "loss": 2.2501, "step": 65104 }, { "epoch": 0.81, "learning_rate": 3.5183573703865656e-05, "loss": 2.2675, "step": 65112 }, { "epoch": 0.81, "learning_rate": 3.516773489277092e-05, "loss": 2.2428, "step": 65120 }, { "epoch": 0.81, "learning_rate": 3.5151903586928394e-05, "loss": 2.2215, "step": 65128 }, { "epoch": 0.81, "learning_rate": 3.513607978792577e-05, "loss": 2.2473, "step": 65136 }, { "epoch": 0.81, "learning_rate": 3.512026349735019e-05, "loss": 2.2516, "step": 65144 }, { "epoch": 0.81, "learning_rate": 3.510445471678785e-05, "loss": 2.25, "step": 65152 }, { "epoch": 0.81, "learning_rate": 3.508865344782433e-05, "loss": 2.2458, "step": 65160 }, { "epoch": 0.81, "learning_rate": 3.5072859692044426e-05, "loss": 2.2739, "step": 65168 }, { "epoch": 0.81, "learning_rate": 3.505707345103209e-05, "loss": 2.2773, "step": 65176 }, { "epoch": 0.81, "learning_rate": 3.5041294726370654e-05, "loss": 2.2545, "step": 65184 }, { "epoch": 0.81, "learning_rate": 3.502552351964263e-05, "loss": 2.2218, "step": 65192 }, { "epoch": 0.81, "learning_rate": 3.5009759832429766e-05, "loss": 2.2608, "step": 65200 }, { "epoch": 0.82, "learning_rate": 3.499400366631308e-05, "loss": 2.2645, "step": 65208 }, { "epoch": 0.82, "learning_rate": 3.4978255022872783e-05, "loss": 2.2668, "step": 65216 }, { "epoch": 0.82, "learning_rate": 3.496251390368843e-05, "loss": 2.2554, "step": 65224 }, { "epoch": 0.82, "learning_rate": 3.494678031033876e-05, "loss": 2.2669, "step": 65232 }, { "epoch": 0.82, "learning_rate": 3.493105424440174e-05, "loss": 2.2689, "step": 65240 }, { "epoch": 0.82, "learning_rate": 3.491533570745462e-05, "loss": 2.263, "step": 65248 }, { "epoch": 0.82, "learning_rate": 3.489962470107387e-05, "loss": 2.2335, "step": 65256 }, { "epoch": 0.82, "learning_rate": 3.488392122683522e-05, "loss": 2.2587, "step": 65264 }, { "epoch": 0.82, "learning_rate": 3.486822528631364e-05, "loss": 2.26, "step": 65272 }, { "epoch": 0.82, "learning_rate": 3.485253688108335e-05, "loss": 2.2398, "step": 65280 }, { "epoch": 0.82, "learning_rate": 3.483685601271779e-05, "loss": 2.2488, "step": 65288 }, { "epoch": 0.82, "learning_rate": 3.482118268278968e-05, "loss": 2.2417, "step": 65296 }, { "epoch": 0.82, "learning_rate": 3.480551689287097e-05, "loss": 2.2521, "step": 65304 }, { "epoch": 0.82, "learning_rate": 3.4789858644532823e-05, "loss": 2.2512, "step": 65312 }, { "epoch": 0.82, "learning_rate": 3.4774207939345704e-05, "loss": 2.2698, "step": 65320 }, { "epoch": 0.82, "learning_rate": 3.4758564778879244e-05, "loss": 2.2655, "step": 65328 }, { "epoch": 0.82, "learning_rate": 3.474292916470245e-05, "loss": 2.2489, "step": 65336 }, { "epoch": 0.82, "learning_rate": 3.47273010983834e-05, "loss": 2.264, "step": 65344 }, { "epoch": 0.82, "learning_rate": 3.471168058148953e-05, "loss": 2.2698, "step": 65352 }, { "epoch": 0.82, "learning_rate": 3.4696067615587494e-05, "loss": 2.2392, "step": 65360 }, { "epoch": 0.82, "learning_rate": 3.468046220224316e-05, "loss": 2.2554, "step": 65368 }, { "epoch": 0.82, "learning_rate": 3.466486434302172e-05, "loss": 2.2679, "step": 65376 }, { "epoch": 0.82, "learning_rate": 3.46492740394875e-05, "loss": 2.2286, "step": 65384 }, { "epoch": 0.82, "learning_rate": 3.463369129320411e-05, "loss": 2.2442, "step": 65392 }, { "epoch": 0.82, "learning_rate": 3.461811610573447e-05, "loss": 2.2533, "step": 65400 }, { "epoch": 0.82, "learning_rate": 3.4602548478640616e-05, "loss": 2.2518, "step": 65408 }, { "epoch": 0.82, "learning_rate": 3.4586988413483965e-05, "loss": 2.2594, "step": 65416 }, { "epoch": 0.82, "learning_rate": 3.457143591182501e-05, "loss": 2.2496, "step": 65424 }, { "epoch": 0.82, "learning_rate": 3.455589097522366e-05, "loss": 2.2656, "step": 65432 }, { "epoch": 0.82, "learning_rate": 3.454035360523897e-05, "loss": 2.2726, "step": 65440 }, { "epoch": 0.82, "learning_rate": 3.4524823803429204e-05, "loss": 2.2488, "step": 65448 }, { "epoch": 0.82, "learning_rate": 3.450930157135196e-05, "loss": 2.246, "step": 65456 }, { "epoch": 0.82, "learning_rate": 3.4493786910564017e-05, "loss": 2.2247, "step": 65464 }, { "epoch": 0.82, "learning_rate": 3.4478279822621404e-05, "loss": 2.2657, "step": 65472 }, { "epoch": 0.82, "learning_rate": 3.446278030907941e-05, "loss": 2.26, "step": 65480 }, { "epoch": 0.82, "learning_rate": 3.44472883714925e-05, "loss": 2.2608, "step": 65488 }, { "epoch": 0.82, "learning_rate": 3.4431804011414476e-05, "loss": 2.2454, "step": 65496 }, { "epoch": 0.82, "learning_rate": 3.441632723039831e-05, "loss": 2.2658, "step": 65504 }, { "epoch": 0.82, "learning_rate": 3.4400858029996265e-05, "loss": 2.2642, "step": 65512 }, { "epoch": 0.82, "learning_rate": 3.438539641175977e-05, "loss": 2.2388, "step": 65520 }, { "epoch": 0.82, "learning_rate": 3.4369942377239566e-05, "loss": 2.2422, "step": 65528 }, { "epoch": 0.82, "learning_rate": 3.4354495927985605e-05, "loss": 2.2397, "step": 65536 }, { "epoch": 0.82, "learning_rate": 3.433905706554706e-05, "loss": 2.2595, "step": 65544 }, { "epoch": 0.82, "learning_rate": 3.432362579147237e-05, "loss": 2.2565, "step": 65552 }, { "epoch": 0.82, "learning_rate": 3.430820210730922e-05, "loss": 2.2411, "step": 65560 }, { "epoch": 0.82, "learning_rate": 3.429278601460451e-05, "loss": 2.2461, "step": 65568 }, { "epoch": 0.82, "learning_rate": 3.4277377514904365e-05, "loss": 2.2609, "step": 65576 }, { "epoch": 0.82, "learning_rate": 3.426197660975419e-05, "loss": 2.2484, "step": 65584 }, { "epoch": 0.82, "learning_rate": 3.424658330069861e-05, "loss": 2.2505, "step": 65592 }, { "epoch": 0.82, "learning_rate": 3.423119758928146e-05, "loss": 2.2635, "step": 65600 }, { "epoch": 0.82, "learning_rate": 3.421581947704592e-05, "loss": 2.2438, "step": 65608 }, { "epoch": 0.82, "learning_rate": 3.420044896553423e-05, "loss": 2.2455, "step": 65616 }, { "epoch": 0.82, "learning_rate": 3.4185086056288e-05, "loss": 2.2584, "step": 65624 }, { "epoch": 0.82, "learning_rate": 3.416973075084806e-05, "loss": 2.2632, "step": 65632 }, { "epoch": 0.82, "learning_rate": 3.415438305075442e-05, "loss": 2.2379, "step": 65640 }, { "epoch": 0.82, "learning_rate": 3.413904295754644e-05, "loss": 2.2747, "step": 65648 }, { "epoch": 0.82, "learning_rate": 3.4123710472762584e-05, "loss": 2.2407, "step": 65656 }, { "epoch": 0.82, "learning_rate": 3.4108385597940594e-05, "loss": 2.2542, "step": 65664 }, { "epoch": 0.82, "learning_rate": 3.409306833461756e-05, "loss": 2.2605, "step": 65672 }, { "epoch": 0.82, "learning_rate": 3.4077758684329606e-05, "loss": 2.2492, "step": 65680 }, { "epoch": 0.82, "learning_rate": 3.406245664861231e-05, "loss": 2.2658, "step": 65688 }, { "epoch": 0.82, "learning_rate": 3.4047162229000295e-05, "loss": 2.2581, "step": 65696 }, { "epoch": 0.82, "learning_rate": 3.403187542702753e-05, "loss": 2.2244, "step": 65704 }, { "epoch": 0.82, "learning_rate": 3.401659624422722e-05, "loss": 2.2619, "step": 65712 }, { "epoch": 0.82, "learning_rate": 3.400132468213173e-05, "loss": 2.2446, "step": 65720 }, { "epoch": 0.82, "learning_rate": 3.398606074227276e-05, "loss": 2.2523, "step": 65728 }, { "epoch": 0.82, "learning_rate": 3.397080442618121e-05, "loss": 2.2301, "step": 65736 }, { "epoch": 0.82, "learning_rate": 3.395555573538712e-05, "loss": 2.2557, "step": 65744 }, { "epoch": 0.82, "learning_rate": 3.394031467141995e-05, "loss": 2.254, "step": 65752 }, { "epoch": 0.82, "learning_rate": 3.392508123580819e-05, "loss": 2.2449, "step": 65760 }, { "epoch": 0.82, "learning_rate": 3.390985543007974e-05, "loss": 2.2228, "step": 65768 }, { "epoch": 0.82, "learning_rate": 3.389463725576164e-05, "loss": 2.2688, "step": 65776 }, { "epoch": 0.82, "learning_rate": 3.387942671438018e-05, "loss": 2.2444, "step": 65784 }, { "epoch": 0.82, "learning_rate": 3.3864223807460906e-05, "loss": 2.2576, "step": 65792 }, { "epoch": 0.82, "learning_rate": 3.384902853652857e-05, "loss": 2.2607, "step": 65800 }, { "epoch": 0.82, "learning_rate": 3.383384090310718e-05, "loss": 2.2629, "step": 65808 }, { "epoch": 0.82, "learning_rate": 3.381866090871997e-05, "loss": 2.238, "step": 65816 }, { "epoch": 0.82, "learning_rate": 3.3803488554889396e-05, "loss": 2.2541, "step": 65824 }, { "epoch": 0.82, "learning_rate": 3.378832384313717e-05, "loss": 2.255, "step": 65832 }, { "epoch": 0.82, "learning_rate": 3.377316677498423e-05, "loss": 2.2358, "step": 65840 }, { "epoch": 0.82, "learning_rate": 3.375801735195072e-05, "loss": 2.2507, "step": 65848 }, { "epoch": 0.82, "learning_rate": 3.374287557555608e-05, "loss": 2.2538, "step": 65856 }, { "epoch": 0.82, "learning_rate": 3.3727741447318904e-05, "loss": 2.2484, "step": 65864 }, { "epoch": 0.82, "learning_rate": 3.3712614968757096e-05, "loss": 2.2637, "step": 65872 }, { "epoch": 0.82, "learning_rate": 3.369749614138773e-05, "loss": 2.2474, "step": 65880 }, { "epoch": 0.82, "learning_rate": 3.368238496672714e-05, "loss": 2.2615, "step": 65888 }, { "epoch": 0.82, "learning_rate": 3.366728144629088e-05, "loss": 2.2559, "step": 65896 }, { "epoch": 0.82, "learning_rate": 3.3652185581593816e-05, "loss": 2.2581, "step": 65904 }, { "epoch": 0.82, "learning_rate": 3.3637097374149905e-05, "loss": 2.2425, "step": 65912 }, { "epoch": 0.82, "learning_rate": 3.362201682547243e-05, "loss": 2.275, "step": 65920 }, { "epoch": 0.82, "learning_rate": 3.360694393707389e-05, "loss": 2.2554, "step": 65928 }, { "epoch": 0.82, "learning_rate": 3.3591878710465973e-05, "loss": 2.2453, "step": 65936 }, { "epoch": 0.82, "learning_rate": 3.357682114715972e-05, "loss": 2.2292, "step": 65944 }, { "epoch": 0.82, "learning_rate": 3.356177124866523e-05, "loss": 2.2631, "step": 65952 }, { "epoch": 0.82, "learning_rate": 3.354672901649198e-05, "loss": 2.2275, "step": 65960 }, { "epoch": 0.82, "learning_rate": 3.3531694452148606e-05, "loss": 2.2601, "step": 65968 }, { "epoch": 0.82, "learning_rate": 3.3516667557142955e-05, "loss": 2.2627, "step": 65976 }, { "epoch": 0.82, "learning_rate": 3.3501648332982213e-05, "loss": 2.2453, "step": 65984 }, { "epoch": 0.82, "learning_rate": 3.348663678117264e-05, "loss": 2.2382, "step": 65992 }, { "epoch": 0.82, "learning_rate": 3.347163290321987e-05, "loss": 2.2523, "step": 66000 }, { "epoch": 0.83, "learning_rate": 3.345663670062871e-05, "loss": 2.2535, "step": 66008 }, { "epoch": 0.83, "learning_rate": 3.3441648174903115e-05, "loss": 2.2637, "step": 66016 }, { "epoch": 0.83, "learning_rate": 3.3426667327546434e-05, "loss": 2.2445, "step": 66024 }, { "epoch": 0.83, "learning_rate": 3.3411694160061134e-05, "loss": 2.2555, "step": 66032 }, { "epoch": 0.83, "learning_rate": 3.339672867394893e-05, "loss": 2.2585, "step": 66040 }, { "epoch": 0.83, "learning_rate": 3.338177087071081e-05, "loss": 2.244, "step": 66048 }, { "epoch": 0.83, "learning_rate": 3.336682075184688e-05, "loss": 2.2268, "step": 66056 }, { "epoch": 0.83, "learning_rate": 3.335187831885662e-05, "loss": 2.2532, "step": 66064 }, { "epoch": 0.83, "learning_rate": 3.333694357323867e-05, "loss": 2.2307, "step": 66072 }, { "epoch": 0.83, "learning_rate": 3.332201651649086e-05, "loss": 2.2695, "step": 66080 }, { "epoch": 0.83, "learning_rate": 3.330709715011032e-05, "loss": 2.2407, "step": 66088 }, { "epoch": 0.83, "learning_rate": 3.329218547559337e-05, "loss": 2.2579, "step": 66096 }, { "epoch": 0.83, "learning_rate": 3.3277281494435576e-05, "loss": 2.2573, "step": 66104 }, { "epoch": 0.83, "learning_rate": 3.326238520813171e-05, "loss": 2.2455, "step": 66112 }, { "epoch": 0.83, "learning_rate": 3.324749661817578e-05, "loss": 2.2528, "step": 66120 }, { "epoch": 0.83, "learning_rate": 3.323261572606104e-05, "loss": 2.2437, "step": 66128 }, { "epoch": 0.83, "learning_rate": 3.321774253327995e-05, "loss": 2.2724, "step": 66136 }, { "epoch": 0.83, "learning_rate": 3.320287704132423e-05, "loss": 2.2582, "step": 66144 }, { "epoch": 0.83, "learning_rate": 3.318801925168477e-05, "loss": 2.2469, "step": 66152 }, { "epoch": 0.83, "learning_rate": 3.317316916585174e-05, "loss": 2.2373, "step": 66160 }, { "epoch": 0.83, "learning_rate": 3.315832678531449e-05, "loss": 2.2654, "step": 66168 }, { "epoch": 0.83, "learning_rate": 3.31434921115617e-05, "loss": 2.2523, "step": 66176 }, { "epoch": 0.83, "learning_rate": 3.312866514608115e-05, "loss": 2.2623, "step": 66184 }, { "epoch": 0.83, "learning_rate": 3.311384589035991e-05, "loss": 2.256, "step": 66192 }, { "epoch": 0.83, "learning_rate": 3.309903434588424e-05, "loss": 2.2419, "step": 66200 }, { "epoch": 0.83, "learning_rate": 3.308423051413968e-05, "loss": 2.2336, "step": 66208 }, { "epoch": 0.83, "learning_rate": 3.306943439661101e-05, "loss": 2.2455, "step": 66216 }, { "epoch": 0.83, "learning_rate": 3.305464599478214e-05, "loss": 2.2613, "step": 66224 }, { "epoch": 0.83, "learning_rate": 3.303986531013625e-05, "loss": 2.2576, "step": 66232 }, { "epoch": 0.83, "learning_rate": 3.302509234415583e-05, "loss": 2.2667, "step": 66240 }, { "epoch": 0.83, "learning_rate": 3.3010327098322445e-05, "loss": 2.2555, "step": 66248 }, { "epoch": 0.83, "learning_rate": 3.2995569574117056e-05, "loss": 2.2547, "step": 66256 }, { "epoch": 0.83, "learning_rate": 3.298081977301967e-05, "loss": 2.2374, "step": 66264 }, { "epoch": 0.83, "learning_rate": 3.296607769650965e-05, "loss": 2.2201, "step": 66272 }, { "epoch": 0.83, "learning_rate": 3.2951343346065565e-05, "loss": 2.2791, "step": 66280 }, { "epoch": 0.83, "learning_rate": 3.2936616723165115e-05, "loss": 2.247, "step": 66288 }, { "epoch": 0.83, "learning_rate": 3.292189782928536e-05, "loss": 2.2488, "step": 66296 }, { "epoch": 0.83, "learning_rate": 3.2907186665902525e-05, "loss": 2.2235, "step": 66304 }, { "epoch": 0.83, "learning_rate": 3.289248323449202e-05, "loss": 2.2651, "step": 66312 }, { "epoch": 0.83, "learning_rate": 3.287778753652855e-05, "loss": 2.2738, "step": 66320 }, { "epoch": 0.83, "learning_rate": 3.286309957348596e-05, "loss": 2.2466, "step": 66328 }, { "epoch": 0.83, "learning_rate": 3.2848419346837414e-05, "loss": 2.2497, "step": 66336 }, { "epoch": 0.83, "learning_rate": 3.283374685805524e-05, "loss": 2.2476, "step": 66344 }, { "epoch": 0.83, "learning_rate": 3.281908210861101e-05, "loss": 2.2549, "step": 66352 }, { "epoch": 0.83, "learning_rate": 3.2804425099975525e-05, "loss": 2.2299, "step": 66360 }, { "epoch": 0.83, "learning_rate": 3.278977583361877e-05, "loss": 2.2515, "step": 66368 }, { "epoch": 0.83, "learning_rate": 3.277513431101002e-05, "loss": 2.2469, "step": 66376 }, { "epoch": 0.83, "learning_rate": 3.276050053361771e-05, "loss": 2.2558, "step": 66384 }, { "epoch": 0.83, "learning_rate": 3.2745874502909526e-05, "loss": 2.2558, "step": 66392 }, { "epoch": 0.83, "learning_rate": 3.273125622035239e-05, "loss": 2.2312, "step": 66400 }, { "epoch": 0.83, "learning_rate": 3.271664568741242e-05, "loss": 2.2433, "step": 66408 }, { "epoch": 0.83, "learning_rate": 3.270204290555498e-05, "loss": 2.2262, "step": 66416 }, { "epoch": 0.83, "learning_rate": 3.268744787624465e-05, "loss": 2.2407, "step": 66424 }, { "epoch": 0.83, "learning_rate": 3.267286060094521e-05, "loss": 2.2339, "step": 66432 }, { "epoch": 0.83, "learning_rate": 3.265828108111969e-05, "loss": 2.2455, "step": 66440 }, { "epoch": 0.83, "learning_rate": 3.264370931823036e-05, "loss": 2.2514, "step": 66448 }, { "epoch": 0.83, "learning_rate": 3.262914531373864e-05, "loss": 2.2593, "step": 66456 }, { "epoch": 0.83, "learning_rate": 3.261458906910524e-05, "loss": 2.2513, "step": 66464 }, { "epoch": 0.83, "learning_rate": 3.260004058579006e-05, "loss": 2.2717, "step": 66472 }, { "epoch": 0.83, "learning_rate": 3.2585499865252225e-05, "loss": 2.2531, "step": 66480 }, { "epoch": 0.83, "learning_rate": 3.257096690895014e-05, "loss": 2.2519, "step": 66488 }, { "epoch": 0.83, "learning_rate": 3.2556441718341325e-05, "loss": 2.2317, "step": 66496 }, { "epoch": 0.83, "learning_rate": 3.2541924294882554e-05, "loss": 2.2616, "step": 66504 }, { "epoch": 0.83, "learning_rate": 3.252741464002991e-05, "loss": 2.2614, "step": 66512 }, { "epoch": 0.83, "learning_rate": 3.2512912755238555e-05, "loss": 2.2541, "step": 66520 }, { "epoch": 0.83, "learning_rate": 3.249841864196303e-05, "loss": 2.2485, "step": 66528 }, { "epoch": 0.83, "learning_rate": 3.248393230165695e-05, "loss": 2.258, "step": 66536 }, { "epoch": 0.83, "learning_rate": 3.246945373577321e-05, "loss": 2.265, "step": 66544 }, { "epoch": 0.83, "learning_rate": 3.245498294576398e-05, "loss": 2.2617, "step": 66552 }, { "epoch": 0.83, "learning_rate": 3.244051993308054e-05, "loss": 2.217, "step": 66560 }, { "epoch": 0.83, "learning_rate": 3.242606469917348e-05, "loss": 2.2494, "step": 66568 }, { "epoch": 0.83, "learning_rate": 3.241161724549259e-05, "loss": 2.2586, "step": 66576 }, { "epoch": 0.83, "learning_rate": 3.239717757348683e-05, "loss": 2.2329, "step": 66584 }, { "epoch": 0.83, "learning_rate": 3.238274568460446e-05, "loss": 2.2256, "step": 66592 }, { "epoch": 0.83, "learning_rate": 3.236832158029286e-05, "loss": 2.2528, "step": 66600 }, { "epoch": 0.83, "learning_rate": 3.235390526199874e-05, "loss": 2.2336, "step": 66608 }, { "epoch": 0.83, "learning_rate": 3.2339496731167954e-05, "loss": 2.2355, "step": 66616 }, { "epoch": 0.83, "learning_rate": 3.2325095989245604e-05, "loss": 2.2555, "step": 66624 }, { "epoch": 0.83, "learning_rate": 3.231070303767599e-05, "loss": 2.2709, "step": 66632 }, { "epoch": 0.83, "learning_rate": 3.229631787790264e-05, "loss": 2.2583, "step": 66640 }, { "epoch": 0.83, "learning_rate": 3.228194051136833e-05, "loss": 2.2511, "step": 66648 }, { "epoch": 0.83, "learning_rate": 3.226757093951501e-05, "loss": 2.2591, "step": 66656 }, { "epoch": 0.83, "learning_rate": 3.225320916378386e-05, "loss": 2.2554, "step": 66664 }, { "epoch": 0.83, "learning_rate": 3.2238855185615294e-05, "loss": 2.2696, "step": 66672 }, { "epoch": 0.83, "learning_rate": 3.222450900644894e-05, "loss": 2.2704, "step": 66680 }, { "epoch": 0.83, "learning_rate": 3.221017062772363e-05, "loss": 2.2281, "step": 66688 }, { "epoch": 0.83, "learning_rate": 3.219584005087742e-05, "loss": 2.227, "step": 66696 }, { "epoch": 0.83, "learning_rate": 3.218151727734759e-05, "loss": 2.2286, "step": 66704 }, { "epoch": 0.83, "learning_rate": 3.2167202308570645e-05, "loss": 2.2672, "step": 66712 }, { "epoch": 0.83, "learning_rate": 3.2152895145982274e-05, "loss": 2.2748, "step": 66720 }, { "epoch": 0.83, "learning_rate": 3.2138595791017416e-05, "loss": 2.2477, "step": 66728 }, { "epoch": 0.83, "learning_rate": 3.212430424511021e-05, "loss": 2.2185, "step": 66736 }, { "epoch": 0.83, "learning_rate": 3.211002050969403e-05, "loss": 2.2905, "step": 66744 }, { "epoch": 0.83, "learning_rate": 3.2095744586201435e-05, "loss": 2.2839, "step": 66752 }, { "epoch": 0.83, "learning_rate": 3.2081476476064225e-05, "loss": 2.2444, "step": 66760 }, { "epoch": 0.83, "learning_rate": 3.206721618071342e-05, "loss": 2.2445, "step": 66768 }, { "epoch": 0.83, "learning_rate": 3.205296370157922e-05, "loss": 2.2229, "step": 66776 }, { "epoch": 0.83, "learning_rate": 3.203871904009113e-05, "loss": 2.2662, "step": 66784 }, { "epoch": 0.83, "learning_rate": 3.2024482197677726e-05, "loss": 2.2498, "step": 66792 }, { "epoch": 0.83, "learning_rate": 3.2010253175766966e-05, "loss": 2.2227, "step": 66800 }, { "epoch": 0.84, "learning_rate": 3.199603197578587e-05, "loss": 2.249, "step": 66808 }, { "epoch": 0.84, "learning_rate": 3.1981818599160765e-05, "loss": 2.2586, "step": 66816 }, { "epoch": 0.84, "learning_rate": 3.19676130473172e-05, "loss": 2.2392, "step": 66824 }, { "epoch": 0.84, "learning_rate": 3.195341532167987e-05, "loss": 2.2687, "step": 66832 }, { "epoch": 0.84, "learning_rate": 3.193922542367276e-05, "loss": 2.2246, "step": 66840 }, { "epoch": 0.84, "learning_rate": 3.192504335471904e-05, "loss": 2.2723, "step": 66848 }, { "epoch": 0.84, "learning_rate": 3.191086911624104e-05, "loss": 2.261, "step": 66856 }, { "epoch": 0.84, "learning_rate": 3.1896702709660434e-05, "loss": 2.2474, "step": 66864 }, { "epoch": 0.84, "learning_rate": 3.188254413639794e-05, "loss": 2.2484, "step": 66872 }, { "epoch": 0.84, "learning_rate": 3.1868393397873644e-05, "loss": 2.2538, "step": 66880 }, { "epoch": 0.84, "learning_rate": 3.18542504955068e-05, "loss": 2.2563, "step": 66888 }, { "epoch": 0.84, "learning_rate": 3.18401154307158e-05, "loss": 2.2508, "step": 66896 }, { "epoch": 0.84, "learning_rate": 3.1825988204918355e-05, "loss": 2.2435, "step": 66904 }, { "epoch": 0.84, "learning_rate": 3.1811868819531345e-05, "loss": 2.2412, "step": 66912 }, { "epoch": 0.84, "learning_rate": 3.179775727597084e-05, "loss": 2.2502, "step": 66920 }, { "epoch": 0.84, "learning_rate": 3.178365357565219e-05, "loss": 2.2375, "step": 66928 }, { "epoch": 0.84, "learning_rate": 3.176955771998985e-05, "loss": 2.27, "step": 66936 }, { "epoch": 0.84, "learning_rate": 3.17554697103976e-05, "loss": 2.2658, "step": 66944 }, { "epoch": 0.84, "learning_rate": 3.1741389548288395e-05, "loss": 2.2309, "step": 66952 }, { "epoch": 0.84, "learning_rate": 3.1727317235074374e-05, "loss": 2.2407, "step": 66960 }, { "epoch": 0.84, "learning_rate": 3.171325277216692e-05, "loss": 2.2498, "step": 66968 }, { "epoch": 0.84, "learning_rate": 3.1699196160976605e-05, "loss": 2.2548, "step": 66976 }, { "epoch": 0.84, "learning_rate": 3.168514740291325e-05, "loss": 2.2494, "step": 66984 }, { "epoch": 0.84, "learning_rate": 3.167110649938586e-05, "loss": 2.2344, "step": 66992 }, { "epoch": 0.84, "learning_rate": 3.1657073451802636e-05, "loss": 2.271, "step": 67000 }, { "epoch": 0.84, "learning_rate": 3.164304826157102e-05, "loss": 2.2628, "step": 67008 }, { "epoch": 0.84, "learning_rate": 3.16290309300977e-05, "loss": 2.2333, "step": 67016 }, { "epoch": 0.84, "learning_rate": 3.161502145878849e-05, "loss": 2.2653, "step": 67024 }, { "epoch": 0.84, "learning_rate": 3.160101984904847e-05, "loss": 2.2383, "step": 67032 }, { "epoch": 0.84, "learning_rate": 3.158702610228193e-05, "loss": 2.2354, "step": 67040 }, { "epoch": 0.84, "learning_rate": 3.1573040219892335e-05, "loss": 2.2784, "step": 67048 }, { "epoch": 0.84, "learning_rate": 3.155906220328245e-05, "loss": 2.2363, "step": 67056 }, { "epoch": 0.84, "learning_rate": 3.154509205385415e-05, "loss": 2.2547, "step": 67064 }, { "epoch": 0.84, "learning_rate": 3.1531129773008535e-05, "loss": 2.2536, "step": 67072 }, { "epoch": 0.84, "learning_rate": 3.151717536214602e-05, "loss": 2.239, "step": 67080 }, { "epoch": 0.84, "learning_rate": 3.150322882266606e-05, "loss": 2.2725, "step": 67088 }, { "epoch": 0.84, "learning_rate": 3.1489290155967513e-05, "loss": 2.2463, "step": 67096 }, { "epoch": 0.84, "learning_rate": 3.147535936344827e-05, "loss": 2.2363, "step": 67104 }, { "epoch": 0.84, "learning_rate": 3.146143644650553e-05, "loss": 2.2504, "step": 67112 }, { "epoch": 0.84, "learning_rate": 3.1447521406535724e-05, "loss": 2.2286, "step": 67120 }, { "epoch": 0.84, "learning_rate": 3.1433614244934364e-05, "loss": 2.2464, "step": 67128 }, { "epoch": 0.84, "learning_rate": 3.141971496309635e-05, "loss": 2.236, "step": 67136 }, { "epoch": 0.84, "learning_rate": 3.140582356241567e-05, "loss": 2.2415, "step": 67144 }, { "epoch": 0.84, "learning_rate": 3.139194004428552e-05, "loss": 2.2619, "step": 67152 }, { "epoch": 0.84, "learning_rate": 3.1378064410098406e-05, "loss": 2.2692, "step": 67160 }, { "epoch": 0.84, "learning_rate": 3.136419666124589e-05, "loss": 2.2488, "step": 67168 }, { "epoch": 0.84, "learning_rate": 3.1350336799118904e-05, "loss": 2.2698, "step": 67176 }, { "epoch": 0.84, "learning_rate": 3.133648482510747e-05, "loss": 2.2305, "step": 67184 }, { "epoch": 0.84, "learning_rate": 3.1322640740600886e-05, "loss": 2.2447, "step": 67192 }, { "epoch": 0.84, "learning_rate": 3.130880454698761e-05, "loss": 2.2675, "step": 67200 }, { "epoch": 0.84, "learning_rate": 3.129497624565537e-05, "loss": 2.2594, "step": 67208 }, { "epoch": 0.84, "learning_rate": 3.1281155837991025e-05, "loss": 2.2471, "step": 67216 }, { "epoch": 0.84, "learning_rate": 3.126734332538072e-05, "loss": 2.2416, "step": 67224 }, { "epoch": 0.84, "learning_rate": 3.125353870920975e-05, "loss": 2.2586, "step": 67232 }, { "epoch": 0.84, "learning_rate": 3.123974199086264e-05, "loss": 2.2703, "step": 67240 }, { "epoch": 0.84, "learning_rate": 3.122595317172313e-05, "loss": 2.2194, "step": 67248 }, { "epoch": 0.84, "learning_rate": 3.121217225317416e-05, "loss": 2.261, "step": 67256 }, { "epoch": 0.84, "learning_rate": 3.1198399236597884e-05, "loss": 2.2569, "step": 67264 }, { "epoch": 0.84, "learning_rate": 3.118463412337564e-05, "loss": 2.2531, "step": 67272 }, { "epoch": 0.84, "learning_rate": 3.1170876914888e-05, "loss": 2.2586, "step": 67280 }, { "epoch": 0.84, "learning_rate": 3.115712761251473e-05, "loss": 2.262, "step": 67288 }, { "epoch": 0.84, "learning_rate": 3.1143386217634835e-05, "loss": 2.2306, "step": 67296 }, { "epoch": 0.84, "learning_rate": 3.112965273162646e-05, "loss": 2.2577, "step": 67304 }, { "epoch": 0.84, "learning_rate": 3.111592715586702e-05, "loss": 2.2533, "step": 67312 }, { "epoch": 0.84, "learning_rate": 3.110220949173308e-05, "loss": 2.2613, "step": 67320 }, { "epoch": 0.84, "learning_rate": 3.10884997406005e-05, "loss": 2.259, "step": 67328 }, { "epoch": 0.84, "learning_rate": 3.1074797903844255e-05, "loss": 2.2376, "step": 67336 }, { "epoch": 0.84, "learning_rate": 3.1061103982838534e-05, "loss": 2.2503, "step": 67344 }, { "epoch": 0.84, "learning_rate": 3.104741797895684e-05, "loss": 2.2349, "step": 67352 }, { "epoch": 0.84, "learning_rate": 3.10337398935717e-05, "loss": 2.2482, "step": 67360 }, { "epoch": 0.84, "learning_rate": 3.102006972805505e-05, "loss": 2.2456, "step": 67368 }, { "epoch": 0.84, "learning_rate": 3.1006407483777854e-05, "loss": 2.226, "step": 67376 }, { "epoch": 0.84, "learning_rate": 3.099275316211038e-05, "loss": 2.2482, "step": 67384 }, { "epoch": 0.84, "learning_rate": 3.097910676442211e-05, "loss": 2.2504, "step": 67392 }, { "epoch": 0.84, "learning_rate": 3.096546829208163e-05, "loss": 2.25, "step": 67400 }, { "epoch": 0.84, "learning_rate": 3.095183774645689e-05, "loss": 2.2508, "step": 67408 }, { "epoch": 0.84, "learning_rate": 3.093821512891491e-05, "loss": 2.2391, "step": 67416 }, { "epoch": 0.84, "learning_rate": 3.0924600440821925e-05, "loss": 2.2487, "step": 67424 }, { "epoch": 0.84, "learning_rate": 3.09109936835435e-05, "loss": 2.2459, "step": 67432 }, { "epoch": 0.84, "learning_rate": 3.089739485844422e-05, "loss": 2.2512, "step": 67440 }, { "epoch": 0.84, "learning_rate": 3.088380396688804e-05, "loss": 2.2524, "step": 67448 }, { "epoch": 0.84, "learning_rate": 3.0870221010238045e-05, "loss": 2.2506, "step": 67456 }, { "epoch": 0.84, "learning_rate": 3.0856645989856467e-05, "loss": 2.2434, "step": 67464 }, { "epoch": 0.84, "learning_rate": 3.0843078907104865e-05, "loss": 2.2879, "step": 67472 }, { "epoch": 0.84, "learning_rate": 3.0829519763343916e-05, "loss": 2.2371, "step": 67480 }, { "epoch": 0.84, "learning_rate": 3.081596855993354e-05, "loss": 2.234, "step": 67488 }, { "epoch": 0.84, "learning_rate": 3.080242529823283e-05, "loss": 2.2686, "step": 67496 }, { "epoch": 0.84, "learning_rate": 3.07888899796001e-05, "loss": 2.2543, "step": 67504 }, { "epoch": 0.84, "learning_rate": 3.077536260539287e-05, "loss": 2.2563, "step": 67512 }, { "epoch": 0.84, "learning_rate": 3.076184317696786e-05, "loss": 2.2502, "step": 67520 }, { "epoch": 0.84, "learning_rate": 3.0748331695681004e-05, "loss": 2.2457, "step": 67528 }, { "epoch": 0.84, "learning_rate": 3.0734828162887396e-05, "loss": 2.2475, "step": 67536 }, { "epoch": 0.84, "learning_rate": 3.07213325799414e-05, "loss": 2.2522, "step": 67544 }, { "epoch": 0.84, "learning_rate": 3.070784494819651e-05, "loss": 2.2518, "step": 67552 }, { "epoch": 0.84, "learning_rate": 3.069436526900549e-05, "loss": 2.2386, "step": 67560 }, { "epoch": 0.84, "learning_rate": 3.068089354372026e-05, "loss": 2.2469, "step": 67568 }, { "epoch": 0.84, "learning_rate": 3.0667429773691966e-05, "loss": 2.2568, "step": 67576 }, { "epoch": 0.84, "learning_rate": 3.065397396027093e-05, "loss": 2.2659, "step": 67584 }, { "epoch": 0.84, "learning_rate": 3.0640526104806724e-05, "loss": 2.2448, "step": 67592 }, { "epoch": 0.84, "learning_rate": 3.062708620864806e-05, "loss": 2.224, "step": 67600 }, { "epoch": 0.85, "learning_rate": 3.06136542731429e-05, "loss": 2.2597, "step": 67608 }, { "epoch": 0.85, "learning_rate": 3.0600230299638374e-05, "loss": 2.2474, "step": 67616 }, { "epoch": 0.85, "learning_rate": 3.058681428948088e-05, "loss": 2.2282, "step": 67624 }, { "epoch": 0.85, "learning_rate": 3.057340624401591e-05, "loss": 2.2672, "step": 67632 }, { "epoch": 0.85, "learning_rate": 3.056000616458825e-05, "loss": 2.2257, "step": 67640 }, { "epoch": 0.85, "learning_rate": 3.054661405254182e-05, "loss": 2.25, "step": 67648 }, { "epoch": 0.85, "learning_rate": 3.0533229909219796e-05, "loss": 2.2532, "step": 67656 }, { "epoch": 0.85, "learning_rate": 3.0519853735964556e-05, "loss": 2.2584, "step": 67664 }, { "epoch": 0.85, "learning_rate": 3.0506485534117586e-05, "loss": 2.2387, "step": 67672 }, { "epoch": 0.85, "learning_rate": 3.0493125305019698e-05, "loss": 2.2381, "step": 67680 }, { "epoch": 0.85, "learning_rate": 3.0479773050010863e-05, "loss": 2.2468, "step": 67688 }, { "epoch": 0.85, "learning_rate": 3.0466428770430154e-05, "loss": 2.244, "step": 67696 }, { "epoch": 0.85, "learning_rate": 3.0453092467616024e-05, "loss": 2.26, "step": 67704 }, { "epoch": 0.85, "learning_rate": 3.0439764142905935e-05, "loss": 2.2349, "step": 67712 }, { "epoch": 0.85, "learning_rate": 3.042644379763672e-05, "loss": 2.2544, "step": 67720 }, { "epoch": 0.85, "learning_rate": 3.0413131433144314e-05, "loss": 2.2526, "step": 67728 }, { "epoch": 0.85, "learning_rate": 3.039982705076383e-05, "loss": 2.2455, "step": 67736 }, { "epoch": 0.85, "learning_rate": 3.0386530651829664e-05, "loss": 2.2511, "step": 67744 }, { "epoch": 0.85, "learning_rate": 3.037324223767536e-05, "loss": 2.2395, "step": 67752 }, { "epoch": 0.85, "learning_rate": 3.035996180963368e-05, "loss": 2.2336, "step": 67760 }, { "epoch": 0.85, "learning_rate": 3.0346689369036573e-05, "loss": 2.2904, "step": 67768 }, { "epoch": 0.85, "learning_rate": 3.033342491721515e-05, "loss": 2.2546, "step": 67776 }, { "epoch": 0.85, "learning_rate": 3.0320168455499805e-05, "loss": 2.2334, "step": 67784 }, { "epoch": 0.85, "learning_rate": 3.030691998522008e-05, "loss": 2.2363, "step": 67792 }, { "epoch": 0.85, "learning_rate": 3.0293679507704715e-05, "loss": 2.2421, "step": 67800 }, { "epoch": 0.85, "learning_rate": 3.0280447024281644e-05, "loss": 2.2608, "step": 67808 }, { "epoch": 0.85, "learning_rate": 3.0267222536278034e-05, "loss": 2.2559, "step": 67816 }, { "epoch": 0.85, "learning_rate": 3.02540060450202e-05, "loss": 2.2584, "step": 67824 }, { "epoch": 0.85, "learning_rate": 3.0240797551833704e-05, "loss": 2.26, "step": 67832 }, { "epoch": 0.85, "learning_rate": 3.0227597058043272e-05, "loss": 2.2339, "step": 67840 }, { "epoch": 0.85, "learning_rate": 3.0214404564972813e-05, "loss": 2.259, "step": 67848 }, { "epoch": 0.85, "learning_rate": 3.0201220073945535e-05, "loss": 2.2416, "step": 67856 }, { "epoch": 0.85, "learning_rate": 3.018804358628368e-05, "loss": 2.2531, "step": 67864 }, { "epoch": 0.85, "learning_rate": 3.0174875103308837e-05, "loss": 2.2414, "step": 67872 }, { "epoch": 0.85, "learning_rate": 3.0161714626341696e-05, "loss": 2.2552, "step": 67880 }, { "epoch": 0.85, "learning_rate": 3.0148562156702163e-05, "loss": 2.2273, "step": 67888 }, { "epoch": 0.85, "learning_rate": 3.0135417695709433e-05, "loss": 2.2479, "step": 67896 }, { "epoch": 0.85, "learning_rate": 3.012228124468175e-05, "loss": 2.256, "step": 67904 }, { "epoch": 0.85, "learning_rate": 3.0109152804936624e-05, "loss": 2.2643, "step": 67912 }, { "epoch": 0.85, "learning_rate": 3.009603237779083e-05, "loss": 2.2358, "step": 67920 }, { "epoch": 0.85, "learning_rate": 3.0082919964560173e-05, "loss": 2.2535, "step": 67928 }, { "epoch": 0.85, "learning_rate": 3.0069815566559866e-05, "loss": 2.2345, "step": 67936 }, { "epoch": 0.85, "learning_rate": 3.0056719185104114e-05, "loss": 2.2498, "step": 67944 }, { "epoch": 0.85, "learning_rate": 3.004363082150644e-05, "loss": 2.2664, "step": 67952 }, { "epoch": 0.85, "learning_rate": 3.0030550477079568e-05, "loss": 2.2182, "step": 67960 }, { "epoch": 0.85, "learning_rate": 3.00174781531353e-05, "loss": 2.2253, "step": 67968 }, { "epoch": 0.85, "learning_rate": 3.0004413850984802e-05, "loss": 2.2422, "step": 67976 }, { "epoch": 0.85, "learning_rate": 2.9991357571938328e-05, "loss": 2.2167, "step": 67984 }, { "epoch": 0.85, "learning_rate": 2.9978309317305303e-05, "loss": 2.2355, "step": 67992 }, { "epoch": 0.85, "learning_rate": 2.9965269088394455e-05, "loss": 2.2652, "step": 68000 }, { "epoch": 0.85, "learning_rate": 2.9952236886513586e-05, "loss": 2.2358, "step": 68008 }, { "epoch": 0.85, "learning_rate": 2.9939212712969793e-05, "loss": 2.2619, "step": 68016 }, { "epoch": 0.85, "learning_rate": 2.9926196569069325e-05, "loss": 2.2639, "step": 68024 }, { "epoch": 0.85, "learning_rate": 2.9913188456117607e-05, "loss": 2.2468, "step": 68032 }, { "epoch": 0.85, "learning_rate": 2.9900188375419296e-05, "loss": 2.233, "step": 68040 }, { "epoch": 0.85, "learning_rate": 2.9887196328278223e-05, "loss": 2.2416, "step": 68048 }, { "epoch": 0.85, "learning_rate": 2.9874212315997414e-05, "loss": 2.2612, "step": 68056 }, { "epoch": 0.85, "learning_rate": 2.9861236339879085e-05, "loss": 2.2507, "step": 68064 }, { "epoch": 0.85, "learning_rate": 2.9848268401224666e-05, "loss": 2.2446, "step": 68072 }, { "epoch": 0.85, "learning_rate": 2.9835308501334753e-05, "loss": 2.2554, "step": 68080 }, { "epoch": 0.85, "learning_rate": 2.9822356641509165e-05, "loss": 2.2703, "step": 68088 }, { "epoch": 0.85, "learning_rate": 2.98094128230469e-05, "loss": 2.2513, "step": 68096 }, { "epoch": 0.85, "learning_rate": 2.9796477047246135e-05, "loss": 2.2228, "step": 68104 }, { "epoch": 0.85, "learning_rate": 2.978354931540427e-05, "loss": 2.2552, "step": 68112 }, { "epoch": 0.85, "learning_rate": 2.9770629628817868e-05, "loss": 2.2525, "step": 68120 }, { "epoch": 0.85, "learning_rate": 2.9757717988782723e-05, "loss": 2.2336, "step": 68128 }, { "epoch": 0.85, "learning_rate": 2.9744814396593777e-05, "loss": 2.2668, "step": 68136 }, { "epoch": 0.85, "learning_rate": 2.9731918853545206e-05, "loss": 2.2461, "step": 68144 }, { "epoch": 0.85, "learning_rate": 2.9719031360930337e-05, "loss": 2.2479, "step": 68152 }, { "epoch": 0.85, "learning_rate": 2.9706151920041735e-05, "loss": 2.2499, "step": 68160 }, { "epoch": 0.85, "learning_rate": 2.969328053217112e-05, "loss": 2.2617, "step": 68168 }, { "epoch": 0.85, "learning_rate": 2.9680417198609417e-05, "loss": 2.2192, "step": 68176 }, { "epoch": 0.85, "learning_rate": 2.9667561920646748e-05, "loss": 2.267, "step": 68184 }, { "epoch": 0.85, "learning_rate": 2.965471469957246e-05, "loss": 2.2546, "step": 68192 }, { "epoch": 0.85, "learning_rate": 2.9641875536674996e-05, "loss": 2.2279, "step": 68200 }, { "epoch": 0.85, "learning_rate": 2.962904443324211e-05, "loss": 2.2424, "step": 68208 }, { "epoch": 0.85, "learning_rate": 2.9616221390560645e-05, "loss": 2.2197, "step": 68216 }, { "epoch": 0.85, "learning_rate": 2.9603406409916684e-05, "loss": 2.2274, "step": 68224 }, { "epoch": 0.85, "learning_rate": 2.9590599492595532e-05, "loss": 2.2605, "step": 68232 }, { "epoch": 0.85, "learning_rate": 2.9577800639881597e-05, "loss": 2.2386, "step": 68240 }, { "epoch": 0.85, "learning_rate": 2.9565009853058574e-05, "loss": 2.2233, "step": 68248 }, { "epoch": 0.85, "learning_rate": 2.955222713340932e-05, "loss": 2.2557, "step": 68256 }, { "epoch": 0.85, "learning_rate": 2.9539452482215802e-05, "loss": 2.2606, "step": 68264 }, { "epoch": 0.85, "learning_rate": 2.952668590075932e-05, "loss": 2.2267, "step": 68272 }, { "epoch": 0.85, "learning_rate": 2.951392739032021e-05, "loss": 2.2501, "step": 68280 }, { "epoch": 0.85, "learning_rate": 2.9501176952178155e-05, "loss": 2.2334, "step": 68288 }, { "epoch": 0.85, "learning_rate": 2.9488434587611936e-05, "loss": 2.2446, "step": 68296 }, { "epoch": 0.85, "learning_rate": 2.9475700297899485e-05, "loss": 2.2251, "step": 68304 }, { "epoch": 0.85, "learning_rate": 2.9462974084318035e-05, "loss": 2.2391, "step": 68312 }, { "epoch": 0.85, "learning_rate": 2.945025594814394e-05, "loss": 2.2621, "step": 68320 }, { "epoch": 0.85, "learning_rate": 2.9437545890652746e-05, "loss": 2.2282, "step": 68328 }, { "epoch": 0.85, "learning_rate": 2.9424843913119238e-05, "loss": 2.2689, "step": 68336 }, { "epoch": 0.85, "learning_rate": 2.941215001681728e-05, "loss": 2.2365, "step": 68344 }, { "epoch": 0.85, "learning_rate": 2.939946420302005e-05, "loss": 2.2343, "step": 68352 }, { "epoch": 0.85, "learning_rate": 2.9386786472999867e-05, "loss": 2.2386, "step": 68360 }, { "epoch": 0.85, "learning_rate": 2.9374116828028202e-05, "loss": 2.2578, "step": 68368 }, { "epoch": 0.85, "learning_rate": 2.9361455269375786e-05, "loss": 2.254, "step": 68376 }, { "epoch": 0.85, "learning_rate": 2.9348801798312475e-05, "loss": 2.2579, "step": 68384 }, { "epoch": 0.85, "learning_rate": 2.9336156416107353e-05, "loss": 2.2638, "step": 68392 }, { "epoch": 0.85, "learning_rate": 2.9323519124028676e-05, "loss": 2.2563, "step": 68400 }, { "epoch": 0.86, "learning_rate": 2.931088992334388e-05, "loss": 2.2296, "step": 68408 }, { "epoch": 0.86, "learning_rate": 2.929826881531963e-05, "loss": 2.2448, "step": 68416 }, { "epoch": 0.86, "learning_rate": 2.928565580122173e-05, "loss": 2.2711, "step": 68424 }, { "epoch": 0.86, "learning_rate": 2.92730508823152e-05, "loss": 2.2415, "step": 68432 }, { "epoch": 0.86, "learning_rate": 2.9260454059864246e-05, "loss": 2.2437, "step": 68440 }, { "epoch": 0.86, "learning_rate": 2.924786533513225e-05, "loss": 2.2541, "step": 68448 }, { "epoch": 0.86, "learning_rate": 2.9235284709381773e-05, "loss": 2.2438, "step": 68456 }, { "epoch": 0.86, "learning_rate": 2.922271218387464e-05, "loss": 2.2524, "step": 68464 }, { "epoch": 0.86, "learning_rate": 2.9210147759871755e-05, "loss": 2.2331, "step": 68472 }, { "epoch": 0.86, "learning_rate": 2.919759143863326e-05, "loss": 2.2392, "step": 68480 }, { "epoch": 0.86, "learning_rate": 2.9185043221418495e-05, "loss": 2.236, "step": 68488 }, { "epoch": 0.86, "learning_rate": 2.917250310948596e-05, "loss": 2.2359, "step": 68496 }, { "epoch": 0.86, "learning_rate": 2.9159971104093403e-05, "loss": 2.2461, "step": 68504 }, { "epoch": 0.86, "learning_rate": 2.9147447206497657e-05, "loss": 2.2473, "step": 68512 }, { "epoch": 0.86, "learning_rate": 2.9134931417954804e-05, "loss": 2.2482, "step": 68520 }, { "epoch": 0.86, "learning_rate": 2.912242373972016e-05, "loss": 2.2413, "step": 68528 }, { "epoch": 0.86, "learning_rate": 2.9109924173048102e-05, "loss": 2.2653, "step": 68536 }, { "epoch": 0.86, "learning_rate": 2.9097432719192336e-05, "loss": 2.2558, "step": 68544 }, { "epoch": 0.86, "learning_rate": 2.9084949379405614e-05, "loss": 2.2246, "step": 68552 }, { "epoch": 0.86, "learning_rate": 2.9072474154939994e-05, "loss": 2.2421, "step": 68560 }, { "epoch": 0.86, "learning_rate": 2.906000704704668e-05, "loss": 2.2576, "step": 68568 }, { "epoch": 0.86, "learning_rate": 2.904754805697598e-05, "loss": 2.2211, "step": 68576 }, { "epoch": 0.86, "learning_rate": 2.9035097185977533e-05, "loss": 2.2582, "step": 68584 }, { "epoch": 0.86, "learning_rate": 2.9022654435300067e-05, "loss": 2.2431, "step": 68592 }, { "epoch": 0.86, "learning_rate": 2.9010219806191523e-05, "loss": 2.243, "step": 68600 }, { "epoch": 0.86, "learning_rate": 2.8997793299899035e-05, "loss": 2.2516, "step": 68608 }, { "epoch": 0.86, "learning_rate": 2.8985374917668852e-05, "loss": 2.2395, "step": 68616 }, { "epoch": 0.86, "learning_rate": 2.8972964660746533e-05, "loss": 2.2494, "step": 68624 }, { "epoch": 0.86, "learning_rate": 2.896056253037673e-05, "loss": 2.2506, "step": 68632 }, { "epoch": 0.86, "learning_rate": 2.894816852780331e-05, "loss": 2.2253, "step": 68640 }, { "epoch": 0.86, "learning_rate": 2.893578265426933e-05, "loss": 2.2683, "step": 68648 }, { "epoch": 0.86, "learning_rate": 2.892340491101701e-05, "loss": 2.2526, "step": 68656 }, { "epoch": 0.86, "learning_rate": 2.891103529928778e-05, "loss": 2.256, "step": 68664 }, { "epoch": 0.86, "learning_rate": 2.889867382032222e-05, "loss": 2.2201, "step": 68672 }, { "epoch": 0.86, "learning_rate": 2.888632047536014e-05, "loss": 2.2721, "step": 68680 }, { "epoch": 0.86, "learning_rate": 2.8873975265640496e-05, "loss": 2.2602, "step": 68688 }, { "epoch": 0.86, "learning_rate": 2.8861638192401446e-05, "loss": 2.2409, "step": 68696 }, { "epoch": 0.86, "learning_rate": 2.8849309256880336e-05, "loss": 2.2454, "step": 68704 }, { "epoch": 0.86, "learning_rate": 2.8836988460313674e-05, "loss": 2.2517, "step": 68712 }, { "epoch": 0.86, "learning_rate": 2.882467580393719e-05, "loss": 2.2412, "step": 68720 }, { "epoch": 0.86, "learning_rate": 2.8812371288985723e-05, "loss": 2.2379, "step": 68728 }, { "epoch": 0.86, "learning_rate": 2.8800074916693433e-05, "loss": 2.2637, "step": 68736 }, { "epoch": 0.86, "learning_rate": 2.8787786688293495e-05, "loss": 2.2438, "step": 68744 }, { "epoch": 0.86, "learning_rate": 2.877550660501836e-05, "loss": 2.2476, "step": 68752 }, { "epoch": 0.86, "learning_rate": 2.876323466809971e-05, "loss": 2.2562, "step": 68760 }, { "epoch": 0.86, "learning_rate": 2.8750970878768274e-05, "loss": 2.2407, "step": 68768 }, { "epoch": 0.86, "learning_rate": 2.8738715238254106e-05, "loss": 2.254, "step": 68776 }, { "epoch": 0.86, "learning_rate": 2.872646774778634e-05, "loss": 2.2541, "step": 68784 }, { "epoch": 0.86, "learning_rate": 2.8714228408593312e-05, "loss": 2.2586, "step": 68792 }, { "epoch": 0.86, "learning_rate": 2.8701997221902628e-05, "loss": 2.2567, "step": 68800 }, { "epoch": 0.86, "learning_rate": 2.8689774188940914e-05, "loss": 2.2603, "step": 68808 }, { "epoch": 0.86, "learning_rate": 2.867755931093415e-05, "loss": 2.2403, "step": 68816 }, { "epoch": 0.86, "learning_rate": 2.8665352589107397e-05, "loss": 2.2362, "step": 68824 }, { "epoch": 0.86, "learning_rate": 2.865315402468488e-05, "loss": 2.2518, "step": 68832 }, { "epoch": 0.86, "learning_rate": 2.864096361889012e-05, "loss": 2.2633, "step": 68840 }, { "epoch": 0.86, "learning_rate": 2.8628781372945656e-05, "loss": 2.2291, "step": 68848 }, { "epoch": 0.86, "learning_rate": 2.861660728807337e-05, "loss": 2.2435, "step": 68856 }, { "epoch": 0.86, "learning_rate": 2.860444136549425e-05, "loss": 2.2648, "step": 68864 }, { "epoch": 0.86, "learning_rate": 2.8592283606428405e-05, "loss": 2.2367, "step": 68872 }, { "epoch": 0.86, "learning_rate": 2.8580134012095262e-05, "loss": 2.2402, "step": 68880 }, { "epoch": 0.86, "learning_rate": 2.8567992583713314e-05, "loss": 2.2539, "step": 68888 }, { "epoch": 0.86, "learning_rate": 2.85558593225003e-05, "loss": 2.2376, "step": 68896 }, { "epoch": 0.86, "learning_rate": 2.85437342296731e-05, "loss": 2.2521, "step": 68904 }, { "epoch": 0.86, "learning_rate": 2.8531617306447806e-05, "loss": 2.2481, "step": 68912 }, { "epoch": 0.86, "learning_rate": 2.8519508554039665e-05, "loss": 2.2253, "step": 68920 }, { "epoch": 0.86, "learning_rate": 2.850740797366313e-05, "loss": 2.2525, "step": 68928 }, { "epoch": 0.86, "learning_rate": 2.8495315566531816e-05, "loss": 2.2203, "step": 68936 }, { "epoch": 0.86, "learning_rate": 2.848323133385851e-05, "loss": 2.233, "step": 68944 }, { "epoch": 0.86, "learning_rate": 2.8471155276855205e-05, "loss": 2.2382, "step": 68952 }, { "epoch": 0.86, "learning_rate": 2.8459087396733052e-05, "loss": 2.244, "step": 68960 }, { "epoch": 0.86, "learning_rate": 2.8447027694702404e-05, "loss": 2.2551, "step": 68968 }, { "epoch": 0.86, "learning_rate": 2.8434976171972776e-05, "loss": 2.2337, "step": 68976 }, { "epoch": 0.86, "learning_rate": 2.842293282975286e-05, "loss": 2.2619, "step": 68984 }, { "epoch": 0.86, "learning_rate": 2.8410897669250548e-05, "loss": 2.2249, "step": 68992 }, { "epoch": 0.86, "learning_rate": 2.8398870691672873e-05, "loss": 2.2537, "step": 69000 }, { "epoch": 0.86, "learning_rate": 2.8386851898226108e-05, "loss": 2.2287, "step": 69008 }, { "epoch": 0.86, "learning_rate": 2.837484129011564e-05, "loss": 2.2336, "step": 69016 }, { "epoch": 0.86, "learning_rate": 2.8362838868546066e-05, "loss": 2.2558, "step": 69024 }, { "epoch": 0.86, "learning_rate": 2.83508446347212e-05, "loss": 2.2727, "step": 69032 }, { "epoch": 0.86, "learning_rate": 2.8338858589843965e-05, "loss": 2.2575, "step": 69040 }, { "epoch": 0.86, "learning_rate": 2.832688073511648e-05, "loss": 2.2432, "step": 69048 }, { "epoch": 0.86, "learning_rate": 2.8314911071740074e-05, "loss": 2.2761, "step": 69056 }, { "epoch": 0.86, "learning_rate": 2.8302949600915223e-05, "loss": 2.2327, "step": 69064 }, { "epoch": 0.86, "learning_rate": 2.8290996323841634e-05, "loss": 2.2703, "step": 69072 }, { "epoch": 0.86, "learning_rate": 2.82790512417181e-05, "loss": 2.2523, "step": 69080 }, { "epoch": 0.86, "learning_rate": 2.826711435574268e-05, "loss": 2.2392, "step": 69088 }, { "epoch": 0.86, "learning_rate": 2.8255185667112594e-05, "loss": 2.2437, "step": 69096 }, { "epoch": 0.86, "learning_rate": 2.824326517702415e-05, "loss": 2.2344, "step": 69104 }, { "epoch": 0.86, "learning_rate": 2.823135288667298e-05, "loss": 2.2321, "step": 69112 }, { "epoch": 0.86, "learning_rate": 2.821944879725376e-05, "loss": 2.2482, "step": 69120 }, { "epoch": 0.86, "learning_rate": 2.820755290996045e-05, "loss": 2.245, "step": 69128 }, { "epoch": 0.86, "learning_rate": 2.819566522598613e-05, "loss": 2.2393, "step": 69136 }, { "epoch": 0.86, "learning_rate": 2.8183785746523027e-05, "loss": 2.2322, "step": 69144 }, { "epoch": 0.86, "learning_rate": 2.817191447276265e-05, "loss": 2.2385, "step": 69152 }, { "epoch": 0.86, "learning_rate": 2.816005140589557e-05, "loss": 2.2588, "step": 69160 }, { "epoch": 0.86, "learning_rate": 2.814819654711161e-05, "loss": 2.248, "step": 69168 }, { "epoch": 0.86, "learning_rate": 2.813634989759976e-05, "loss": 2.2468, "step": 69176 }, { "epoch": 0.86, "learning_rate": 2.8124511458548108e-05, "loss": 2.2611, "step": 69184 }, { "epoch": 0.86, "learning_rate": 2.8112681231144043e-05, "loss": 2.2353, "step": 69192 }, { "epoch": 0.86, "learning_rate": 2.810085921657406e-05, "loss": 2.229, "step": 69200 }, { "epoch": 0.87, "learning_rate": 2.8089045416023818e-05, "loss": 2.2605, "step": 69208 }, { "epoch": 0.87, "learning_rate": 2.8077239830678197e-05, "loss": 2.2413, "step": 69216 }, { "epoch": 0.87, "learning_rate": 2.8065442461721226e-05, "loss": 2.2428, "step": 69224 }, { "epoch": 0.87, "learning_rate": 2.805365331033609e-05, "loss": 2.2346, "step": 69232 }, { "epoch": 0.87, "learning_rate": 2.804187237770521e-05, "loss": 2.2485, "step": 69240 }, { "epoch": 0.87, "learning_rate": 2.8030099665010122e-05, "loss": 2.2453, "step": 69248 }, { "epoch": 0.87, "learning_rate": 2.801833517343158e-05, "loss": 2.2248, "step": 69256 }, { "epoch": 0.87, "learning_rate": 2.8006578904149484e-05, "loss": 2.2478, "step": 69264 }, { "epoch": 0.87, "learning_rate": 2.7994830858342914e-05, "loss": 2.2438, "step": 69272 }, { "epoch": 0.87, "learning_rate": 2.7983091037190152e-05, "loss": 2.2694, "step": 69280 }, { "epoch": 0.87, "learning_rate": 2.797135944186862e-05, "loss": 2.2484, "step": 69288 }, { "epoch": 0.87, "learning_rate": 2.7959636073554922e-05, "loss": 2.2387, "step": 69296 }, { "epoch": 0.87, "learning_rate": 2.7947920933424885e-05, "loss": 2.2504, "step": 69304 }, { "epoch": 0.87, "learning_rate": 2.7936214022653446e-05, "loss": 2.2324, "step": 69312 }, { "epoch": 0.87, "learning_rate": 2.7924515342414727e-05, "loss": 2.2343, "step": 69320 }, { "epoch": 0.87, "learning_rate": 2.7912824893882062e-05, "loss": 2.26, "step": 69328 }, { "epoch": 0.87, "learning_rate": 2.7901142678227908e-05, "loss": 2.2506, "step": 69336 }, { "epoch": 0.87, "learning_rate": 2.7889468696623976e-05, "loss": 2.2456, "step": 69344 }, { "epoch": 0.87, "learning_rate": 2.7877802950241054e-05, "loss": 2.2553, "step": 69352 }, { "epoch": 0.87, "learning_rate": 2.7866145440249146e-05, "loss": 2.2607, "step": 69360 }, { "epoch": 0.87, "learning_rate": 2.78544961678175e-05, "loss": 2.258, "step": 69368 }, { "epoch": 0.87, "learning_rate": 2.7842855134114387e-05, "loss": 2.2442, "step": 69376 }, { "epoch": 0.87, "learning_rate": 2.7831222340307412e-05, "loss": 2.2306, "step": 69384 }, { "epoch": 0.87, "learning_rate": 2.7819597787563217e-05, "loss": 2.2399, "step": 69392 }, { "epoch": 0.87, "learning_rate": 2.7807981477047696e-05, "loss": 2.227, "step": 69400 }, { "epoch": 0.87, "learning_rate": 2.7796373409925935e-05, "loss": 2.2312, "step": 69408 }, { "epoch": 0.87, "learning_rate": 2.7784773587362097e-05, "loss": 2.2609, "step": 69416 }, { "epoch": 0.87, "learning_rate": 2.7773182010519632e-05, "loss": 2.2126, "step": 69424 }, { "epoch": 0.87, "learning_rate": 2.7761598680561086e-05, "loss": 2.2677, "step": 69432 }, { "epoch": 0.87, "learning_rate": 2.77500235986482e-05, "loss": 2.2418, "step": 69440 }, { "epoch": 0.87, "learning_rate": 2.7738456765941918e-05, "loss": 2.2484, "step": 69448 }, { "epoch": 0.87, "learning_rate": 2.7726898183602264e-05, "loss": 2.2539, "step": 69456 }, { "epoch": 0.87, "learning_rate": 2.7715347852788547e-05, "loss": 2.2307, "step": 69464 }, { "epoch": 0.87, "learning_rate": 2.7703805774659204e-05, "loss": 2.2262, "step": 69472 }, { "epoch": 0.87, "learning_rate": 2.7692271950371817e-05, "loss": 2.2384, "step": 69480 }, { "epoch": 0.87, "learning_rate": 2.768074638108318e-05, "loss": 2.2409, "step": 69488 }, { "epoch": 0.87, "learning_rate": 2.7669229067949222e-05, "loss": 2.2278, "step": 69496 }, { "epoch": 0.87, "learning_rate": 2.765772001212509e-05, "loss": 2.258, "step": 69504 }, { "epoch": 0.87, "learning_rate": 2.7646219214765056e-05, "loss": 2.2603, "step": 69512 }, { "epoch": 0.87, "learning_rate": 2.7634726677022592e-05, "loss": 2.2429, "step": 69520 }, { "epoch": 0.87, "learning_rate": 2.7623242400050335e-05, "loss": 2.244, "step": 69528 }, { "epoch": 0.87, "learning_rate": 2.7611766385000092e-05, "loss": 2.2346, "step": 69536 }, { "epoch": 0.87, "learning_rate": 2.760029863302284e-05, "loss": 2.2324, "step": 69544 }, { "epoch": 0.87, "learning_rate": 2.758883914526875e-05, "loss": 2.2654, "step": 69552 }, { "epoch": 0.87, "learning_rate": 2.7577387922887105e-05, "loss": 2.2516, "step": 69560 }, { "epoch": 0.87, "learning_rate": 2.756594496702643e-05, "loss": 2.2474, "step": 69568 }, { "epoch": 0.87, "learning_rate": 2.755451027883438e-05, "loss": 2.234, "step": 69576 }, { "epoch": 0.87, "learning_rate": 2.7543083859457773e-05, "loss": 2.2472, "step": 69584 }, { "epoch": 0.87, "learning_rate": 2.753166571004263e-05, "loss": 2.2352, "step": 69592 }, { "epoch": 0.87, "learning_rate": 2.752025583173414e-05, "loss": 2.2379, "step": 69600 }, { "epoch": 0.87, "learning_rate": 2.7508854225676622e-05, "loss": 2.2512, "step": 69608 }, { "epoch": 0.87, "learning_rate": 2.7497460893013622e-05, "loss": 2.2183, "step": 69616 }, { "epoch": 0.87, "learning_rate": 2.748607583488779e-05, "loss": 2.2475, "step": 69624 }, { "epoch": 0.87, "learning_rate": 2.7474699052441e-05, "loss": 2.2596, "step": 69632 }, { "epoch": 0.87, "learning_rate": 2.7463330546814303e-05, "loss": 2.258, "step": 69640 }, { "epoch": 0.87, "learning_rate": 2.7451970319147847e-05, "loss": 2.23, "step": 69648 }, { "epoch": 0.87, "learning_rate": 2.7440618370581043e-05, "loss": 2.2531, "step": 69656 }, { "epoch": 0.87, "learning_rate": 2.7429274702252415e-05, "loss": 2.2537, "step": 69664 }, { "epoch": 0.87, "learning_rate": 2.7417939315299646e-05, "loss": 2.2326, "step": 69672 }, { "epoch": 0.87, "learning_rate": 2.740661221085965e-05, "loss": 2.2372, "step": 69680 }, { "epoch": 0.87, "learning_rate": 2.7395293390068416e-05, "loss": 2.2364, "step": 69688 }, { "epoch": 0.87, "learning_rate": 2.7383982854061208e-05, "loss": 2.2454, "step": 69696 }, { "epoch": 0.87, "learning_rate": 2.7372680603972406e-05, "loss": 2.2332, "step": 69704 }, { "epoch": 0.87, "learning_rate": 2.736138664093552e-05, "loss": 2.2303, "step": 69712 }, { "epoch": 0.87, "learning_rate": 2.7350100966083307e-05, "loss": 2.2418, "step": 69720 }, { "epoch": 0.87, "learning_rate": 2.7338823580547657e-05, "loss": 2.2383, "step": 69728 }, { "epoch": 0.87, "learning_rate": 2.732755448545961e-05, "loss": 2.2502, "step": 69736 }, { "epoch": 0.87, "learning_rate": 2.7316293681949416e-05, "loss": 2.2296, "step": 69744 }, { "epoch": 0.87, "learning_rate": 2.7305041171146428e-05, "loss": 2.2378, "step": 69752 }, { "epoch": 0.87, "learning_rate": 2.7293796954179253e-05, "loss": 2.2512, "step": 69760 }, { "epoch": 0.87, "learning_rate": 2.7282561032175592e-05, "loss": 2.2472, "step": 69768 }, { "epoch": 0.87, "learning_rate": 2.7271333406262363e-05, "loss": 2.2466, "step": 69776 }, { "epoch": 0.87, "learning_rate": 2.7260114077565624e-05, "loss": 2.2453, "step": 69784 }, { "epoch": 0.87, "learning_rate": 2.7248903047210622e-05, "loss": 2.2563, "step": 69792 }, { "epoch": 0.87, "learning_rate": 2.7237700316321745e-05, "loss": 2.232, "step": 69800 }, { "epoch": 0.87, "learning_rate": 2.7226505886022573e-05, "loss": 2.2515, "step": 69808 }, { "epoch": 0.87, "learning_rate": 2.7215319757435837e-05, "loss": 2.2466, "step": 69816 }, { "epoch": 0.87, "learning_rate": 2.7204141931683443e-05, "loss": 2.2623, "step": 69824 }, { "epoch": 0.87, "learning_rate": 2.719297240988647e-05, "loss": 2.2274, "step": 69832 }, { "epoch": 0.87, "learning_rate": 2.7181811193165147e-05, "loss": 2.2367, "step": 69840 }, { "epoch": 0.87, "learning_rate": 2.7170658282638895e-05, "loss": 2.254, "step": 69848 }, { "epoch": 0.87, "learning_rate": 2.7159513679426274e-05, "loss": 2.2372, "step": 69856 }, { "epoch": 0.87, "learning_rate": 2.7148377384645023e-05, "loss": 2.2248, "step": 69864 }, { "epoch": 0.87, "learning_rate": 2.713724939941209e-05, "loss": 2.2674, "step": 69872 }, { "epoch": 0.87, "learning_rate": 2.712612972484349e-05, "loss": 2.2531, "step": 69880 }, { "epoch": 0.87, "learning_rate": 2.711501836205449e-05, "loss": 2.2285, "step": 69888 }, { "epoch": 0.87, "learning_rate": 2.71039153121595e-05, "loss": 2.2471, "step": 69896 }, { "epoch": 0.87, "learning_rate": 2.7092820576272083e-05, "loss": 2.2504, "step": 69904 }, { "epoch": 0.87, "learning_rate": 2.7081734155505e-05, "loss": 2.2558, "step": 69912 }, { "epoch": 0.87, "learning_rate": 2.7070656050970134e-05, "loss": 2.2171, "step": 69920 }, { "epoch": 0.87, "learning_rate": 2.7059586263778534e-05, "loss": 2.2526, "step": 69928 }, { "epoch": 0.87, "learning_rate": 2.704852479504052e-05, "loss": 2.261, "step": 69936 }, { "epoch": 0.87, "learning_rate": 2.703747164586539e-05, "loss": 2.2546, "step": 69944 }, { "epoch": 0.87, "learning_rate": 2.7026426817361804e-05, "loss": 2.2314, "step": 69952 }, { "epoch": 0.87, "learning_rate": 2.701539031063742e-05, "loss": 2.2506, "step": 69960 }, { "epoch": 0.87, "learning_rate": 2.7004362126799183e-05, "loss": 2.2254, "step": 69968 }, { "epoch": 0.87, "learning_rate": 2.699334226695316e-05, "loss": 2.2268, "step": 69976 }, { "epoch": 0.87, "learning_rate": 2.698233073220453e-05, "loss": 2.2369, "step": 69984 }, { "epoch": 0.87, "learning_rate": 2.697132752365775e-05, "loss": 2.2345, "step": 69992 }, { "epoch": 0.88, "learning_rate": 2.6960332642416348e-05, "loss": 2.2376, "step": 70000 }, { "epoch": 0.88, "learning_rate": 2.6949346089583054e-05, "loss": 2.2457, "step": 70008 }, { "epoch": 0.88, "learning_rate": 2.6938367866259774e-05, "loss": 2.2338, "step": 70016 }, { "epoch": 0.88, "learning_rate": 2.692739797354752e-05, "loss": 2.2507, "step": 70024 }, { "epoch": 0.88, "learning_rate": 2.6916436412546537e-05, "loss": 2.2379, "step": 70032 }, { "epoch": 0.88, "learning_rate": 2.690548318435621e-05, "loss": 2.231, "step": 70040 }, { "epoch": 0.88, "learning_rate": 2.6894538290075078e-05, "loss": 2.2284, "step": 70048 }, { "epoch": 0.88, "learning_rate": 2.6883601730800844e-05, "loss": 2.2324, "step": 70056 }, { "epoch": 0.88, "learning_rate": 2.6872673507630414e-05, "loss": 2.25, "step": 70064 }, { "epoch": 0.88, "learning_rate": 2.686175362165979e-05, "loss": 2.2615, "step": 70072 }, { "epoch": 0.88, "learning_rate": 2.6850842073984196e-05, "loss": 2.2395, "step": 70080 }, { "epoch": 0.88, "learning_rate": 2.6839938865698e-05, "loss": 2.2541, "step": 70088 }, { "epoch": 0.88, "learning_rate": 2.6829043997894714e-05, "loss": 2.2388, "step": 70096 }, { "epoch": 0.88, "learning_rate": 2.6818157471667036e-05, "loss": 2.249, "step": 70104 }, { "epoch": 0.88, "learning_rate": 2.6807279288106845e-05, "loss": 2.2459, "step": 70112 }, { "epoch": 0.88, "learning_rate": 2.6796409448305145e-05, "loss": 2.2409, "step": 70120 }, { "epoch": 0.88, "learning_rate": 2.6785547953352108e-05, "loss": 2.2253, "step": 70128 }, { "epoch": 0.88, "learning_rate": 2.6774694804337093e-05, "loss": 2.2496, "step": 70136 }, { "epoch": 0.88, "learning_rate": 2.6763850002348622e-05, "loss": 2.2649, "step": 70144 }, { "epoch": 0.88, "learning_rate": 2.6753013548474347e-05, "loss": 2.2599, "step": 70152 }, { "epoch": 0.88, "learning_rate": 2.674218544380111e-05, "loss": 2.2362, "step": 70160 }, { "epoch": 0.88, "learning_rate": 2.6731365689414905e-05, "loss": 2.2124, "step": 70168 }, { "epoch": 0.88, "learning_rate": 2.6720554286400878e-05, "loss": 2.2433, "step": 70176 }, { "epoch": 0.88, "learning_rate": 2.6709751235843404e-05, "loss": 2.2515, "step": 70184 }, { "epoch": 0.88, "learning_rate": 2.6698956538825914e-05, "loss": 2.2439, "step": 70192 }, { "epoch": 0.88, "learning_rate": 2.668817019643106e-05, "loss": 2.2473, "step": 70200 }, { "epoch": 0.88, "learning_rate": 2.6677392209740704e-05, "loss": 2.2494, "step": 70208 }, { "epoch": 0.88, "learning_rate": 2.6666622579835733e-05, "loss": 2.2322, "step": 70216 }, { "epoch": 0.88, "learning_rate": 2.665586130779636e-05, "loss": 2.2667, "step": 70224 }, { "epoch": 0.88, "learning_rate": 2.6645108394701834e-05, "loss": 2.2428, "step": 70232 }, { "epoch": 0.88, "learning_rate": 2.6634363841630604e-05, "loss": 2.231, "step": 70240 }, { "epoch": 0.88, "learning_rate": 2.6623627649660322e-05, "loss": 2.2454, "step": 70248 }, { "epoch": 0.88, "learning_rate": 2.661289981986773e-05, "loss": 2.2518, "step": 70256 }, { "epoch": 0.88, "learning_rate": 2.660218035332881e-05, "loss": 2.231, "step": 70264 }, { "epoch": 0.88, "learning_rate": 2.6591469251118628e-05, "loss": 2.2453, "step": 70272 }, { "epoch": 0.88, "learning_rate": 2.658076651431148e-05, "loss": 2.2341, "step": 70280 }, { "epoch": 0.88, "learning_rate": 2.6570072143980766e-05, "loss": 2.2548, "step": 70288 }, { "epoch": 0.88, "learning_rate": 2.655938614119906e-05, "loss": 2.2648, "step": 70296 }, { "epoch": 0.88, "learning_rate": 2.6548708507038134e-05, "loss": 2.2509, "step": 70304 }, { "epoch": 0.88, "learning_rate": 2.6538039242568887e-05, "loss": 2.2511, "step": 70312 }, { "epoch": 0.88, "learning_rate": 2.6527378348861374e-05, "loss": 2.2556, "step": 70320 }, { "epoch": 0.88, "learning_rate": 2.651672582698484e-05, "loss": 2.2587, "step": 70328 }, { "epoch": 0.88, "learning_rate": 2.6506081678007656e-05, "loss": 2.2378, "step": 70336 }, { "epoch": 0.88, "learning_rate": 2.6495445902997383e-05, "loss": 2.2418, "step": 70344 }, { "epoch": 0.88, "learning_rate": 2.6484818503020714e-05, "loss": 2.2381, "step": 70352 }, { "epoch": 0.88, "learning_rate": 2.6474199479143535e-05, "loss": 2.2583, "step": 70360 }, { "epoch": 0.88, "learning_rate": 2.6463588832430864e-05, "loss": 2.2469, "step": 70368 }, { "epoch": 0.88, "learning_rate": 2.645298656394689e-05, "loss": 2.2353, "step": 70376 }, { "epoch": 0.88, "learning_rate": 2.644239267475495e-05, "loss": 2.2416, "step": 70384 }, { "epoch": 0.88, "learning_rate": 2.6431807165917572e-05, "loss": 2.2253, "step": 70392 }, { "epoch": 0.88, "learning_rate": 2.6421230038496413e-05, "loss": 2.2248, "step": 70400 }, { "epoch": 0.88, "learning_rate": 2.6410661293552296e-05, "loss": 2.2555, "step": 70408 }, { "epoch": 0.88, "learning_rate": 2.6400100932145205e-05, "loss": 2.2366, "step": 70416 }, { "epoch": 0.88, "learning_rate": 2.6389548955334282e-05, "loss": 2.257, "step": 70424 }, { "epoch": 0.88, "learning_rate": 2.6379005364177828e-05, "loss": 2.243, "step": 70432 }, { "epoch": 0.88, "learning_rate": 2.636847015973335e-05, "loss": 2.2432, "step": 70440 }, { "epoch": 0.88, "learning_rate": 2.6357943343057388e-05, "loss": 2.2539, "step": 70448 }, { "epoch": 0.88, "learning_rate": 2.6347424915205808e-05, "loss": 2.2385, "step": 70456 }, { "epoch": 0.88, "learning_rate": 2.6336914877233487e-05, "loss": 2.2434, "step": 70464 }, { "epoch": 0.88, "learning_rate": 2.632641323019453e-05, "loss": 2.2285, "step": 70472 }, { "epoch": 0.88, "learning_rate": 2.6315919975142234e-05, "loss": 2.2441, "step": 70480 }, { "epoch": 0.88, "learning_rate": 2.630543511312895e-05, "loss": 2.2404, "step": 70488 }, { "epoch": 0.88, "learning_rate": 2.6294958645206307e-05, "loss": 2.2343, "step": 70496 }, { "epoch": 0.88, "learning_rate": 2.6284490572425023e-05, "loss": 2.2448, "step": 70504 }, { "epoch": 0.88, "learning_rate": 2.627403089583495e-05, "loss": 2.2272, "step": 70512 }, { "epoch": 0.88, "learning_rate": 2.6263579616485185e-05, "loss": 2.2442, "step": 70520 }, { "epoch": 0.88, "learning_rate": 2.6253136735423884e-05, "loss": 2.2354, "step": 70528 }, { "epoch": 0.88, "learning_rate": 2.6242702253698444e-05, "loss": 2.2375, "step": 70536 }, { "epoch": 0.88, "learning_rate": 2.6232276172355386e-05, "loss": 2.253, "step": 70544 }, { "epoch": 0.88, "learning_rate": 2.622185849244035e-05, "loss": 2.2367, "step": 70552 }, { "epoch": 0.88, "learning_rate": 2.62114492149982e-05, "loss": 2.229, "step": 70560 }, { "epoch": 0.88, "learning_rate": 2.620104834107293e-05, "loss": 2.2321, "step": 70568 }, { "epoch": 0.88, "learning_rate": 2.619065587170768e-05, "loss": 2.231, "step": 70576 }, { "epoch": 0.88, "learning_rate": 2.6180271807944774e-05, "loss": 2.2498, "step": 70584 }, { "epoch": 0.88, "learning_rate": 2.6169896150825618e-05, "loss": 2.2471, "step": 70592 }, { "epoch": 0.88, "learning_rate": 2.615952890139089e-05, "loss": 2.2352, "step": 70600 }, { "epoch": 0.88, "learning_rate": 2.6149170060680344e-05, "loss": 2.2423, "step": 70608 }, { "epoch": 0.88, "learning_rate": 2.613881962973292e-05, "loss": 2.2388, "step": 70616 }, { "epoch": 0.88, "learning_rate": 2.6128477609586698e-05, "loss": 2.2416, "step": 70624 }, { "epoch": 0.88, "learning_rate": 2.611814400127894e-05, "loss": 2.2464, "step": 70632 }, { "epoch": 0.88, "learning_rate": 2.6107818805846028e-05, "loss": 2.2523, "step": 70640 }, { "epoch": 0.88, "learning_rate": 2.6097502024323538e-05, "loss": 2.2315, "step": 70648 }, { "epoch": 0.88, "learning_rate": 2.6087193657746173e-05, "loss": 2.231, "step": 70656 }, { "epoch": 0.88, "learning_rate": 2.6076893707147802e-05, "loss": 2.2401, "step": 70664 }, { "epoch": 0.88, "learning_rate": 2.6066602173561467e-05, "loss": 2.247, "step": 70672 }, { "epoch": 0.88, "learning_rate": 2.605631905801934e-05, "loss": 2.245, "step": 70680 }, { "epoch": 0.88, "learning_rate": 2.6046044361552752e-05, "loss": 2.2391, "step": 70688 }, { "epoch": 0.88, "learning_rate": 2.6035778085192218e-05, "loss": 2.2277, "step": 70696 }, { "epoch": 0.88, "learning_rate": 2.602552022996735e-05, "loss": 2.2423, "step": 70704 }, { "epoch": 0.88, "learning_rate": 2.601527079690701e-05, "loss": 2.2483, "step": 70712 }, { "epoch": 0.88, "learning_rate": 2.600502978703911e-05, "loss": 2.2175, "step": 70720 }, { "epoch": 0.88, "learning_rate": 2.599479720139078e-05, "loss": 2.2641, "step": 70728 }, { "epoch": 0.88, "learning_rate": 2.59845730409883e-05, "loss": 2.2322, "step": 70736 }, { "epoch": 0.88, "learning_rate": 2.597435730685706e-05, "loss": 2.2425, "step": 70744 }, { "epoch": 0.88, "learning_rate": 2.59641500000217e-05, "loss": 2.2098, "step": 70752 }, { "epoch": 0.88, "learning_rate": 2.595395112150591e-05, "loss": 2.2403, "step": 70760 }, { "epoch": 0.88, "learning_rate": 2.594376067233257e-05, "loss": 2.2539, "step": 70768 }, { "epoch": 0.88, "learning_rate": 2.5933578653523776e-05, "loss": 2.2437, "step": 70776 }, { "epoch": 0.88, "learning_rate": 2.592340506610067e-05, "loss": 2.2542, "step": 70784 }, { "epoch": 0.88, "learning_rate": 2.591323991108366e-05, "loss": 2.2404, "step": 70792 }, { "epoch": 0.89, "learning_rate": 2.59030831894922e-05, "loss": 2.2505, "step": 70800 }, { "epoch": 0.89, "learning_rate": 2.5892934902344985e-05, "loss": 2.2269, "step": 70808 }, { "epoch": 0.89, "learning_rate": 2.5882795050659836e-05, "loss": 2.2446, "step": 70816 }, { "epoch": 0.89, "learning_rate": 2.587266363545368e-05, "loss": 2.2335, "step": 70824 }, { "epoch": 0.89, "learning_rate": 2.586254065774269e-05, "loss": 2.2512, "step": 70832 }, { "epoch": 0.89, "learning_rate": 2.5852426118542123e-05, "loss": 2.2235, "step": 70840 }, { "epoch": 0.89, "learning_rate": 2.584232001886641e-05, "loss": 2.2458, "step": 70848 }, { "epoch": 0.89, "learning_rate": 2.583222235972914e-05, "loss": 2.221, "step": 70856 }, { "epoch": 0.89, "learning_rate": 2.5822133142143023e-05, "loss": 2.2457, "step": 70864 }, { "epoch": 0.89, "learning_rate": 2.581205236712e-05, "loss": 2.2718, "step": 70872 }, { "epoch": 0.89, "learning_rate": 2.5801980035671075e-05, "loss": 2.2216, "step": 70880 }, { "epoch": 0.89, "learning_rate": 2.5791916148806467e-05, "loss": 2.2622, "step": 70888 }, { "epoch": 0.89, "learning_rate": 2.578186070753552e-05, "loss": 2.2647, "step": 70896 }, { "epoch": 0.89, "learning_rate": 2.5771813712866728e-05, "loss": 2.2284, "step": 70904 }, { "epoch": 0.89, "learning_rate": 2.5761775165807766e-05, "loss": 2.2709, "step": 70912 }, { "epoch": 0.89, "learning_rate": 2.5751745067365434e-05, "loss": 2.2099, "step": 70920 }, { "epoch": 0.89, "learning_rate": 2.574172341854569e-05, "loss": 2.2521, "step": 70928 }, { "epoch": 0.89, "learning_rate": 2.5731710220353667e-05, "loss": 2.2364, "step": 70936 }, { "epoch": 0.89, "learning_rate": 2.5721705473793607e-05, "loss": 2.2263, "step": 70944 }, { "epoch": 0.89, "learning_rate": 2.5711709179868938e-05, "loss": 2.2395, "step": 70952 }, { "epoch": 0.89, "learning_rate": 2.5701721339582236e-05, "loss": 2.2513, "step": 70960 }, { "epoch": 0.89, "learning_rate": 2.5691741953935226e-05, "loss": 2.2285, "step": 70968 }, { "epoch": 0.89, "learning_rate": 2.5681771023928775e-05, "loss": 2.2477, "step": 70976 }, { "epoch": 0.89, "learning_rate": 2.5671808550562938e-05, "loss": 2.2382, "step": 70984 }, { "epoch": 0.89, "learning_rate": 2.566185453483685e-05, "loss": 2.2506, "step": 70992 }, { "epoch": 0.89, "learning_rate": 2.5651908977748884e-05, "loss": 2.2585, "step": 71000 }, { "epoch": 0.89, "learning_rate": 2.564197188029649e-05, "loss": 2.26, "step": 71008 }, { "epoch": 0.89, "learning_rate": 2.5632043243476306e-05, "loss": 2.2573, "step": 71016 }, { "epoch": 0.89, "learning_rate": 2.5622123068284164e-05, "loss": 2.2284, "step": 71024 }, { "epoch": 0.89, "learning_rate": 2.5612211355714947e-05, "loss": 2.2082, "step": 71032 }, { "epoch": 0.89, "learning_rate": 2.5602308106762756e-05, "loss": 2.2336, "step": 71040 }, { "epoch": 0.89, "learning_rate": 2.5592413322420867e-05, "loss": 2.2227, "step": 71048 }, { "epoch": 0.89, "learning_rate": 2.5582527003681607e-05, "loss": 2.2466, "step": 71056 }, { "epoch": 0.89, "learning_rate": 2.5572649151536583e-05, "loss": 2.2434, "step": 71064 }, { "epoch": 0.89, "learning_rate": 2.5562779766976436e-05, "loss": 2.2441, "step": 71072 }, { "epoch": 0.89, "learning_rate": 2.5552918850991027e-05, "loss": 2.2316, "step": 71080 }, { "epoch": 0.89, "learning_rate": 2.5543066404569376e-05, "loss": 2.2619, "step": 71088 }, { "epoch": 0.89, "learning_rate": 2.553322242869959e-05, "loss": 2.2562, "step": 71096 }, { "epoch": 0.89, "learning_rate": 2.5523386924368982e-05, "loss": 2.2597, "step": 71104 }, { "epoch": 0.89, "learning_rate": 2.551355989256401e-05, "loss": 2.2234, "step": 71112 }, { "epoch": 0.89, "learning_rate": 2.5503741334270226e-05, "loss": 2.2562, "step": 71120 }, { "epoch": 0.89, "learning_rate": 2.5493931250472425e-05, "loss": 2.2738, "step": 71128 }, { "epoch": 0.89, "learning_rate": 2.548412964215446e-05, "loss": 2.2414, "step": 71136 }, { "epoch": 0.89, "learning_rate": 2.5474336510299417e-05, "loss": 2.2605, "step": 71144 }, { "epoch": 0.89, "learning_rate": 2.5464551855889472e-05, "loss": 2.2252, "step": 71152 }, { "epoch": 0.89, "learning_rate": 2.5454775679905968e-05, "loss": 2.2447, "step": 71160 }, { "epoch": 0.89, "learning_rate": 2.54450079833294e-05, "loss": 2.2306, "step": 71168 }, { "epoch": 0.89, "learning_rate": 2.5435248767139425e-05, "loss": 2.2321, "step": 71176 }, { "epoch": 0.89, "learning_rate": 2.5425498032314832e-05, "loss": 2.2267, "step": 71184 }, { "epoch": 0.89, "learning_rate": 2.5415755779833543e-05, "loss": 2.2515, "step": 71192 }, { "epoch": 0.89, "learning_rate": 2.540602201067268e-05, "loss": 2.2403, "step": 71200 }, { "epoch": 0.89, "learning_rate": 2.5396296725808477e-05, "loss": 2.2613, "step": 71208 }, { "epoch": 0.89, "learning_rate": 2.5386579926216312e-05, "loss": 2.2538, "step": 71216 }, { "epoch": 0.89, "learning_rate": 2.5376871612870738e-05, "loss": 2.2423, "step": 71224 }, { "epoch": 0.89, "learning_rate": 2.5367171786745442e-05, "loss": 2.2674, "step": 71232 }, { "epoch": 0.89, "learning_rate": 2.535748044881326e-05, "loss": 2.2433, "step": 71240 }, { "epoch": 0.89, "learning_rate": 2.534779760004618e-05, "loss": 2.2525, "step": 71248 }, { "epoch": 0.89, "learning_rate": 2.5338123241415334e-05, "loss": 2.2384, "step": 71256 }, { "epoch": 0.89, "learning_rate": 2.5328457373890997e-05, "loss": 2.2438, "step": 71264 }, { "epoch": 0.89, "learning_rate": 2.531879999844262e-05, "loss": 2.2372, "step": 71272 }, { "epoch": 0.89, "learning_rate": 2.530915111603877e-05, "loss": 2.2423, "step": 71280 }, { "epoch": 0.89, "learning_rate": 2.529951072764718e-05, "loss": 2.241, "step": 71288 }, { "epoch": 0.89, "learning_rate": 2.5289878834234726e-05, "loss": 2.2451, "step": 71296 }, { "epoch": 0.89, "learning_rate": 2.528025543676743e-05, "loss": 2.232, "step": 71304 }, { "epoch": 0.89, "learning_rate": 2.527064053621045e-05, "loss": 2.2387, "step": 71312 }, { "epoch": 0.89, "learning_rate": 2.5261034133528138e-05, "loss": 2.2429, "step": 71320 }, { "epoch": 0.89, "learning_rate": 2.525143622968393e-05, "loss": 2.2372, "step": 71328 }, { "epoch": 0.89, "learning_rate": 2.5241846825640485e-05, "loss": 2.2613, "step": 71336 }, { "epoch": 0.89, "learning_rate": 2.5232265922359516e-05, "loss": 2.2501, "step": 71344 }, { "epoch": 0.89, "learning_rate": 2.5222693520801947e-05, "loss": 2.2455, "step": 71352 }, { "epoch": 0.89, "learning_rate": 2.521312962192786e-05, "loss": 2.2312, "step": 71360 }, { "epoch": 0.89, "learning_rate": 2.520357422669643e-05, "loss": 2.2335, "step": 71368 }, { "epoch": 0.89, "learning_rate": 2.5194027336066028e-05, "loss": 2.2451, "step": 71376 }, { "epoch": 0.89, "learning_rate": 2.5184488950994163e-05, "loss": 2.207, "step": 71384 }, { "epoch": 0.89, "learning_rate": 2.517495907243743e-05, "loss": 2.2572, "step": 71392 }, { "epoch": 0.89, "learning_rate": 2.5165437701351702e-05, "loss": 2.2407, "step": 71400 }, { "epoch": 0.89, "learning_rate": 2.515592483869183e-05, "loss": 2.2363, "step": 71408 }, { "epoch": 0.89, "learning_rate": 2.5146420485411958e-05, "loss": 2.2416, "step": 71416 }, { "epoch": 0.89, "learning_rate": 2.513692464246533e-05, "loss": 2.2361, "step": 71424 }, { "epoch": 0.89, "learning_rate": 2.5127437310804263e-05, "loss": 2.253, "step": 71432 }, { "epoch": 0.89, "learning_rate": 2.5117958491380337e-05, "loss": 2.259, "step": 71440 }, { "epoch": 0.89, "learning_rate": 2.5108488185144203e-05, "loss": 2.2423, "step": 71448 }, { "epoch": 0.89, "learning_rate": 2.5099026393045682e-05, "loss": 2.2262, "step": 71456 }, { "epoch": 0.89, "learning_rate": 2.508957311603376e-05, "loss": 2.2344, "step": 71464 }, { "epoch": 0.89, "learning_rate": 2.5080128355056483e-05, "loss": 2.2377, "step": 71472 }, { "epoch": 0.89, "learning_rate": 2.507069211106118e-05, "loss": 2.247, "step": 71480 }, { "epoch": 0.89, "learning_rate": 2.506126438499421e-05, "loss": 2.2473, "step": 71488 }, { "epoch": 0.89, "learning_rate": 2.5051845177801136e-05, "loss": 2.2285, "step": 71496 }, { "epoch": 0.89, "learning_rate": 2.5042434490426648e-05, "loss": 2.2405, "step": 71504 }, { "epoch": 0.89, "learning_rate": 2.5033032323814587e-05, "loss": 2.2332, "step": 71512 }, { "epoch": 0.89, "learning_rate": 2.5023638678907925e-05, "loss": 2.2419, "step": 71520 }, { "epoch": 0.89, "learning_rate": 2.5014253556648813e-05, "loss": 2.2503, "step": 71528 }, { "epoch": 0.89, "learning_rate": 2.5004876957978508e-05, "loss": 2.2474, "step": 71536 }, { "epoch": 0.89, "learning_rate": 2.499550888383742e-05, "loss": 2.2355, "step": 71544 }, { "epoch": 0.89, "learning_rate": 2.4986149335165166e-05, "loss": 2.2421, "step": 71552 }, { "epoch": 0.89, "learning_rate": 2.4976798312900394e-05, "loss": 2.2343, "step": 71560 }, { "epoch": 0.89, "learning_rate": 2.496745581798099e-05, "loss": 2.2387, "step": 71568 }, { "epoch": 0.89, "learning_rate": 2.4958121851343943e-05, "loss": 2.2423, "step": 71576 }, { "epoch": 0.89, "learning_rate": 2.4948796413925384e-05, "loss": 2.2533, "step": 71584 }, { "epoch": 0.89, "learning_rate": 2.493947950666065e-05, "loss": 2.237, "step": 71592 }, { "epoch": 0.9, "learning_rate": 2.493017113048413e-05, "loss": 2.2426, "step": 71600 }, { "epoch": 0.9, "learning_rate": 2.4920871286329396e-05, "loss": 2.2578, "step": 71608 }, { "epoch": 0.9, "learning_rate": 2.491157997512921e-05, "loss": 2.2512, "step": 71616 }, { "epoch": 0.9, "learning_rate": 2.49022971978154e-05, "loss": 2.2414, "step": 71624 }, { "epoch": 0.9, "learning_rate": 2.489302295531901e-05, "loss": 2.2216, "step": 71632 }, { "epoch": 0.9, "learning_rate": 2.4883757248570156e-05, "loss": 2.238, "step": 71640 }, { "epoch": 0.9, "learning_rate": 2.487450007849815e-05, "loss": 2.252, "step": 71648 }, { "epoch": 0.9, "learning_rate": 2.4865251446031466e-05, "loss": 2.2622, "step": 71656 }, { "epoch": 0.9, "learning_rate": 2.4856011352097634e-05, "loss": 2.2203, "step": 71664 }, { "epoch": 0.9, "learning_rate": 2.4846779797623418e-05, "loss": 2.2486, "step": 71672 }, { "epoch": 0.9, "learning_rate": 2.4837556783534682e-05, "loss": 2.263, "step": 71680 }, { "epoch": 0.9, "learning_rate": 2.482834231075646e-05, "loss": 2.2584, "step": 71688 }, { "epoch": 0.9, "learning_rate": 2.481913638021289e-05, "loss": 2.2488, "step": 71696 }, { "epoch": 0.9, "learning_rate": 2.4809938992827265e-05, "loss": 2.2176, "step": 71704 }, { "epoch": 0.9, "learning_rate": 2.4800750149522052e-05, "loss": 2.2406, "step": 71712 }, { "epoch": 0.9, "learning_rate": 2.479156985121884e-05, "loss": 2.241, "step": 71720 }, { "epoch": 0.9, "learning_rate": 2.478239809883834e-05, "loss": 2.2553, "step": 71728 }, { "epoch": 0.9, "learning_rate": 2.4773234893300457e-05, "loss": 2.2085, "step": 71736 }, { "epoch": 0.9, "learning_rate": 2.476408023552418e-05, "loss": 2.2558, "step": 71744 }, { "epoch": 0.9, "learning_rate": 2.4754934126427693e-05, "loss": 2.2164, "step": 71752 }, { "epoch": 0.9, "learning_rate": 2.474579656692829e-05, "loss": 2.2482, "step": 71760 }, { "epoch": 0.9, "learning_rate": 2.4736667557942408e-05, "loss": 2.2404, "step": 71768 }, { "epoch": 0.9, "learning_rate": 2.472754710038564e-05, "loss": 2.2312, "step": 71776 }, { "epoch": 0.9, "learning_rate": 2.4718435195172714e-05, "loss": 2.2645, "step": 71784 }, { "epoch": 0.9, "learning_rate": 2.4709331843217513e-05, "loss": 2.2436, "step": 71792 }, { "epoch": 0.9, "learning_rate": 2.470023704543304e-05, "loss": 2.2385, "step": 71800 }, { "epoch": 0.9, "learning_rate": 2.4691150802731462e-05, "loss": 2.2283, "step": 71808 }, { "epoch": 0.9, "learning_rate": 2.4682073116024074e-05, "loss": 2.2222, "step": 71816 }, { "epoch": 0.9, "learning_rate": 2.4673003986221305e-05, "loss": 2.2497, "step": 71824 }, { "epoch": 0.9, "learning_rate": 2.466394341423275e-05, "loss": 2.2376, "step": 71832 }, { "epoch": 0.9, "learning_rate": 2.4654891400967137e-05, "loss": 2.2467, "step": 71840 }, { "epoch": 0.9, "learning_rate": 2.4645847947332316e-05, "loss": 2.2292, "step": 71848 }, { "epoch": 0.9, "learning_rate": 2.4636813054235286e-05, "loss": 2.262, "step": 71856 }, { "epoch": 0.9, "learning_rate": 2.462778672258225e-05, "loss": 2.2515, "step": 71864 }, { "epoch": 0.9, "learning_rate": 2.4618768953278443e-05, "loss": 2.2694, "step": 71872 }, { "epoch": 0.9, "learning_rate": 2.460975974722829e-05, "loss": 2.2376, "step": 71880 }, { "epoch": 0.9, "learning_rate": 2.4600759105335423e-05, "loss": 2.2451, "step": 71888 }, { "epoch": 0.9, "learning_rate": 2.4591767028502496e-05, "loss": 2.2445, "step": 71896 }, { "epoch": 0.9, "learning_rate": 2.4582783517631407e-05, "loss": 2.2358, "step": 71904 }, { "epoch": 0.9, "learning_rate": 2.457380857362311e-05, "loss": 2.2382, "step": 71912 }, { "epoch": 0.9, "learning_rate": 2.4564842197377763e-05, "loss": 2.2368, "step": 71920 }, { "epoch": 0.9, "learning_rate": 2.4555884389794665e-05, "loss": 2.2267, "step": 71928 }, { "epoch": 0.9, "learning_rate": 2.4546935151772176e-05, "loss": 2.2466, "step": 71936 }, { "epoch": 0.9, "learning_rate": 2.45379944842079e-05, "loss": 2.2288, "step": 71944 }, { "epoch": 0.9, "learning_rate": 2.4529062387998544e-05, "loss": 2.2312, "step": 71952 }, { "epoch": 0.9, "learning_rate": 2.4520138864039895e-05, "loss": 2.2384, "step": 71960 }, { "epoch": 0.9, "learning_rate": 2.451122391322699e-05, "loss": 2.2516, "step": 71968 }, { "epoch": 0.9, "learning_rate": 2.4502317536453888e-05, "loss": 2.2426, "step": 71976 }, { "epoch": 0.9, "learning_rate": 2.4493419734613895e-05, "loss": 2.2497, "step": 71984 }, { "epoch": 0.9, "learning_rate": 2.448453050859942e-05, "loss": 2.2436, "step": 71992 }, { "epoch": 0.9, "learning_rate": 2.4475649859301942e-05, "loss": 2.2314, "step": 72000 }, { "epoch": 0.9, "learning_rate": 2.4466777787612188e-05, "loss": 2.2255, "step": 72008 }, { "epoch": 0.9, "learning_rate": 2.445791429441997e-05, "loss": 2.2361, "step": 72016 }, { "epoch": 0.9, "learning_rate": 2.4449059380614235e-05, "loss": 2.2421, "step": 72024 }, { "epoch": 0.9, "learning_rate": 2.4440213047083088e-05, "loss": 2.2444, "step": 72032 }, { "epoch": 0.9, "learning_rate": 2.443137529471376e-05, "loss": 2.2237, "step": 72040 }, { "epoch": 0.9, "learning_rate": 2.4422546124392634e-05, "loss": 2.2472, "step": 72048 }, { "epoch": 0.9, "learning_rate": 2.4413725537005222e-05, "loss": 2.2488, "step": 72056 }, { "epoch": 0.9, "learning_rate": 2.4404913533436186e-05, "loss": 2.2232, "step": 72064 }, { "epoch": 0.9, "learning_rate": 2.4396110114569306e-05, "loss": 2.2529, "step": 72072 }, { "epoch": 0.9, "learning_rate": 2.4387315281287533e-05, "loss": 2.2511, "step": 72080 }, { "epoch": 0.9, "learning_rate": 2.4378529034472916e-05, "loss": 2.2327, "step": 72088 }, { "epoch": 0.9, "learning_rate": 2.436975137500669e-05, "loss": 2.2384, "step": 72096 }, { "epoch": 0.9, "learning_rate": 2.4360982303769183e-05, "loss": 2.2277, "step": 72104 }, { "epoch": 0.9, "learning_rate": 2.4352221821639904e-05, "loss": 2.2349, "step": 72112 }, { "epoch": 0.9, "learning_rate": 2.4343469929497463e-05, "loss": 2.2447, "step": 72120 }, { "epoch": 0.9, "learning_rate": 2.433472662821963e-05, "loss": 2.2593, "step": 72128 }, { "epoch": 0.9, "learning_rate": 2.4325991918683318e-05, "loss": 2.2425, "step": 72136 }, { "epoch": 0.9, "learning_rate": 2.4317265801764555e-05, "loss": 2.2288, "step": 72144 }, { "epoch": 0.9, "learning_rate": 2.4308548278338517e-05, "loss": 2.2612, "step": 72152 }, { "epoch": 0.9, "learning_rate": 2.4299839349279556e-05, "loss": 2.2252, "step": 72160 }, { "epoch": 0.9, "learning_rate": 2.429113901546109e-05, "loss": 2.2297, "step": 72168 }, { "epoch": 0.9, "learning_rate": 2.428244727775573e-05, "loss": 2.2373, "step": 72176 }, { "epoch": 0.9, "learning_rate": 2.4273764137035205e-05, "loss": 2.226, "step": 72184 }, { "epoch": 0.9, "learning_rate": 2.426508959417037e-05, "loss": 2.2365, "step": 72192 }, { "epoch": 0.9, "learning_rate": 2.4256423650031275e-05, "loss": 2.2273, "step": 72200 }, { "epoch": 0.9, "learning_rate": 2.4247766305487012e-05, "loss": 2.2509, "step": 72208 }, { "epoch": 0.9, "learning_rate": 2.4239117561405905e-05, "loss": 2.2645, "step": 72216 }, { "epoch": 0.9, "learning_rate": 2.4230477418655377e-05, "loss": 2.2291, "step": 72224 }, { "epoch": 0.9, "learning_rate": 2.4221845878101928e-05, "loss": 2.2258, "step": 72232 }, { "epoch": 0.9, "learning_rate": 2.421322294061133e-05, "loss": 2.2296, "step": 72240 }, { "epoch": 0.9, "learning_rate": 2.4204608607048344e-05, "loss": 2.2507, "step": 72248 }, { "epoch": 0.9, "learning_rate": 2.419600287827698e-05, "loss": 2.2416, "step": 72256 }, { "epoch": 0.9, "learning_rate": 2.4187405755160354e-05, "loss": 2.2535, "step": 72264 }, { "epoch": 0.9, "learning_rate": 2.417881723856066e-05, "loss": 2.2291, "step": 72272 }, { "epoch": 0.9, "learning_rate": 2.4170237329339324e-05, "loss": 2.2499, "step": 72280 }, { "epoch": 0.9, "learning_rate": 2.416166602835684e-05, "loss": 2.2451, "step": 72288 }, { "epoch": 0.9, "learning_rate": 2.415310333647287e-05, "loss": 2.2463, "step": 72296 }, { "epoch": 0.9, "learning_rate": 2.4144549254546218e-05, "loss": 2.2284, "step": 72304 }, { "epoch": 0.9, "learning_rate": 2.4136003783434765e-05, "loss": 2.2449, "step": 72312 }, { "epoch": 0.9, "learning_rate": 2.412746692399561e-05, "loss": 2.2328, "step": 72320 }, { "epoch": 0.9, "learning_rate": 2.4118938677084942e-05, "loss": 2.2147, "step": 72328 }, { "epoch": 0.9, "learning_rate": 2.411041904355809e-05, "loss": 2.2534, "step": 72336 }, { "epoch": 0.9, "learning_rate": 2.4101908024269546e-05, "loss": 2.2433, "step": 72344 }, { "epoch": 0.9, "learning_rate": 2.4093405620072887e-05, "loss": 2.2412, "step": 72352 }, { "epoch": 0.9, "learning_rate": 2.4084911831820876e-05, "loss": 2.2381, "step": 72360 }, { "epoch": 0.9, "learning_rate": 2.4076426660365385e-05, "loss": 2.2363, "step": 72368 }, { "epoch": 0.9, "learning_rate": 2.4067950106557436e-05, "loss": 2.2731, "step": 72376 }, { "epoch": 0.9, "learning_rate": 2.4059482171247154e-05, "loss": 2.2359, "step": 72384 }, { "epoch": 0.9, "learning_rate": 2.4051022855283866e-05, "loss": 2.2324, "step": 72392 }, { "epoch": 0.91, "learning_rate": 2.4042572159515968e-05, "loss": 2.2496, "step": 72400 }, { "epoch": 0.91, "learning_rate": 2.403413008479102e-05, "loss": 2.244, "step": 72408 }, { "epoch": 0.91, "learning_rate": 2.4025696631955712e-05, "loss": 2.2523, "step": 72416 }, { "epoch": 0.91, "learning_rate": 2.401727180185586e-05, "loss": 2.2378, "step": 72424 }, { "epoch": 0.91, "learning_rate": 2.400885559533648e-05, "loss": 2.2199, "step": 72432 }, { "epoch": 0.91, "learning_rate": 2.40004480132416e-05, "loss": 2.2172, "step": 72440 }, { "epoch": 0.91, "learning_rate": 2.3992049056414485e-05, "loss": 2.2259, "step": 72448 }, { "epoch": 0.91, "learning_rate": 2.3983658725697518e-05, "loss": 2.2466, "step": 72456 }, { "epoch": 0.91, "learning_rate": 2.3975277021932168e-05, "loss": 2.2305, "step": 72464 }, { "epoch": 0.91, "learning_rate": 2.396690394595911e-05, "loss": 2.2357, "step": 72472 }, { "epoch": 0.91, "learning_rate": 2.3958539498618082e-05, "loss": 2.2139, "step": 72480 }, { "epoch": 0.91, "learning_rate": 2.3950183680747993e-05, "loss": 2.233, "step": 72488 }, { "epoch": 0.91, "learning_rate": 2.394183649318692e-05, "loss": 2.2435, "step": 72496 }, { "epoch": 0.91, "learning_rate": 2.3933497936771994e-05, "loss": 2.2604, "step": 72504 }, { "epoch": 0.91, "learning_rate": 2.3925168012339557e-05, "loss": 2.2299, "step": 72512 }, { "epoch": 0.91, "learning_rate": 2.391684672072505e-05, "loss": 2.2552, "step": 72520 }, { "epoch": 0.91, "learning_rate": 2.390853406276302e-05, "loss": 2.2435, "step": 72528 }, { "epoch": 0.91, "learning_rate": 2.3900230039287222e-05, "loss": 2.2323, "step": 72536 }, { "epoch": 0.91, "learning_rate": 2.3891934651130466e-05, "loss": 2.2479, "step": 72544 }, { "epoch": 0.91, "learning_rate": 2.388364789912476e-05, "loss": 2.2519, "step": 72552 }, { "epoch": 0.91, "learning_rate": 2.387536978410121e-05, "loss": 2.2426, "step": 72560 }, { "epoch": 0.91, "learning_rate": 2.386710030689005e-05, "loss": 2.2562, "step": 72568 }, { "epoch": 0.91, "learning_rate": 2.3858839468320684e-05, "loss": 2.2445, "step": 72576 }, { "epoch": 0.91, "learning_rate": 2.3850587269221615e-05, "loss": 2.2157, "step": 72584 }, { "epoch": 0.91, "learning_rate": 2.3842343710420487e-05, "loss": 2.234, "step": 72592 }, { "epoch": 0.91, "learning_rate": 2.3834108792744093e-05, "loss": 2.2532, "step": 72600 }, { "epoch": 0.91, "learning_rate": 2.3825882517018343e-05, "loss": 2.2421, "step": 72608 }, { "epoch": 0.91, "learning_rate": 2.3817664884068293e-05, "loss": 2.2458, "step": 72616 }, { "epoch": 0.91, "learning_rate": 2.3809455894718114e-05, "loss": 2.2349, "step": 72624 }, { "epoch": 0.91, "learning_rate": 2.380125554979113e-05, "loss": 2.2359, "step": 72632 }, { "epoch": 0.91, "learning_rate": 2.379306385010978e-05, "loss": 2.2359, "step": 72640 }, { "epoch": 0.91, "learning_rate": 2.378488079649565e-05, "loss": 2.2504, "step": 72648 }, { "epoch": 0.91, "learning_rate": 2.3776706389769457e-05, "loss": 2.2283, "step": 72656 }, { "epoch": 0.91, "learning_rate": 2.3768540630751054e-05, "loss": 2.2394, "step": 72664 }, { "epoch": 0.91, "learning_rate": 2.3760383520259394e-05, "loss": 2.2448, "step": 72672 }, { "epoch": 0.91, "learning_rate": 2.3752235059112615e-05, "loss": 2.2354, "step": 72680 }, { "epoch": 0.91, "learning_rate": 2.3744095248127953e-05, "loss": 2.2217, "step": 72688 }, { "epoch": 0.91, "learning_rate": 2.3735964088121787e-05, "loss": 2.2614, "step": 72696 }, { "epoch": 0.91, "learning_rate": 2.3727841579909617e-05, "loss": 2.2403, "step": 72704 }, { "epoch": 0.91, "learning_rate": 2.3719727724306103e-05, "loss": 2.2361, "step": 72712 }, { "epoch": 0.91, "learning_rate": 2.3711622522124992e-05, "loss": 2.246, "step": 72720 }, { "epoch": 0.91, "learning_rate": 2.3703525974179223e-05, "loss": 2.2425, "step": 72728 }, { "epoch": 0.91, "learning_rate": 2.369543808128079e-05, "loss": 2.2479, "step": 72736 }, { "epoch": 0.91, "learning_rate": 2.3687358844240918e-05, "loss": 2.2534, "step": 72744 }, { "epoch": 0.91, "learning_rate": 2.3679288263869868e-05, "loss": 2.2172, "step": 72752 }, { "epoch": 0.91, "learning_rate": 2.367122634097707e-05, "loss": 2.2632, "step": 72760 }, { "epoch": 0.91, "learning_rate": 2.3663173076371133e-05, "loss": 2.2315, "step": 72768 }, { "epoch": 0.91, "learning_rate": 2.3655128470859696e-05, "loss": 2.2397, "step": 72776 }, { "epoch": 0.91, "learning_rate": 2.3647092525249638e-05, "loss": 2.2361, "step": 72784 }, { "epoch": 0.91, "learning_rate": 2.3639065240346896e-05, "loss": 2.2346, "step": 72792 }, { "epoch": 0.91, "learning_rate": 2.3631046616956543e-05, "loss": 2.2343, "step": 72800 }, { "epoch": 0.91, "learning_rate": 2.3623036655882845e-05, "loss": 2.263, "step": 72808 }, { "epoch": 0.91, "learning_rate": 2.361503535792911e-05, "loss": 2.2355, "step": 72816 }, { "epoch": 0.91, "learning_rate": 2.360704272389785e-05, "loss": 2.2362, "step": 72824 }, { "epoch": 0.91, "learning_rate": 2.3599058754590693e-05, "loss": 2.2481, "step": 72832 }, { "epoch": 0.91, "learning_rate": 2.3591083450808348e-05, "loss": 2.2473, "step": 72840 }, { "epoch": 0.91, "learning_rate": 2.3583116813350718e-05, "loss": 2.2281, "step": 72848 }, { "epoch": 0.91, "learning_rate": 2.357515884301681e-05, "loss": 2.2411, "step": 72856 }, { "epoch": 0.91, "learning_rate": 2.3567209540604757e-05, "loss": 2.2526, "step": 72864 }, { "epoch": 0.91, "learning_rate": 2.3559268906911843e-05, "loss": 2.2414, "step": 72872 }, { "epoch": 0.91, "learning_rate": 2.3551336942734437e-05, "loss": 2.2606, "step": 72880 }, { "epoch": 0.91, "learning_rate": 2.354341364886811e-05, "loss": 2.2315, "step": 72888 }, { "epoch": 0.91, "learning_rate": 2.3535499026107486e-05, "loss": 2.2453, "step": 72896 }, { "epoch": 0.91, "learning_rate": 2.352759307524639e-05, "loss": 2.2432, "step": 72904 }, { "epoch": 0.91, "learning_rate": 2.3519695797077716e-05, "loss": 2.2373, "step": 72912 }, { "epoch": 0.91, "learning_rate": 2.3511807192393536e-05, "loss": 2.2215, "step": 72920 }, { "epoch": 0.91, "learning_rate": 2.3503927261985035e-05, "loss": 2.2476, "step": 72928 }, { "epoch": 0.91, "learning_rate": 2.3496056006642507e-05, "loss": 2.235, "step": 72936 }, { "epoch": 0.91, "learning_rate": 2.3488193427155402e-05, "loss": 2.2443, "step": 72944 }, { "epoch": 0.91, "learning_rate": 2.3480339524312296e-05, "loss": 2.2372, "step": 72952 }, { "epoch": 0.91, "learning_rate": 2.3472494298900888e-05, "loss": 2.2146, "step": 72960 }, { "epoch": 0.91, "learning_rate": 2.3464657751708003e-05, "loss": 2.2418, "step": 72968 }, { "epoch": 0.91, "learning_rate": 2.3456829883519615e-05, "loss": 2.2437, "step": 72976 }, { "epoch": 0.91, "learning_rate": 2.3449010695120803e-05, "loss": 2.2618, "step": 72984 }, { "epoch": 0.91, "learning_rate": 2.344120018729579e-05, "loss": 2.218, "step": 72992 }, { "epoch": 0.91, "learning_rate": 2.3433398360827954e-05, "loss": 2.2361, "step": 73000 }, { "epoch": 0.91, "learning_rate": 2.3425605216499736e-05, "loss": 2.2446, "step": 73008 }, { "epoch": 0.91, "learning_rate": 2.3417820755092755e-05, "loss": 2.2199, "step": 73016 }, { "epoch": 0.91, "learning_rate": 2.3410044977387745e-05, "loss": 2.2439, "step": 73024 }, { "epoch": 0.91, "learning_rate": 2.3402277884164576e-05, "loss": 2.2437, "step": 73032 }, { "epoch": 0.91, "learning_rate": 2.3394519476202258e-05, "loss": 2.2289, "step": 73040 }, { "epoch": 0.91, "learning_rate": 2.3386769754278902e-05, "loss": 2.244, "step": 73048 }, { "epoch": 0.91, "learning_rate": 2.3379028719171746e-05, "loss": 2.2458, "step": 73056 }, { "epoch": 0.91, "learning_rate": 2.337129637165721e-05, "loss": 2.234, "step": 73064 }, { "epoch": 0.91, "learning_rate": 2.3363572712510757e-05, "loss": 2.2549, "step": 73072 }, { "epoch": 0.91, "learning_rate": 2.3355857742507083e-05, "loss": 2.2332, "step": 73080 }, { "epoch": 0.91, "learning_rate": 2.334815146241989e-05, "loss": 2.2226, "step": 73088 }, { "epoch": 0.91, "learning_rate": 2.3340453873022126e-05, "loss": 2.2375, "step": 73096 }, { "epoch": 0.91, "learning_rate": 2.3332764975085812e-05, "loss": 2.2267, "step": 73104 }, { "epoch": 0.91, "learning_rate": 2.3325084769382067e-05, "loss": 2.2389, "step": 73112 }, { "epoch": 0.91, "learning_rate": 2.3317413256681205e-05, "loss": 2.2213, "step": 73120 }, { "epoch": 0.91, "learning_rate": 2.3309750437752616e-05, "loss": 2.2467, "step": 73128 }, { "epoch": 0.91, "learning_rate": 2.3302096313364847e-05, "loss": 2.2128, "step": 73136 }, { "epoch": 0.91, "learning_rate": 2.3294450884285567e-05, "loss": 2.2412, "step": 73144 }, { "epoch": 0.91, "learning_rate": 2.328681415128155e-05, "loss": 2.2498, "step": 73152 }, { "epoch": 0.91, "learning_rate": 2.3279186115118727e-05, "loss": 2.2464, "step": 73160 }, { "epoch": 0.91, "learning_rate": 2.327156677656216e-05, "loss": 2.2272, "step": 73168 }, { "epoch": 0.91, "learning_rate": 2.326395613637602e-05, "loss": 2.2558, "step": 73176 }, { "epoch": 0.91, "learning_rate": 2.325635419532359e-05, "loss": 2.2422, "step": 73184 }, { "epoch": 0.91, "learning_rate": 2.3248760954167325e-05, "loss": 2.2183, "step": 73192 }, { "epoch": 0.92, "learning_rate": 2.3241176413668785e-05, "loss": 2.2405, "step": 73200 }, { "epoch": 0.92, "learning_rate": 2.323360057458864e-05, "loss": 2.2438, "step": 73208 }, { "epoch": 0.92, "learning_rate": 2.3226033437686713e-05, "loss": 2.2333, "step": 73216 }, { "epoch": 0.92, "learning_rate": 2.3218475003721937e-05, "loss": 2.2523, "step": 73224 }, { "epoch": 0.92, "learning_rate": 2.3210925273452393e-05, "loss": 2.2477, "step": 73232 }, { "epoch": 0.92, "learning_rate": 2.3203384247635274e-05, "loss": 2.2445, "step": 73240 }, { "epoch": 0.92, "learning_rate": 2.3195851927026893e-05, "loss": 2.2506, "step": 73248 }, { "epoch": 0.92, "learning_rate": 2.3188328312382704e-05, "loss": 2.2442, "step": 73256 }, { "epoch": 0.92, "learning_rate": 2.318081340445728e-05, "loss": 2.2323, "step": 73264 }, { "epoch": 0.92, "learning_rate": 2.317330720400434e-05, "loss": 2.2358, "step": 73272 }, { "epoch": 0.92, "learning_rate": 2.3165809711776692e-05, "loss": 2.2431, "step": 73280 }, { "epoch": 0.92, "learning_rate": 2.315832092852629e-05, "loss": 2.2532, "step": 73288 }, { "epoch": 0.92, "learning_rate": 2.315084085500425e-05, "loss": 2.2188, "step": 73296 }, { "epoch": 0.92, "learning_rate": 2.314336949196074e-05, "loss": 2.225, "step": 73304 }, { "epoch": 0.92, "learning_rate": 2.3135906840145122e-05, "loss": 2.2402, "step": 73312 }, { "epoch": 0.92, "learning_rate": 2.312845290030585e-05, "loss": 2.2209, "step": 73320 }, { "epoch": 0.92, "learning_rate": 2.3121007673190487e-05, "loss": 2.241, "step": 73328 }, { "epoch": 0.92, "learning_rate": 2.3113571159545804e-05, "loss": 2.2372, "step": 73336 }, { "epoch": 0.92, "learning_rate": 2.3106143360117582e-05, "loss": 2.2319, "step": 73344 }, { "epoch": 0.92, "learning_rate": 2.309872427565083e-05, "loss": 2.2489, "step": 73352 }, { "epoch": 0.92, "learning_rate": 2.309131390688963e-05, "loss": 2.2549, "step": 73360 }, { "epoch": 0.92, "learning_rate": 2.3083912254577166e-05, "loss": 2.2468, "step": 73368 }, { "epoch": 0.92, "learning_rate": 2.307651931945584e-05, "loss": 2.2375, "step": 73376 }, { "epoch": 0.92, "learning_rate": 2.3069135102267067e-05, "loss": 2.2609, "step": 73384 }, { "epoch": 0.92, "learning_rate": 2.306175960375147e-05, "loss": 2.251, "step": 73392 }, { "epoch": 0.92, "learning_rate": 2.3054392824648786e-05, "loss": 2.2297, "step": 73400 }, { "epoch": 0.92, "learning_rate": 2.3047034765697812e-05, "loss": 2.2424, "step": 73408 }, { "epoch": 0.92, "learning_rate": 2.3039685427636555e-05, "loss": 2.2385, "step": 73416 }, { "epoch": 0.92, "learning_rate": 2.3032344811202112e-05, "loss": 2.2333, "step": 73424 }, { "epoch": 0.92, "learning_rate": 2.30250129171307e-05, "loss": 2.2453, "step": 73432 }, { "epoch": 0.92, "learning_rate": 2.301768974615766e-05, "loss": 2.2435, "step": 73440 }, { "epoch": 0.92, "learning_rate": 2.301037529901748e-05, "loss": 2.2157, "step": 73448 }, { "epoch": 0.92, "learning_rate": 2.3003069576443737e-05, "loss": 2.2493, "step": 73456 }, { "epoch": 0.92, "learning_rate": 2.2995772579169167e-05, "loss": 2.2574, "step": 73464 }, { "epoch": 0.92, "learning_rate": 2.2988484307925616e-05, "loss": 2.2287, "step": 73472 }, { "epoch": 0.92, "learning_rate": 2.2981204763444047e-05, "loss": 2.2468, "step": 73480 }, { "epoch": 0.92, "learning_rate": 2.297393394645457e-05, "loss": 2.2125, "step": 73488 }, { "epoch": 0.92, "learning_rate": 2.2966671857686405e-05, "loss": 2.2367, "step": 73496 }, { "epoch": 0.92, "learning_rate": 2.2959418497867882e-05, "loss": 2.2361, "step": 73504 }, { "epoch": 0.92, "learning_rate": 2.2952173867726504e-05, "loss": 2.2535, "step": 73512 }, { "epoch": 0.92, "learning_rate": 2.2944937967988834e-05, "loss": 2.2436, "step": 73520 }, { "epoch": 0.92, "learning_rate": 2.29377107993806e-05, "loss": 2.2437, "step": 73528 }, { "epoch": 0.92, "learning_rate": 2.293049236262666e-05, "loss": 2.2429, "step": 73536 }, { "epoch": 0.92, "learning_rate": 2.2923282658450974e-05, "loss": 2.2349, "step": 73544 }, { "epoch": 0.92, "learning_rate": 2.2916081687576624e-05, "loss": 2.2485, "step": 73552 }, { "epoch": 0.92, "learning_rate": 2.2908889450725828e-05, "loss": 2.2416, "step": 73560 }, { "epoch": 0.92, "learning_rate": 2.2901705948619965e-05, "loss": 2.2445, "step": 73568 }, { "epoch": 0.92, "learning_rate": 2.289453118197945e-05, "loss": 2.2475, "step": 73576 }, { "epoch": 0.92, "learning_rate": 2.28873651515239e-05, "loss": 2.2672, "step": 73584 }, { "epoch": 0.92, "learning_rate": 2.288020785797201e-05, "loss": 2.2272, "step": 73592 }, { "epoch": 0.92, "learning_rate": 2.2873059302041616e-05, "loss": 2.2342, "step": 73600 }, { "epoch": 0.92, "learning_rate": 2.2865919484449696e-05, "loss": 2.2638, "step": 73608 }, { "epoch": 0.92, "learning_rate": 2.2858788405912316e-05, "loss": 2.2553, "step": 73616 }, { "epoch": 0.92, "learning_rate": 2.2851666067144695e-05, "loss": 2.2227, "step": 73624 }, { "epoch": 0.92, "learning_rate": 2.284455246886117e-05, "loss": 2.2435, "step": 73632 }, { "epoch": 0.92, "learning_rate": 2.2837447611775158e-05, "loss": 2.2444, "step": 73640 }, { "epoch": 0.92, "learning_rate": 2.2830351496599283e-05, "loss": 2.2393, "step": 73648 }, { "epoch": 0.92, "learning_rate": 2.2823264124045197e-05, "loss": 2.2453, "step": 73656 }, { "epoch": 0.92, "learning_rate": 2.2816185494823765e-05, "loss": 2.2238, "step": 73664 }, { "epoch": 0.92, "learning_rate": 2.2809115609644926e-05, "loss": 2.2321, "step": 73672 }, { "epoch": 0.92, "learning_rate": 2.280205446921772e-05, "loss": 2.2292, "step": 73680 }, { "epoch": 0.92, "learning_rate": 2.279500207425037e-05, "loss": 2.2216, "step": 73688 }, { "epoch": 0.92, "learning_rate": 2.278795842545019e-05, "loss": 2.2499, "step": 73696 }, { "epoch": 0.92, "learning_rate": 2.2780923523523594e-05, "loss": 2.2472, "step": 73704 }, { "epoch": 0.92, "learning_rate": 2.277389736917618e-05, "loss": 2.2353, "step": 73712 }, { "epoch": 0.92, "learning_rate": 2.2766879963112585e-05, "loss": 2.2495, "step": 73720 }, { "epoch": 0.92, "learning_rate": 2.2759871306036642e-05, "loss": 2.2578, "step": 73728 }, { "epoch": 0.92, "learning_rate": 2.275287139865128e-05, "loss": 2.2326, "step": 73736 }, { "epoch": 0.92, "learning_rate": 2.274588024165855e-05, "loss": 2.2488, "step": 73744 }, { "epoch": 0.92, "learning_rate": 2.2738897835759632e-05, "loss": 2.2316, "step": 73752 }, { "epoch": 0.92, "learning_rate": 2.2731924181654802e-05, "loss": 2.2325, "step": 73760 }, { "epoch": 0.92, "learning_rate": 2.2724959280043493e-05, "loss": 2.2398, "step": 73768 }, { "epoch": 0.92, "learning_rate": 2.2718003131624244e-05, "loss": 2.2366, "step": 73776 }, { "epoch": 0.92, "learning_rate": 2.2711055737094705e-05, "loss": 2.2219, "step": 73784 }, { "epoch": 0.92, "learning_rate": 2.270411709715167e-05, "loss": 2.2491, "step": 73792 }, { "epoch": 0.92, "learning_rate": 2.2697187212491044e-05, "loss": 2.2384, "step": 73800 }, { "epoch": 0.92, "learning_rate": 2.2690266083807858e-05, "loss": 2.2363, "step": 73808 }, { "epoch": 0.92, "learning_rate": 2.2683353711796265e-05, "loss": 2.2424, "step": 73816 }, { "epoch": 0.92, "learning_rate": 2.2676450097149528e-05, "loss": 2.2354, "step": 73824 }, { "epoch": 0.92, "learning_rate": 2.266955524056003e-05, "loss": 2.2519, "step": 73832 }, { "epoch": 0.92, "learning_rate": 2.266266914271932e-05, "loss": 2.253, "step": 73840 }, { "epoch": 0.92, "learning_rate": 2.2655791804318004e-05, "loss": 2.2375, "step": 73848 }, { "epoch": 0.92, "learning_rate": 2.2648923226045855e-05, "loss": 2.2244, "step": 73856 }, { "epoch": 0.92, "learning_rate": 2.264206340859174e-05, "loss": 2.2306, "step": 73864 }, { "epoch": 0.92, "learning_rate": 2.2635212352643668e-05, "loss": 2.2539, "step": 73872 }, { "epoch": 0.92, "learning_rate": 2.2628370058888776e-05, "loss": 2.2418, "step": 73880 }, { "epoch": 0.92, "learning_rate": 2.2621536528013284e-05, "loss": 2.2527, "step": 73888 }, { "epoch": 0.92, "learning_rate": 2.2614711760702555e-05, "loss": 2.2277, "step": 73896 }, { "epoch": 0.92, "learning_rate": 2.2607895757641095e-05, "loss": 2.2313, "step": 73904 }, { "epoch": 0.92, "learning_rate": 2.2601088519512496e-05, "loss": 2.2304, "step": 73912 }, { "epoch": 0.92, "learning_rate": 2.2594290046999498e-05, "loss": 2.2391, "step": 73920 }, { "epoch": 0.92, "learning_rate": 2.258750034078393e-05, "loss": 2.244, "step": 73928 }, { "epoch": 0.92, "learning_rate": 2.2580719401546764e-05, "loss": 2.2447, "step": 73936 }, { "epoch": 0.92, "learning_rate": 2.2573947229968116e-05, "loss": 2.2323, "step": 73944 }, { "epoch": 0.92, "learning_rate": 2.2567183826727155e-05, "loss": 2.2453, "step": 73952 }, { "epoch": 0.92, "learning_rate": 2.2560429192502245e-05, "loss": 2.2421, "step": 73960 }, { "epoch": 0.92, "learning_rate": 2.255368332797083e-05, "loss": 2.2383, "step": 73968 }, { "epoch": 0.92, "learning_rate": 2.254694623380948e-05, "loss": 2.2425, "step": 73976 }, { "epoch": 0.92, "learning_rate": 2.2540217910693895e-05, "loss": 2.2526, "step": 73984 }, { "epoch": 0.92, "learning_rate": 2.253349835929886e-05, "loss": 2.2678, "step": 73992 }, { "epoch": 0.93, "learning_rate": 2.2526787580298332e-05, "loss": 2.2509, "step": 74000 }, { "epoch": 0.93, "learning_rate": 2.2520085574365368e-05, "loss": 2.2405, "step": 74008 }, { "epoch": 0.93, "learning_rate": 2.251339234217213e-05, "loss": 2.214, "step": 74016 }, { "epoch": 0.93, "learning_rate": 2.2506707884389907e-05, "loss": 2.2212, "step": 74024 }, { "epoch": 0.93, "learning_rate": 2.2500032201689118e-05, "loss": 2.2477, "step": 74032 }, { "epoch": 0.93, "learning_rate": 2.2493365294739305e-05, "loss": 2.2135, "step": 74040 }, { "epoch": 0.93, "learning_rate": 2.2486707164209112e-05, "loss": 2.2225, "step": 74048 }, { "epoch": 0.93, "learning_rate": 2.2480057810766304e-05, "loss": 2.2488, "step": 74056 }, { "epoch": 0.93, "learning_rate": 2.2473417235077793e-05, "loss": 2.2312, "step": 74064 }, { "epoch": 0.93, "learning_rate": 2.246678543780958e-05, "loss": 2.2213, "step": 74072 }, { "epoch": 0.93, "learning_rate": 2.246016241962679e-05, "loss": 2.2471, "step": 74080 }, { "epoch": 0.93, "learning_rate": 2.2453548181193686e-05, "loss": 2.2164, "step": 74088 }, { "epoch": 0.93, "learning_rate": 2.2446942723173632e-05, "loss": 2.2524, "step": 74096 }, { "epoch": 0.93, "learning_rate": 2.2440346046229122e-05, "loss": 2.2369, "step": 74104 }, { "epoch": 0.93, "learning_rate": 2.2433758151021757e-05, "loss": 2.2337, "step": 74112 }, { "epoch": 0.93, "learning_rate": 2.2427179038212282e-05, "loss": 2.2543, "step": 74120 }, { "epoch": 0.93, "learning_rate": 2.2420608708460517e-05, "loss": 2.2668, "step": 74128 }, { "epoch": 0.93, "learning_rate": 2.2414047162425464e-05, "loss": 2.2326, "step": 74136 }, { "epoch": 0.93, "learning_rate": 2.240749440076518e-05, "loss": 2.2321, "step": 74144 }, { "epoch": 0.93, "learning_rate": 2.24009504241369e-05, "loss": 2.2145, "step": 74152 }, { "epoch": 0.93, "learning_rate": 2.2394415233196913e-05, "loss": 2.2554, "step": 74160 }, { "epoch": 0.93, "learning_rate": 2.2387888828600674e-05, "loss": 2.225, "step": 74168 }, { "epoch": 0.93, "learning_rate": 2.238137121100276e-05, "loss": 2.2486, "step": 74176 }, { "epoch": 0.93, "learning_rate": 2.237486238105682e-05, "loss": 2.2354, "step": 74184 }, { "epoch": 0.93, "learning_rate": 2.2368362339415687e-05, "loss": 2.2372, "step": 74192 }, { "epoch": 0.93, "learning_rate": 2.236187108673127e-05, "loss": 2.2425, "step": 74200 }, { "epoch": 0.93, "learning_rate": 2.235538862365458e-05, "loss": 2.2495, "step": 74208 }, { "epoch": 0.93, "learning_rate": 2.2348914950835802e-05, "loss": 2.2478, "step": 74216 }, { "epoch": 0.93, "learning_rate": 2.2342450068924187e-05, "loss": 2.2495, "step": 74224 }, { "epoch": 0.93, "learning_rate": 2.2335993978568147e-05, "loss": 2.253, "step": 74232 }, { "epoch": 0.93, "learning_rate": 2.232954668041518e-05, "loss": 2.2379, "step": 74240 }, { "epoch": 0.93, "learning_rate": 2.232310817511189e-05, "loss": 2.2293, "step": 74248 }, { "epoch": 0.93, "learning_rate": 2.2316678463304063e-05, "loss": 2.2253, "step": 74256 }, { "epoch": 0.93, "learning_rate": 2.2310257545636545e-05, "loss": 2.2323, "step": 74264 }, { "epoch": 0.93, "learning_rate": 2.2303845422753315e-05, "loss": 2.2411, "step": 74272 }, { "epoch": 0.93, "learning_rate": 2.2297442095297484e-05, "loss": 2.2255, "step": 74280 }, { "epoch": 0.93, "learning_rate": 2.2291047563911245e-05, "loss": 2.2447, "step": 74288 }, { "epoch": 0.93, "learning_rate": 2.2284661829235952e-05, "loss": 2.2515, "step": 74296 }, { "epoch": 0.93, "learning_rate": 2.227828489191206e-05, "loss": 2.2521, "step": 74304 }, { "epoch": 0.93, "learning_rate": 2.227191675257913e-05, "loss": 2.2384, "step": 74312 }, { "epoch": 0.93, "learning_rate": 2.226555741187586e-05, "loss": 2.2222, "step": 74320 }, { "epoch": 0.93, "learning_rate": 2.2259206870440054e-05, "loss": 2.2283, "step": 74328 }, { "epoch": 0.93, "learning_rate": 2.225286512890863e-05, "loss": 2.2227, "step": 74336 }, { "epoch": 0.93, "learning_rate": 2.2246532187917622e-05, "loss": 2.2353, "step": 74344 }, { "epoch": 0.93, "learning_rate": 2.2240208048102204e-05, "loss": 2.2332, "step": 74352 }, { "epoch": 0.93, "learning_rate": 2.223389271009665e-05, "loss": 2.2411, "step": 74360 }, { "epoch": 0.93, "learning_rate": 2.2227586174534346e-05, "loss": 2.2463, "step": 74368 }, { "epoch": 0.93, "learning_rate": 2.222128844204779e-05, "loss": 2.2389, "step": 74376 }, { "epoch": 0.93, "learning_rate": 2.221499951326863e-05, "loss": 2.2362, "step": 74384 }, { "epoch": 0.93, "learning_rate": 2.2208719388827606e-05, "loss": 2.2432, "step": 74392 }, { "epoch": 0.93, "learning_rate": 2.220244806935456e-05, "loss": 2.2397, "step": 74400 }, { "epoch": 0.93, "learning_rate": 2.2196185555478503e-05, "loss": 2.2443, "step": 74408 }, { "epoch": 0.93, "learning_rate": 2.2189931847827505e-05, "loss": 2.2294, "step": 74416 }, { "epoch": 0.93, "learning_rate": 2.2183686947028775e-05, "loss": 2.2347, "step": 74424 }, { "epoch": 0.93, "learning_rate": 2.2177450853708653e-05, "loss": 2.2404, "step": 74432 }, { "epoch": 0.93, "learning_rate": 2.2171223568492575e-05, "loss": 2.2496, "step": 74440 }, { "epoch": 0.93, "learning_rate": 2.2165005092005124e-05, "loss": 2.2322, "step": 74448 }, { "epoch": 0.93, "learning_rate": 2.2158795424869953e-05, "loss": 2.2258, "step": 74456 }, { "epoch": 0.93, "learning_rate": 2.215259456770986e-05, "loss": 2.2242, "step": 74464 }, { "epoch": 0.93, "learning_rate": 2.2146402521146776e-05, "loss": 2.2418, "step": 74472 }, { "epoch": 0.93, "learning_rate": 2.214021928580169e-05, "loss": 2.2343, "step": 74480 }, { "epoch": 0.93, "learning_rate": 2.2134044862294793e-05, "loss": 2.2341, "step": 74488 }, { "epoch": 0.93, "learning_rate": 2.2127879251245298e-05, "loss": 2.2423, "step": 74496 }, { "epoch": 0.93, "learning_rate": 2.2121722453271615e-05, "loss": 2.2222, "step": 74504 }, { "epoch": 0.93, "learning_rate": 2.2115574468991234e-05, "loss": 2.2346, "step": 74512 }, { "epoch": 0.93, "learning_rate": 2.2109435299020738e-05, "loss": 2.2403, "step": 74520 }, { "epoch": 0.93, "learning_rate": 2.210330494397587e-05, "loss": 2.2356, "step": 74528 }, { "epoch": 0.93, "learning_rate": 2.2097183404471472e-05, "loss": 2.2358, "step": 74536 }, { "epoch": 0.93, "learning_rate": 2.2091070681121487e-05, "loss": 2.221, "step": 74544 }, { "epoch": 0.93, "learning_rate": 2.2084966774539002e-05, "loss": 2.2475, "step": 74552 }, { "epoch": 0.93, "learning_rate": 2.2078871685336177e-05, "loss": 2.2547, "step": 74560 }, { "epoch": 0.93, "learning_rate": 2.2072785414124344e-05, "loss": 2.2278, "step": 74568 }, { "epoch": 0.93, "learning_rate": 2.206670796151391e-05, "loss": 2.2455, "step": 74576 }, { "epoch": 0.93, "learning_rate": 2.2060639328114418e-05, "loss": 2.2492, "step": 74584 }, { "epoch": 0.93, "learning_rate": 2.2054579514534497e-05, "loss": 2.2276, "step": 74592 }, { "epoch": 0.93, "learning_rate": 2.204852852138194e-05, "loss": 2.2211, "step": 74600 }, { "epoch": 0.93, "learning_rate": 2.204248634926359e-05, "loss": 2.2473, "step": 74608 }, { "epoch": 0.93, "learning_rate": 2.2036452998785483e-05, "loss": 2.2257, "step": 74616 }, { "epoch": 0.93, "learning_rate": 2.203042847055271e-05, "loss": 2.2306, "step": 74624 }, { "epoch": 0.93, "learning_rate": 2.2024412765169485e-05, "loss": 2.2487, "step": 74632 }, { "epoch": 0.93, "learning_rate": 2.201840588323917e-05, "loss": 2.2304, "step": 74640 }, { "epoch": 0.93, "learning_rate": 2.2012407825364224e-05, "loss": 2.2428, "step": 74648 }, { "epoch": 0.93, "learning_rate": 2.20064185921462e-05, "loss": 2.2495, "step": 74656 }, { "epoch": 0.93, "learning_rate": 2.200043818418579e-05, "loss": 2.2406, "step": 74664 }, { "epoch": 0.93, "learning_rate": 2.1994466602082787e-05, "loss": 2.2218, "step": 74672 }, { "epoch": 0.93, "learning_rate": 2.198850384643614e-05, "loss": 2.2199, "step": 74680 }, { "epoch": 0.93, "learning_rate": 2.198254991784384e-05, "loss": 2.2365, "step": 74688 }, { "epoch": 0.93, "learning_rate": 2.1976604816903057e-05, "loss": 2.2437, "step": 74696 }, { "epoch": 0.93, "learning_rate": 2.197066854421004e-05, "loss": 2.2447, "step": 74704 }, { "epoch": 0.93, "learning_rate": 2.196474110036015e-05, "loss": 2.232, "step": 74712 }, { "epoch": 0.93, "learning_rate": 2.195882248594792e-05, "loss": 2.2239, "step": 74720 }, { "epoch": 0.93, "learning_rate": 2.1952912701566915e-05, "loss": 2.2467, "step": 74728 }, { "epoch": 0.93, "learning_rate": 2.1947011747809853e-05, "loss": 2.2503, "step": 74736 }, { "epoch": 0.93, "learning_rate": 2.194111962526859e-05, "loss": 2.2403, "step": 74744 }, { "epoch": 0.93, "learning_rate": 2.193523633453405e-05, "loss": 2.237, "step": 74752 }, { "epoch": 0.93, "learning_rate": 2.192936187619632e-05, "loss": 2.2312, "step": 74760 }, { "epoch": 0.93, "learning_rate": 2.1923496250844545e-05, "loss": 2.2346, "step": 74768 }, { "epoch": 0.93, "learning_rate": 2.1917639459067017e-05, "loss": 2.2353, "step": 74776 }, { "epoch": 0.93, "learning_rate": 2.1911791501451173e-05, "loss": 2.2112, "step": 74784 }, { "epoch": 0.93, "learning_rate": 2.190595237858349e-05, "loss": 2.2431, "step": 74792 }, { "epoch": 0.94, "learning_rate": 2.190012209104962e-05, "loss": 2.2456, "step": 74800 }, { "epoch": 0.94, "learning_rate": 2.1894300639434298e-05, "loss": 2.2187, "step": 74808 }, { "epoch": 0.94, "learning_rate": 2.1888488024321395e-05, "loss": 2.2246, "step": 74816 }, { "epoch": 0.94, "learning_rate": 2.1882684246293877e-05, "loss": 2.2386, "step": 74824 }, { "epoch": 0.94, "learning_rate": 2.1876889305933813e-05, "loss": 2.2439, "step": 74832 }, { "epoch": 0.94, "learning_rate": 2.187110320382244e-05, "loss": 2.2476, "step": 74840 }, { "epoch": 0.94, "learning_rate": 2.186532594054004e-05, "loss": 2.2203, "step": 74848 }, { "epoch": 0.94, "learning_rate": 2.1859557516666044e-05, "loss": 2.2419, "step": 74856 }, { "epoch": 0.94, "learning_rate": 2.1853797932779003e-05, "loss": 2.2227, "step": 74864 }, { "epoch": 0.94, "learning_rate": 2.184804718945657e-05, "loss": 2.2541, "step": 74872 }, { "epoch": 0.94, "learning_rate": 2.18423052872755e-05, "loss": 2.2235, "step": 74880 }, { "epoch": 0.94, "learning_rate": 2.1836572226811686e-05, "loss": 2.2348, "step": 74888 }, { "epoch": 0.94, "learning_rate": 2.1830848008640108e-05, "loss": 2.2277, "step": 74896 }, { "epoch": 0.94, "learning_rate": 2.1825132633334893e-05, "loss": 2.2353, "step": 74904 }, { "epoch": 0.94, "learning_rate": 2.1819426101469235e-05, "loss": 2.2291, "step": 74912 }, { "epoch": 0.94, "learning_rate": 2.1813728413615496e-05, "loss": 2.204, "step": 74920 }, { "epoch": 0.94, "learning_rate": 2.1808039570345097e-05, "loss": 2.2422, "step": 74928 }, { "epoch": 0.94, "learning_rate": 2.18023595722286e-05, "loss": 2.2405, "step": 74936 }, { "epoch": 0.94, "learning_rate": 2.1796688419835697e-05, "loss": 2.2357, "step": 74944 }, { "epoch": 0.94, "learning_rate": 2.179102611373514e-05, "loss": 2.2395, "step": 74952 }, { "epoch": 0.94, "learning_rate": 2.1785372654494857e-05, "loss": 2.2342, "step": 74960 }, { "epoch": 0.94, "learning_rate": 2.177972804268184e-05, "loss": 2.2323, "step": 74968 }, { "epoch": 0.94, "learning_rate": 2.1774092278862223e-05, "loss": 2.231, "step": 74976 }, { "epoch": 0.94, "learning_rate": 2.1768465363601216e-05, "loss": 2.2238, "step": 74984 }, { "epoch": 0.94, "learning_rate": 2.1762847297463215e-05, "loss": 2.2265, "step": 74992 }, { "epoch": 0.94, "learning_rate": 2.1757238081011637e-05, "loss": 2.2464, "step": 75000 }, { "epoch": 0.94, "learning_rate": 2.1751637714809063e-05, "loss": 2.2364, "step": 75008 }, { "epoch": 0.94, "learning_rate": 2.174604619941719e-05, "loss": 2.2308, "step": 75016 }, { "epoch": 0.94, "learning_rate": 2.1740463535396795e-05, "loss": 2.2516, "step": 75024 }, { "epoch": 0.94, "learning_rate": 2.1734889723307818e-05, "loss": 2.2361, "step": 75032 }, { "epoch": 0.94, "learning_rate": 2.1729324763709264e-05, "loss": 2.2388, "step": 75040 }, { "epoch": 0.94, "learning_rate": 2.172376865715926e-05, "loss": 2.2584, "step": 75048 }, { "epoch": 0.94, "learning_rate": 2.1718221404215065e-05, "loss": 2.2253, "step": 75056 }, { "epoch": 0.94, "learning_rate": 2.1712683005433018e-05, "loss": 2.2283, "step": 75064 }, { "epoch": 0.94, "learning_rate": 2.1707153461368617e-05, "loss": 2.2354, "step": 75072 }, { "epoch": 0.94, "learning_rate": 2.170163277257643e-05, "loss": 2.2322, "step": 75080 }, { "epoch": 0.94, "learning_rate": 2.1696120939610137e-05, "loss": 2.2576, "step": 75088 }, { "epoch": 0.94, "learning_rate": 2.1690617963022554e-05, "loss": 2.2361, "step": 75096 }, { "epoch": 0.94, "learning_rate": 2.1685123843365613e-05, "loss": 2.2428, "step": 75104 }, { "epoch": 0.94, "learning_rate": 2.1679638581190324e-05, "loss": 2.2447, "step": 75112 }, { "epoch": 0.94, "learning_rate": 2.167416217704685e-05, "loss": 2.2353, "step": 75120 }, { "epoch": 0.94, "learning_rate": 2.166869463148441e-05, "loss": 2.2542, "step": 75128 }, { "epoch": 0.94, "learning_rate": 2.1663235945051392e-05, "loss": 2.2343, "step": 75136 }, { "epoch": 0.94, "learning_rate": 2.1657786118295256e-05, "loss": 2.2461, "step": 75144 }, { "epoch": 0.94, "learning_rate": 2.1652345151762614e-05, "loss": 2.2224, "step": 75152 }, { "epoch": 0.94, "learning_rate": 2.164691304599914e-05, "loss": 2.2271, "step": 75160 }, { "epoch": 0.94, "learning_rate": 2.164148980154965e-05, "loss": 2.2227, "step": 75168 }, { "epoch": 0.94, "learning_rate": 2.1636075418958067e-05, "loss": 2.2508, "step": 75176 }, { "epoch": 0.94, "learning_rate": 2.1630669898767417e-05, "loss": 2.2357, "step": 75184 }, { "epoch": 0.94, "learning_rate": 2.1625273241519855e-05, "loss": 2.2426, "step": 75192 }, { "epoch": 0.94, "learning_rate": 2.161988544775662e-05, "loss": 2.2377, "step": 75200 }, { "epoch": 0.94, "learning_rate": 2.1614506518018094e-05, "loss": 2.2481, "step": 75208 }, { "epoch": 0.94, "learning_rate": 2.1609136452843744e-05, "loss": 2.2258, "step": 75216 }, { "epoch": 0.94, "learning_rate": 2.160377525277216e-05, "loss": 2.2032, "step": 75224 }, { "epoch": 0.94, "learning_rate": 2.1598422918341026e-05, "loss": 2.2316, "step": 75232 }, { "epoch": 0.94, "learning_rate": 2.1593079450087166e-05, "loss": 2.2341, "step": 75240 }, { "epoch": 0.94, "learning_rate": 2.158774484854651e-05, "loss": 2.2407, "step": 75248 }, { "epoch": 0.94, "learning_rate": 2.1582419114254056e-05, "loss": 2.2417, "step": 75256 }, { "epoch": 0.94, "learning_rate": 2.1577102247743973e-05, "loss": 2.2406, "step": 75264 }, { "epoch": 0.94, "learning_rate": 2.1571794249549502e-05, "loss": 2.2199, "step": 75272 }, { "epoch": 0.94, "learning_rate": 2.1566495120202995e-05, "loss": 2.2576, "step": 75280 }, { "epoch": 0.94, "learning_rate": 2.1561204860235952e-05, "loss": 2.2155, "step": 75288 }, { "epoch": 0.94, "learning_rate": 2.1555923470178934e-05, "loss": 2.2335, "step": 75296 }, { "epoch": 0.94, "learning_rate": 2.155065095056163e-05, "loss": 2.2478, "step": 75304 }, { "epoch": 0.94, "learning_rate": 2.1545387301912873e-05, "loss": 2.2459, "step": 75312 }, { "epoch": 0.94, "learning_rate": 2.1540132524760534e-05, "loss": 2.26, "step": 75320 }, { "epoch": 0.94, "learning_rate": 2.1534886619631683e-05, "loss": 2.2326, "step": 75328 }, { "epoch": 0.94, "learning_rate": 2.1529649587052415e-05, "loss": 2.2193, "step": 75336 }, { "epoch": 0.94, "learning_rate": 2.1524421427548002e-05, "loss": 2.2322, "step": 75344 }, { "epoch": 0.94, "learning_rate": 2.1519202141642805e-05, "loss": 2.253, "step": 75352 }, { "epoch": 0.94, "learning_rate": 2.1513991729860243e-05, "loss": 2.2394, "step": 75360 }, { "epoch": 0.94, "learning_rate": 2.1508790192722942e-05, "loss": 2.228, "step": 75368 }, { "epoch": 0.94, "learning_rate": 2.1503597530752563e-05, "loss": 2.2567, "step": 75376 }, { "epoch": 0.94, "learning_rate": 2.1498413744469898e-05, "loss": 2.2294, "step": 75384 }, { "epoch": 0.94, "learning_rate": 2.149323883439487e-05, "loss": 2.2359, "step": 75392 }, { "epoch": 0.94, "learning_rate": 2.148807280104646e-05, "loss": 2.2376, "step": 75400 }, { "epoch": 0.94, "learning_rate": 2.1482915644942824e-05, "loss": 2.2386, "step": 75408 }, { "epoch": 0.94, "learning_rate": 2.147776736660119e-05, "loss": 2.2475, "step": 75416 }, { "epoch": 0.94, "learning_rate": 2.1472627966537884e-05, "loss": 2.238, "step": 75424 }, { "epoch": 0.94, "learning_rate": 2.1467497445268367e-05, "loss": 2.2305, "step": 75432 }, { "epoch": 0.94, "learning_rate": 2.146237580330721e-05, "loss": 2.2387, "step": 75440 }, { "epoch": 0.94, "learning_rate": 2.1457263041168072e-05, "loss": 2.2314, "step": 75448 }, { "epoch": 0.94, "learning_rate": 2.1452159159363742e-05, "loss": 2.2354, "step": 75456 }, { "epoch": 0.94, "learning_rate": 2.1447064158406117e-05, "loss": 2.2385, "step": 75464 }, { "epoch": 0.94, "learning_rate": 2.1441978038806173e-05, "loss": 2.2464, "step": 75472 }, { "epoch": 0.94, "learning_rate": 2.143690080107405e-05, "loss": 2.2307, "step": 75480 }, { "epoch": 0.94, "learning_rate": 2.143183244571894e-05, "loss": 2.2457, "step": 75488 }, { "epoch": 0.94, "learning_rate": 2.142677297324919e-05, "loss": 2.2368, "step": 75496 }, { "epoch": 0.94, "learning_rate": 2.142172238417222e-05, "loss": 2.231, "step": 75504 }, { "epoch": 0.94, "learning_rate": 2.1416680678994573e-05, "loss": 2.2311, "step": 75512 }, { "epoch": 0.94, "learning_rate": 2.1411647858221933e-05, "loss": 2.2324, "step": 75520 }, { "epoch": 0.94, "learning_rate": 2.1406623922359037e-05, "loss": 2.2232, "step": 75528 }, { "epoch": 0.94, "learning_rate": 2.140160887190976e-05, "loss": 2.2303, "step": 75536 }, { "epoch": 0.94, "learning_rate": 2.1396602707377092e-05, "loss": 2.2486, "step": 75544 }, { "epoch": 0.94, "learning_rate": 2.1391605429263105e-05, "loss": 2.2087, "step": 75552 }, { "epoch": 0.94, "learning_rate": 2.1386617038069028e-05, "loss": 2.2148, "step": 75560 }, { "epoch": 0.94, "learning_rate": 2.1381637534295142e-05, "loss": 2.2314, "step": 75568 }, { "epoch": 0.94, "learning_rate": 2.1376666918440866e-05, "loss": 2.2323, "step": 75576 }, { "epoch": 0.94, "learning_rate": 2.137170519100474e-05, "loss": 2.2413, "step": 75584 }, { "epoch": 0.94, "learning_rate": 2.136675235248438e-05, "loss": 2.2466, "step": 75592 }, { "epoch": 0.94, "learning_rate": 2.1361808403376545e-05, "loss": 2.2355, "step": 75600 }, { "epoch": 0.95, "learning_rate": 2.135687334417708e-05, "loss": 2.2621, "step": 75608 }, { "epoch": 0.95, "learning_rate": 2.135194717538092e-05, "loss": 2.2427, "step": 75616 }, { "epoch": 0.95, "learning_rate": 2.1347029897482162e-05, "loss": 2.2395, "step": 75624 }, { "epoch": 0.95, "learning_rate": 2.1342121510973965e-05, "loss": 2.2454, "step": 75632 }, { "epoch": 0.95, "learning_rate": 2.1337222016348623e-05, "loss": 2.2385, "step": 75640 }, { "epoch": 0.95, "learning_rate": 2.1332331414097532e-05, "loss": 2.251, "step": 75648 }, { "epoch": 0.95, "learning_rate": 2.1327449704711154e-05, "loss": 2.2387, "step": 75656 }, { "epoch": 0.95, "learning_rate": 2.1322576888679147e-05, "loss": 2.2252, "step": 75664 }, { "epoch": 0.95, "learning_rate": 2.1317712966490194e-05, "loss": 2.254, "step": 75672 }, { "epoch": 0.95, "learning_rate": 2.131285793863213e-05, "loss": 2.2415, "step": 75680 }, { "epoch": 0.95, "learning_rate": 2.130801180559188e-05, "loss": 2.2133, "step": 75688 }, { "epoch": 0.95, "learning_rate": 2.1303174567855504e-05, "loss": 2.2506, "step": 75696 }, { "epoch": 0.95, "learning_rate": 2.1298346225908124e-05, "loss": 2.2317, "step": 75704 }, { "epoch": 0.95, "learning_rate": 2.1293526780234015e-05, "loss": 2.2606, "step": 75712 }, { "epoch": 0.95, "learning_rate": 2.128871623131652e-05, "loss": 2.2449, "step": 75720 }, { "epoch": 0.95, "learning_rate": 2.1283914579638127e-05, "loss": 2.2413, "step": 75728 }, { "epoch": 0.95, "learning_rate": 2.127912182568041e-05, "loss": 2.2343, "step": 75736 }, { "epoch": 0.95, "learning_rate": 2.1274337969924053e-05, "loss": 2.2433, "step": 75744 }, { "epoch": 0.95, "learning_rate": 2.1269563012848852e-05, "loss": 2.2403, "step": 75752 }, { "epoch": 0.95, "learning_rate": 2.1264796954933705e-05, "loss": 2.2141, "step": 75760 }, { "epoch": 0.95, "learning_rate": 2.126003979665662e-05, "loss": 2.249, "step": 75768 }, { "epoch": 0.95, "learning_rate": 2.1255291538494716e-05, "loss": 2.246, "step": 75776 }, { "epoch": 0.95, "learning_rate": 2.125055218092422e-05, "loss": 2.2447, "step": 75784 }, { "epoch": 0.95, "learning_rate": 2.1245821724420452e-05, "loss": 2.2255, "step": 75792 }, { "epoch": 0.95, "learning_rate": 2.1241100169457858e-05, "loss": 2.2512, "step": 75800 }, { "epoch": 0.95, "learning_rate": 2.1236387516509975e-05, "loss": 2.2507, "step": 75808 }, { "epoch": 0.95, "learning_rate": 2.1231683766049474e-05, "loss": 2.2261, "step": 75816 }, { "epoch": 0.95, "learning_rate": 2.12269889185481e-05, "loss": 2.2401, "step": 75824 }, { "epoch": 0.95, "learning_rate": 2.1222302974476722e-05, "loss": 2.2361, "step": 75832 }, { "epoch": 0.95, "learning_rate": 2.1217625934305306e-05, "loss": 2.251, "step": 75840 }, { "epoch": 0.95, "learning_rate": 2.1212957798502937e-05, "loss": 2.2386, "step": 75848 }, { "epoch": 0.95, "learning_rate": 2.1208298567537817e-05, "loss": 2.2223, "step": 75856 }, { "epoch": 0.95, "learning_rate": 2.1203648241877217e-05, "loss": 2.2267, "step": 75864 }, { "epoch": 0.95, "learning_rate": 2.119900682198757e-05, "loss": 2.238, "step": 75872 }, { "epoch": 0.95, "learning_rate": 2.119437430833435e-05, "loss": 2.2564, "step": 75880 }, { "epoch": 0.95, "learning_rate": 2.1189750701382184e-05, "loss": 2.2322, "step": 75888 }, { "epoch": 0.95, "learning_rate": 2.1185136001594807e-05, "loss": 2.2453, "step": 75896 }, { "epoch": 0.95, "learning_rate": 2.1180530209435026e-05, "loss": 2.2442, "step": 75904 }, { "epoch": 0.95, "learning_rate": 2.1175933325364788e-05, "loss": 2.2405, "step": 75912 }, { "epoch": 0.95, "learning_rate": 2.117134534984514e-05, "loss": 2.2277, "step": 75920 }, { "epoch": 0.95, "learning_rate": 2.1166766283336213e-05, "loss": 2.2376, "step": 75928 }, { "epoch": 0.95, "learning_rate": 2.1162196126297286e-05, "loss": 2.2292, "step": 75936 }, { "epoch": 0.95, "learning_rate": 2.1157634879186693e-05, "loss": 2.2351, "step": 75944 }, { "epoch": 0.95, "learning_rate": 2.115308254246191e-05, "loss": 2.217, "step": 75952 }, { "epoch": 0.95, "learning_rate": 2.1148539116579526e-05, "loss": 2.2187, "step": 75960 }, { "epoch": 0.95, "learning_rate": 2.1144004601995186e-05, "loss": 2.243, "step": 75968 }, { "epoch": 0.95, "learning_rate": 2.1139478999163723e-05, "loss": 2.2268, "step": 75976 }, { "epoch": 0.95, "learning_rate": 2.113496230853899e-05, "loss": 2.2519, "step": 75984 }, { "epoch": 0.95, "learning_rate": 2.113045453057401e-05, "loss": 2.234, "step": 75992 }, { "epoch": 0.95, "learning_rate": 2.1125955665720877e-05, "loss": 2.2305, "step": 76000 }, { "epoch": 0.95, "learning_rate": 2.1121465714430792e-05, "loss": 2.2575, "step": 76008 }, { "epoch": 0.95, "learning_rate": 2.1116984677154094e-05, "loss": 2.2239, "step": 76016 }, { "epoch": 0.95, "learning_rate": 2.111251255434018e-05, "loss": 2.2308, "step": 76024 }, { "epoch": 0.95, "learning_rate": 2.1108049346437613e-05, "loss": 2.269, "step": 76032 }, { "epoch": 0.95, "learning_rate": 2.1103595053893995e-05, "loss": 2.2363, "step": 76040 }, { "epoch": 0.95, "learning_rate": 2.109914967715608e-05, "loss": 2.232, "step": 76048 }, { "epoch": 0.95, "learning_rate": 2.109471321666971e-05, "loss": 2.2469, "step": 76056 }, { "epoch": 0.95, "learning_rate": 2.109028567287984e-05, "loss": 2.2459, "step": 76064 }, { "epoch": 0.95, "learning_rate": 2.1085867046230527e-05, "loss": 2.2436, "step": 76072 }, { "epoch": 0.95, "learning_rate": 2.1081457337164928e-05, "loss": 2.2493, "step": 76080 }, { "epoch": 0.95, "learning_rate": 2.1077056546125335e-05, "loss": 2.2415, "step": 76088 }, { "epoch": 0.95, "learning_rate": 2.107266467355309e-05, "loss": 2.2267, "step": 76096 }, { "epoch": 0.95, "learning_rate": 2.106828171988869e-05, "loss": 2.2126, "step": 76104 }, { "epoch": 0.95, "learning_rate": 2.1063907685571726e-05, "loss": 2.2479, "step": 76112 }, { "epoch": 0.95, "learning_rate": 2.105954257104087e-05, "loss": 2.2442, "step": 76120 }, { "epoch": 0.95, "learning_rate": 2.1055186376733946e-05, "loss": 2.2278, "step": 76128 }, { "epoch": 0.95, "learning_rate": 2.105083910308783e-05, "loss": 2.254, "step": 76136 }, { "epoch": 0.95, "learning_rate": 2.1046500750538533e-05, "loss": 2.2425, "step": 76144 }, { "epoch": 0.95, "learning_rate": 2.1042171319521184e-05, "loss": 2.2385, "step": 76152 }, { "epoch": 0.95, "learning_rate": 2.1037850810469978e-05, "loss": 2.258, "step": 76160 }, { "epoch": 0.95, "learning_rate": 2.1033539223818252e-05, "loss": 2.2431, "step": 76168 }, { "epoch": 0.95, "learning_rate": 2.102923655999844e-05, "loss": 2.2272, "step": 76176 }, { "epoch": 0.95, "learning_rate": 2.1024942819442046e-05, "loss": 2.2313, "step": 76184 }, { "epoch": 0.95, "learning_rate": 2.1020658002579742e-05, "loss": 2.2429, "step": 76192 }, { "epoch": 0.95, "learning_rate": 2.1016382109841242e-05, "loss": 2.229, "step": 76200 }, { "epoch": 0.95, "learning_rate": 2.1012115141655418e-05, "loss": 2.2388, "step": 76208 }, { "epoch": 0.95, "learning_rate": 2.1007857098450207e-05, "loss": 2.2401, "step": 76216 }, { "epoch": 0.95, "learning_rate": 2.1003607980652682e-05, "loss": 2.2248, "step": 76224 }, { "epoch": 0.95, "learning_rate": 2.0999367788688986e-05, "loss": 2.2369, "step": 76232 }, { "epoch": 0.95, "learning_rate": 2.0995136522984393e-05, "loss": 2.2496, "step": 76240 }, { "epoch": 0.95, "learning_rate": 2.0990914183963285e-05, "loss": 2.2263, "step": 76248 }, { "epoch": 0.95, "learning_rate": 2.0986700772049125e-05, "loss": 2.2265, "step": 76256 }, { "epoch": 0.95, "learning_rate": 2.0982496287664505e-05, "loss": 2.2445, "step": 76264 }, { "epoch": 0.95, "learning_rate": 2.09783007312311e-05, "loss": 2.2595, "step": 76272 }, { "epoch": 0.95, "learning_rate": 2.0974114103169712e-05, "loss": 2.2307, "step": 76280 }, { "epoch": 0.95, "learning_rate": 2.0969936403900237e-05, "loss": 2.2428, "step": 76288 }, { "epoch": 0.95, "learning_rate": 2.096576763384166e-05, "loss": 2.2354, "step": 76296 }, { "epoch": 0.95, "learning_rate": 2.096160779341209e-05, "loss": 2.2173, "step": 76304 }, { "epoch": 0.95, "learning_rate": 2.0957456883028748e-05, "loss": 2.2393, "step": 76312 }, { "epoch": 0.95, "learning_rate": 2.0953314903107927e-05, "loss": 2.2408, "step": 76320 }, { "epoch": 0.95, "learning_rate": 2.094918185406507e-05, "loss": 2.2343, "step": 76328 }, { "epoch": 0.95, "learning_rate": 2.0945057736314678e-05, "loss": 2.2339, "step": 76336 }, { "epoch": 0.95, "learning_rate": 2.094094255027038e-05, "loss": 2.2546, "step": 76344 }, { "epoch": 0.95, "learning_rate": 2.0936836296344903e-05, "loss": 2.2234, "step": 76352 }, { "epoch": 0.95, "learning_rate": 2.0932738974950095e-05, "loss": 2.228, "step": 76360 }, { "epoch": 0.95, "learning_rate": 2.0928650586496873e-05, "loss": 2.2398, "step": 76368 }, { "epoch": 0.95, "learning_rate": 2.09245711313953e-05, "loss": 2.2478, "step": 76376 }, { "epoch": 0.95, "learning_rate": 2.0920500610054515e-05, "loss": 2.2262, "step": 76384 }, { "epoch": 0.95, "learning_rate": 2.0916439022882756e-05, "loss": 2.2402, "step": 76392 }, { "epoch": 0.95, "learning_rate": 2.0912386370287397e-05, "loss": 2.215, "step": 76400 }, { "epoch": 0.96, "learning_rate": 2.090834265267489e-05, "loss": 2.244, "step": 76408 }, { "epoch": 0.96, "learning_rate": 2.090430787045078e-05, "loss": 2.2251, "step": 76416 }, { "epoch": 0.96, "learning_rate": 2.090028202401976e-05, "loss": 2.2402, "step": 76424 }, { "epoch": 0.96, "learning_rate": 2.089626511378557e-05, "loss": 2.25, "step": 76432 }, { "epoch": 0.96, "learning_rate": 2.0892257140151124e-05, "loss": 2.2311, "step": 76440 }, { "epoch": 0.96, "learning_rate": 2.0888258103518353e-05, "loss": 2.22, "step": 76448 }, { "epoch": 0.96, "learning_rate": 2.088426800428836e-05, "loss": 2.2566, "step": 76456 }, { "epoch": 0.96, "learning_rate": 2.0880286842861346e-05, "loss": 2.229, "step": 76464 }, { "epoch": 0.96, "learning_rate": 2.0876314619636568e-05, "loss": 2.2548, "step": 76472 }, { "epoch": 0.96, "learning_rate": 2.0872351335012433e-05, "loss": 2.2492, "step": 76480 }, { "epoch": 0.96, "learning_rate": 2.0868396989386437e-05, "loss": 2.2348, "step": 76488 }, { "epoch": 0.96, "learning_rate": 2.0864451583155166e-05, "loss": 2.2561, "step": 76496 }, { "epoch": 0.96, "learning_rate": 2.0860515116714342e-05, "loss": 2.2596, "step": 76504 }, { "epoch": 0.96, "learning_rate": 2.0856587590458753e-05, "loss": 2.2306, "step": 76512 }, { "epoch": 0.96, "learning_rate": 2.085266900478232e-05, "loss": 2.238, "step": 76520 }, { "epoch": 0.96, "learning_rate": 2.084875936007806e-05, "loss": 2.2385, "step": 76528 }, { "epoch": 0.96, "learning_rate": 2.0844858656738057e-05, "loss": 2.2453, "step": 76536 }, { "epoch": 0.96, "learning_rate": 2.0840966895153553e-05, "loss": 2.2062, "step": 76544 }, { "epoch": 0.96, "learning_rate": 2.083708407571487e-05, "loss": 2.2469, "step": 76552 }, { "epoch": 0.96, "learning_rate": 2.0833210198811433e-05, "loss": 2.2279, "step": 76560 }, { "epoch": 0.96, "learning_rate": 2.0829345264831763e-05, "loss": 2.2523, "step": 76568 }, { "epoch": 0.96, "learning_rate": 2.0825489274163497e-05, "loss": 2.2186, "step": 76576 }, { "epoch": 0.96, "learning_rate": 2.082164222719336e-05, "loss": 2.2257, "step": 76584 }, { "epoch": 0.96, "learning_rate": 2.08178041243072e-05, "loss": 2.2485, "step": 76592 }, { "epoch": 0.96, "learning_rate": 2.0813974965889955e-05, "loss": 2.2378, "step": 76600 }, { "epoch": 0.96, "learning_rate": 2.0810154752325655e-05, "loss": 2.2468, "step": 76608 }, { "epoch": 0.96, "learning_rate": 2.080634348399746e-05, "loss": 2.2371, "step": 76616 }, { "epoch": 0.96, "learning_rate": 2.080254116128762e-05, "loss": 2.2318, "step": 76624 }, { "epoch": 0.96, "learning_rate": 2.0798747784577474e-05, "loss": 2.2211, "step": 76632 }, { "epoch": 0.96, "learning_rate": 2.0794963354247494e-05, "loss": 2.2234, "step": 76640 }, { "epoch": 0.96, "learning_rate": 2.0791187870677214e-05, "loss": 2.2508, "step": 76648 }, { "epoch": 0.96, "learning_rate": 2.0787421334245304e-05, "loss": 2.2229, "step": 76656 }, { "epoch": 0.96, "learning_rate": 2.0783663745329536e-05, "loss": 2.2505, "step": 76664 }, { "epoch": 0.96, "learning_rate": 2.0779915104306773e-05, "loss": 2.2243, "step": 76672 }, { "epoch": 0.96, "learning_rate": 2.077617541155296e-05, "loss": 2.2237, "step": 76680 }, { "epoch": 0.96, "learning_rate": 2.077244466744319e-05, "loss": 2.2423, "step": 76688 }, { "epoch": 0.96, "learning_rate": 2.0768722872351633e-05, "loss": 2.2419, "step": 76696 }, { "epoch": 0.96, "learning_rate": 2.076501002665156e-05, "loss": 2.2397, "step": 76704 }, { "epoch": 0.96, "learning_rate": 2.0761306130715338e-05, "loss": 2.2437, "step": 76712 }, { "epoch": 0.96, "learning_rate": 2.0757611184914464e-05, "loss": 2.2341, "step": 76720 }, { "epoch": 0.96, "learning_rate": 2.0753925189619506e-05, "loss": 2.216, "step": 76728 }, { "epoch": 0.96, "learning_rate": 2.0750248145200168e-05, "loss": 2.2277, "step": 76736 }, { "epoch": 0.96, "learning_rate": 2.0746580052025205e-05, "loss": 2.2487, "step": 76744 }, { "epoch": 0.96, "learning_rate": 2.0742920910462544e-05, "loss": 2.2416, "step": 76752 }, { "epoch": 0.96, "learning_rate": 2.073927072087915e-05, "loss": 2.2349, "step": 76760 }, { "epoch": 0.96, "learning_rate": 2.0735629483641123e-05, "loss": 2.2419, "step": 76768 }, { "epoch": 0.96, "learning_rate": 2.073199719911366e-05, "loss": 2.2411, "step": 76776 }, { "epoch": 0.96, "learning_rate": 2.0728373867661055e-05, "loss": 2.2221, "step": 76784 }, { "epoch": 0.96, "learning_rate": 2.072475948964671e-05, "loss": 2.2256, "step": 76792 }, { "epoch": 0.96, "learning_rate": 2.072115406543314e-05, "loss": 2.2426, "step": 76800 }, { "epoch": 0.96, "learning_rate": 2.071755759538192e-05, "loss": 2.2584, "step": 76808 }, { "epoch": 0.96, "learning_rate": 2.0713970079853773e-05, "loss": 2.225, "step": 76816 }, { "epoch": 0.96, "learning_rate": 2.07103915192085e-05, "loss": 2.2333, "step": 76824 }, { "epoch": 0.96, "learning_rate": 2.0706821913805026e-05, "loss": 2.2245, "step": 76832 }, { "epoch": 0.96, "learning_rate": 2.0703261264001354e-05, "loss": 2.2356, "step": 76840 }, { "epoch": 0.96, "learning_rate": 2.069970957015458e-05, "loss": 2.2199, "step": 76848 }, { "epoch": 0.96, "learning_rate": 2.0696166832620943e-05, "loss": 2.2511, "step": 76856 }, { "epoch": 0.96, "learning_rate": 2.0692633051755745e-05, "loss": 2.2168, "step": 76864 }, { "epoch": 0.96, "learning_rate": 2.068910822791341e-05, "loss": 2.2543, "step": 76872 }, { "epoch": 0.96, "learning_rate": 2.0685592361447457e-05, "loss": 2.2399, "step": 76880 }, { "epoch": 0.96, "learning_rate": 2.06820854527105e-05, "loss": 2.2422, "step": 76888 }, { "epoch": 0.96, "learning_rate": 2.0678587502054273e-05, "loss": 2.2219, "step": 76896 }, { "epoch": 0.96, "learning_rate": 2.06750985098296e-05, "loss": 2.2463, "step": 76904 }, { "epoch": 0.96, "learning_rate": 2.0671618476386406e-05, "loss": 2.2289, "step": 76912 }, { "epoch": 0.96, "learning_rate": 2.066814740207371e-05, "loss": 2.227, "step": 76920 }, { "epoch": 0.96, "learning_rate": 2.0664685287239648e-05, "loss": 2.2387, "step": 76928 }, { "epoch": 0.96, "learning_rate": 2.0661232132231454e-05, "loss": 2.226, "step": 76936 }, { "epoch": 0.96, "learning_rate": 2.065778793739545e-05, "loss": 2.229, "step": 76944 }, { "epoch": 0.96, "learning_rate": 2.0654352703077074e-05, "loss": 2.2434, "step": 76952 }, { "epoch": 0.96, "learning_rate": 2.065092642962086e-05, "loss": 2.2277, "step": 76960 }, { "epoch": 0.96, "learning_rate": 2.0647509117370455e-05, "loss": 2.2219, "step": 76968 }, { "epoch": 0.96, "learning_rate": 2.0644100766668583e-05, "loss": 2.2315, "step": 76976 }, { "epoch": 0.96, "learning_rate": 2.064070137785708e-05, "loss": 2.2423, "step": 76984 }, { "epoch": 0.96, "learning_rate": 2.0637310951276906e-05, "loss": 2.2514, "step": 76992 }, { "epoch": 0.96, "learning_rate": 2.0633929487268075e-05, "loss": 2.2376, "step": 77000 }, { "epoch": 0.96, "learning_rate": 2.063055698616974e-05, "loss": 2.2254, "step": 77008 }, { "epoch": 0.96, "learning_rate": 2.0627193448320145e-05, "loss": 2.2406, "step": 77016 }, { "epoch": 0.96, "learning_rate": 2.0623838874056637e-05, "loss": 2.24, "step": 77024 }, { "epoch": 0.96, "learning_rate": 2.062049326371566e-05, "loss": 2.2303, "step": 77032 }, { "epoch": 0.96, "learning_rate": 2.061715661763274e-05, "loss": 2.2417, "step": 77040 }, { "epoch": 0.96, "learning_rate": 2.0613828936142547e-05, "loss": 2.2405, "step": 77048 }, { "epoch": 0.96, "learning_rate": 2.0610510219578837e-05, "loss": 2.229, "step": 77056 }, { "epoch": 0.96, "learning_rate": 2.0607200468274425e-05, "loss": 2.2318, "step": 77064 }, { "epoch": 0.96, "learning_rate": 2.0603899682561285e-05, "loss": 2.2188, "step": 77072 }, { "epoch": 0.96, "learning_rate": 2.0600607862770453e-05, "loss": 2.2497, "step": 77080 }, { "epoch": 0.96, "learning_rate": 2.0597325009232105e-05, "loss": 2.2568, "step": 77088 }, { "epoch": 0.96, "learning_rate": 2.059405112227546e-05, "loss": 2.2505, "step": 77096 }, { "epoch": 0.96, "learning_rate": 2.059078620222889e-05, "loss": 2.235, "step": 77104 }, { "epoch": 0.96, "learning_rate": 2.0587530249419843e-05, "loss": 2.2255, "step": 77112 }, { "epoch": 0.96, "learning_rate": 2.0584283264174877e-05, "loss": 2.2332, "step": 77120 }, { "epoch": 0.96, "learning_rate": 2.0581045246819642e-05, "loss": 2.216, "step": 77128 }, { "epoch": 0.96, "learning_rate": 2.057781619767889e-05, "loss": 2.2365, "step": 77136 }, { "epoch": 0.96, "learning_rate": 2.0574596117076477e-05, "loss": 2.2283, "step": 77144 }, { "epoch": 0.96, "learning_rate": 2.057138500533536e-05, "loss": 2.236, "step": 77152 }, { "epoch": 0.96, "learning_rate": 2.0568182862777607e-05, "loss": 2.2369, "step": 77160 }, { "epoch": 0.96, "learning_rate": 2.0564989689724354e-05, "loss": 2.2327, "step": 77168 }, { "epoch": 0.96, "learning_rate": 2.056180548649587e-05, "loss": 2.2527, "step": 77176 }, { "epoch": 0.96, "learning_rate": 2.055863025341151e-05, "loss": 2.2318, "step": 77184 }, { "epoch": 0.96, "learning_rate": 2.055546399078974e-05, "loss": 2.2305, "step": 77192 }, { "epoch": 0.96, "learning_rate": 2.0552306698948108e-05, "loss": 2.2203, "step": 77200 }, { "epoch": 0.97, "learning_rate": 2.0549158378203272e-05, "loss": 2.2119, "step": 77208 }, { "epoch": 0.97, "learning_rate": 2.054601902887099e-05, "loss": 2.2455, "step": 77216 }, { "epoch": 0.97, "learning_rate": 2.054288865126614e-05, "loss": 2.2329, "step": 77224 }, { "epoch": 0.97, "learning_rate": 2.0539767245702658e-05, "loss": 2.2334, "step": 77232 }, { "epoch": 0.97, "learning_rate": 2.0536654812493607e-05, "loss": 2.2265, "step": 77240 }, { "epoch": 0.97, "learning_rate": 2.053355135195116e-05, "loss": 2.2399, "step": 77248 }, { "epoch": 0.97, "learning_rate": 2.053045686438656e-05, "loss": 2.2381, "step": 77256 }, { "epoch": 0.97, "learning_rate": 2.052737135011018e-05, "loss": 2.2565, "step": 77264 }, { "epoch": 0.97, "learning_rate": 2.0524294809431467e-05, "loss": 2.219, "step": 77272 }, { "epoch": 0.97, "learning_rate": 2.0521227242658988e-05, "loss": 2.2331, "step": 77280 }, { "epoch": 0.97, "learning_rate": 2.0518168650100415e-05, "loss": 2.237, "step": 77288 }, { "epoch": 0.97, "learning_rate": 2.0515119032062475e-05, "loss": 2.2303, "step": 77296 }, { "epoch": 0.97, "learning_rate": 2.0512078388851057e-05, "loss": 2.2413, "step": 77304 }, { "epoch": 0.97, "learning_rate": 2.050904672077111e-05, "loss": 2.2469, "step": 77312 }, { "epoch": 0.97, "learning_rate": 2.050602402812669e-05, "loss": 2.2276, "step": 77320 }, { "epoch": 0.97, "learning_rate": 2.0503010311220966e-05, "loss": 2.2487, "step": 77328 }, { "epoch": 0.97, "learning_rate": 2.0500005570356188e-05, "loss": 2.2489, "step": 77336 }, { "epoch": 0.97, "learning_rate": 2.0497009805833717e-05, "loss": 2.2434, "step": 77344 }, { "epoch": 0.97, "learning_rate": 2.0494023017954002e-05, "loss": 2.2272, "step": 77352 }, { "epoch": 0.97, "learning_rate": 2.049104520701661e-05, "loss": 2.227, "step": 77360 }, { "epoch": 0.97, "learning_rate": 2.048807637332021e-05, "loss": 2.2296, "step": 77368 }, { "epoch": 0.97, "learning_rate": 2.048511651716254e-05, "loss": 2.2368, "step": 77376 }, { "epoch": 0.97, "learning_rate": 2.0482165638840468e-05, "loss": 2.2245, "step": 77384 }, { "epoch": 0.97, "learning_rate": 2.047922373864994e-05, "loss": 2.2451, "step": 77392 }, { "epoch": 0.97, "learning_rate": 2.0476290816886016e-05, "loss": 2.2392, "step": 77400 }, { "epoch": 0.97, "learning_rate": 2.0473366873842868e-05, "loss": 2.24, "step": 77408 }, { "epoch": 0.97, "learning_rate": 2.0470451909813724e-05, "loss": 2.2324, "step": 77416 }, { "epoch": 0.97, "learning_rate": 2.0467545925090947e-05, "loss": 2.2356, "step": 77424 }, { "epoch": 0.97, "learning_rate": 2.0464648919966006e-05, "loss": 2.2299, "step": 77432 }, { "epoch": 0.97, "learning_rate": 2.046176089472944e-05, "loss": 2.2367, "step": 77440 }, { "epoch": 0.97, "learning_rate": 2.0458881849670902e-05, "loss": 2.2399, "step": 77448 }, { "epoch": 0.97, "learning_rate": 2.0456011785079154e-05, "loss": 2.2354, "step": 77456 }, { "epoch": 0.97, "learning_rate": 2.045315070124203e-05, "loss": 2.2395, "step": 77464 }, { "epoch": 0.97, "learning_rate": 2.04502985984465e-05, "loss": 2.2284, "step": 77472 }, { "epoch": 0.97, "learning_rate": 2.04474554769786e-05, "loss": 2.2539, "step": 77480 }, { "epoch": 0.97, "learning_rate": 2.0444621337123475e-05, "loss": 2.27, "step": 77488 }, { "epoch": 0.97, "learning_rate": 2.044179617916539e-05, "loss": 2.2458, "step": 77496 }, { "epoch": 0.97, "learning_rate": 2.0438980003387685e-05, "loss": 2.2241, "step": 77504 }, { "epoch": 0.97, "learning_rate": 2.0436172810072803e-05, "loss": 2.2251, "step": 77512 }, { "epoch": 0.97, "learning_rate": 2.043337459950229e-05, "loss": 2.2332, "step": 77520 }, { "epoch": 0.97, "learning_rate": 2.0430585371956778e-05, "loss": 2.247, "step": 77528 }, { "epoch": 0.97, "learning_rate": 2.042780512771605e-05, "loss": 2.2257, "step": 77536 }, { "epoch": 0.97, "learning_rate": 2.0425033867058905e-05, "loss": 2.2296, "step": 77544 }, { "epoch": 0.97, "learning_rate": 2.042227159026332e-05, "loss": 2.2403, "step": 77552 }, { "epoch": 0.97, "learning_rate": 2.0419518297606302e-05, "loss": 2.2169, "step": 77560 }, { "epoch": 0.97, "learning_rate": 2.0416773989364017e-05, "loss": 2.2491, "step": 77568 }, { "epoch": 0.97, "learning_rate": 2.04140386658117e-05, "loss": 2.2308, "step": 77576 }, { "epoch": 0.97, "learning_rate": 2.041131232722367e-05, "loss": 2.2296, "step": 77584 }, { "epoch": 0.97, "learning_rate": 2.0408594973873377e-05, "loss": 2.2345, "step": 77592 }, { "epoch": 0.97, "learning_rate": 2.0405886606033367e-05, "loss": 2.2345, "step": 77600 }, { "epoch": 0.97, "learning_rate": 2.040318722397525e-05, "loss": 2.2302, "step": 77608 }, { "epoch": 0.97, "learning_rate": 2.0400496827969778e-05, "loss": 2.2143, "step": 77616 }, { "epoch": 0.97, "learning_rate": 2.0397815418286778e-05, "loss": 2.2484, "step": 77624 }, { "epoch": 0.97, "learning_rate": 2.0395142995195167e-05, "loss": 2.2574, "step": 77632 }, { "epoch": 0.97, "learning_rate": 2.0392479558963003e-05, "loss": 2.2431, "step": 77640 }, { "epoch": 0.97, "learning_rate": 2.0389825109857372e-05, "loss": 2.2536, "step": 77648 }, { "epoch": 0.97, "learning_rate": 2.038717964814454e-05, "loss": 2.2308, "step": 77656 }, { "epoch": 0.97, "learning_rate": 2.0384543174089806e-05, "loss": 2.2174, "step": 77664 }, { "epoch": 0.97, "learning_rate": 2.038191568795761e-05, "loss": 2.2079, "step": 77672 }, { "epoch": 0.97, "learning_rate": 2.0379297190011457e-05, "loss": 2.2404, "step": 77680 }, { "epoch": 0.97, "learning_rate": 2.037668768051398e-05, "loss": 2.233, "step": 77688 }, { "epoch": 0.97, "learning_rate": 2.03740871597269e-05, "loss": 2.2352, "step": 77696 }, { "epoch": 0.97, "learning_rate": 2.037149562791103e-05, "loss": 2.2245, "step": 77704 }, { "epoch": 0.97, "learning_rate": 2.0368913085326274e-05, "loss": 2.2479, "step": 77712 }, { "epoch": 0.97, "learning_rate": 2.036633953223167e-05, "loss": 2.2419, "step": 77720 }, { "epoch": 0.97, "learning_rate": 2.0363774968885317e-05, "loss": 2.2211, "step": 77728 }, { "epoch": 0.97, "learning_rate": 2.036121939554442e-05, "loss": 2.2511, "step": 77736 }, { "epoch": 0.97, "learning_rate": 2.03586728124653e-05, "loss": 2.2308, "step": 77744 }, { "epoch": 0.97, "learning_rate": 2.0356135219903362e-05, "loss": 2.2328, "step": 77752 }, { "epoch": 0.97, "learning_rate": 2.035360661811312e-05, "loss": 2.2325, "step": 77760 }, { "epoch": 0.97, "learning_rate": 2.035108700734816e-05, "loss": 2.2477, "step": 77768 }, { "epoch": 0.97, "learning_rate": 2.0348576387861192e-05, "loss": 2.2618, "step": 77776 }, { "epoch": 0.97, "learning_rate": 2.034607475990403e-05, "loss": 2.2364, "step": 77784 }, { "epoch": 0.97, "learning_rate": 2.0343582123727553e-05, "loss": 2.2406, "step": 77792 }, { "epoch": 0.97, "learning_rate": 2.0341098479581766e-05, "loss": 2.23, "step": 77800 }, { "epoch": 0.97, "learning_rate": 2.0338623827715773e-05, "loss": 2.2564, "step": 77808 }, { "epoch": 0.97, "learning_rate": 2.033615816837776e-05, "loss": 2.2391, "step": 77816 }, { "epoch": 0.97, "learning_rate": 2.033370150181501e-05, "loss": 2.2595, "step": 77824 }, { "epoch": 0.97, "learning_rate": 2.0331253828273933e-05, "loss": 2.2398, "step": 77832 }, { "epoch": 0.97, "learning_rate": 2.0328815148000002e-05, "loss": 2.2326, "step": 77840 }, { "epoch": 0.97, "learning_rate": 2.0326385461237807e-05, "loss": 2.2433, "step": 77848 }, { "epoch": 0.97, "learning_rate": 2.0323964768231035e-05, "loss": 2.2549, "step": 77856 }, { "epoch": 0.97, "learning_rate": 2.0321553069222457e-05, "loss": 2.2342, "step": 77864 }, { "epoch": 0.97, "learning_rate": 2.031915036445397e-05, "loss": 2.2278, "step": 77872 }, { "epoch": 0.97, "learning_rate": 2.0316756654166528e-05, "loss": 2.2382, "step": 77880 }, { "epoch": 0.97, "learning_rate": 2.0314371938600228e-05, "loss": 2.2377, "step": 77888 }, { "epoch": 0.97, "learning_rate": 2.031199621799424e-05, "loss": 2.2243, "step": 77896 }, { "epoch": 0.97, "learning_rate": 2.0309629492586822e-05, "loss": 2.235, "step": 77904 }, { "epoch": 0.97, "learning_rate": 2.0307271762615365e-05, "loss": 2.2197, "step": 77912 }, { "epoch": 0.97, "learning_rate": 2.0304923028316314e-05, "loss": 2.2204, "step": 77920 }, { "epoch": 0.97, "learning_rate": 2.0302583289925244e-05, "loss": 2.2251, "step": 77928 }, { "epoch": 0.97, "learning_rate": 2.030025254767682e-05, "loss": 2.2559, "step": 77936 }, { "epoch": 0.97, "learning_rate": 2.0297930801804793e-05, "loss": 2.2527, "step": 77944 }, { "epoch": 0.97, "learning_rate": 2.029561805254203e-05, "loss": 2.2118, "step": 77952 }, { "epoch": 0.97, "learning_rate": 2.0293314300120483e-05, "loss": 2.2519, "step": 77960 }, { "epoch": 0.97, "learning_rate": 2.02910195447712e-05, "loss": 2.2457, "step": 77968 }, { "epoch": 0.97, "learning_rate": 2.028873378672434e-05, "loss": 2.2243, "step": 77976 }, { "epoch": 0.97, "learning_rate": 2.0286457026209153e-05, "loss": 2.2467, "step": 77984 }, { "epoch": 0.97, "learning_rate": 2.0284189263453984e-05, "loss": 2.2174, "step": 77992 }, { "epoch": 0.97, "learning_rate": 2.028193049868628e-05, "loss": 2.2481, "step": 78000 }, { "epoch": 0.98, "learning_rate": 2.0279680732132556e-05, "loss": 2.251, "step": 78008 }, { "epoch": 0.98, "learning_rate": 2.0277439964018484e-05, "loss": 2.2378, "step": 78016 }, { "epoch": 0.98, "learning_rate": 2.027520819456879e-05, "loss": 2.2365, "step": 78024 }, { "epoch": 0.98, "learning_rate": 2.0272985424007298e-05, "loss": 2.2334, "step": 78032 }, { "epoch": 0.98, "learning_rate": 2.0270771652556944e-05, "loss": 2.221, "step": 78040 }, { "epoch": 0.98, "learning_rate": 2.026856688043977e-05, "loss": 2.2326, "step": 78048 }, { "epoch": 0.98, "learning_rate": 2.0266371107876887e-05, "loss": 2.2215, "step": 78056 }, { "epoch": 0.98, "learning_rate": 2.0264184335088525e-05, "loss": 2.2252, "step": 78064 }, { "epoch": 0.98, "learning_rate": 2.0262006562293996e-05, "loss": 2.2394, "step": 78072 }, { "epoch": 0.98, "learning_rate": 2.0259837789711737e-05, "loss": 2.2565, "step": 78080 }, { "epoch": 0.98, "learning_rate": 2.0257678017559244e-05, "loss": 2.239, "step": 78088 }, { "epoch": 0.98, "learning_rate": 2.025552724605313e-05, "loss": 2.2255, "step": 78096 }, { "epoch": 0.98, "learning_rate": 2.0253385475409124e-05, "loss": 2.237, "step": 78104 }, { "epoch": 0.98, "learning_rate": 2.025125270584202e-05, "loss": 2.2484, "step": 78112 }, { "epoch": 0.98, "learning_rate": 2.0249128937565728e-05, "loss": 2.2143, "step": 78120 }, { "epoch": 0.98, "learning_rate": 2.024701417079324e-05, "loss": 2.2338, "step": 78128 }, { "epoch": 0.98, "learning_rate": 2.0244908405736664e-05, "loss": 2.2482, "step": 78136 }, { "epoch": 0.98, "learning_rate": 2.0242811642607202e-05, "loss": 2.2371, "step": 78144 }, { "epoch": 0.98, "learning_rate": 2.0240723881615138e-05, "loss": 2.2308, "step": 78152 }, { "epoch": 0.98, "learning_rate": 2.0238645122969857e-05, "loss": 2.2317, "step": 78160 }, { "epoch": 0.98, "learning_rate": 2.023657536687986e-05, "loss": 2.235, "step": 78168 }, { "epoch": 0.98, "learning_rate": 2.0234514613552726e-05, "loss": 2.2461, "step": 78176 }, { "epoch": 0.98, "learning_rate": 2.0232462863195135e-05, "loss": 2.2293, "step": 78184 }, { "epoch": 0.98, "learning_rate": 2.0230420116012868e-05, "loss": 2.2316, "step": 78192 }, { "epoch": 0.98, "learning_rate": 2.0228386372210803e-05, "loss": 2.2238, "step": 78200 }, { "epoch": 0.98, "learning_rate": 2.0226361631992915e-05, "loss": 2.2248, "step": 78208 }, { "epoch": 0.98, "learning_rate": 2.0224345895562262e-05, "loss": 2.238, "step": 78216 }, { "epoch": 0.98, "learning_rate": 2.0222339163121017e-05, "loss": 2.2434, "step": 78224 }, { "epoch": 0.98, "learning_rate": 2.022034143487045e-05, "loss": 2.2432, "step": 78232 }, { "epoch": 0.98, "learning_rate": 2.021835271101092e-05, "loss": 2.2306, "step": 78240 }, { "epoch": 0.98, "learning_rate": 2.021637299174188e-05, "loss": 2.2382, "step": 78248 }, { "epoch": 0.98, "learning_rate": 2.0214402277261886e-05, "loss": 2.2451, "step": 78256 }, { "epoch": 0.98, "learning_rate": 2.021244056776859e-05, "loss": 2.2471, "step": 78264 }, { "epoch": 0.98, "learning_rate": 2.0210487863458742e-05, "loss": 2.223, "step": 78272 }, { "epoch": 0.98, "learning_rate": 2.0208544164528183e-05, "loss": 2.2515, "step": 78280 }, { "epoch": 0.98, "learning_rate": 2.0206609471171864e-05, "loss": 2.2605, "step": 78288 }, { "epoch": 0.98, "learning_rate": 2.0204683783583813e-05, "loss": 2.2305, "step": 78296 }, { "epoch": 0.98, "learning_rate": 2.0202767101957172e-05, "loss": 2.2419, "step": 78304 }, { "epoch": 0.98, "learning_rate": 2.020085942648417e-05, "loss": 2.2399, "step": 78312 }, { "epoch": 0.98, "learning_rate": 2.019896075735614e-05, "loss": 2.2321, "step": 78320 }, { "epoch": 0.98, "learning_rate": 2.01970710947635e-05, "loss": 2.2241, "step": 78328 }, { "epoch": 0.98, "learning_rate": 2.0195190438895785e-05, "loss": 2.2436, "step": 78336 }, { "epoch": 0.98, "learning_rate": 2.01933187899416e-05, "loss": 2.27, "step": 78344 }, { "epoch": 0.98, "learning_rate": 2.0191456148088675e-05, "loss": 2.2251, "step": 78352 }, { "epoch": 0.98, "learning_rate": 2.0189602513523814e-05, "loss": 2.2259, "step": 78360 }, { "epoch": 0.98, "learning_rate": 2.018775788643292e-05, "loss": 2.2393, "step": 78368 }, { "epoch": 0.98, "learning_rate": 2.0185922267001014e-05, "loss": 2.2333, "step": 78376 }, { "epoch": 0.98, "learning_rate": 2.018409565541218e-05, "loss": 2.2339, "step": 78384 }, { "epoch": 0.98, "learning_rate": 2.018227805184963e-05, "loss": 2.2417, "step": 78392 }, { "epoch": 0.98, "learning_rate": 2.018046945649566e-05, "loss": 2.224, "step": 78400 }, { "epoch": 0.98, "learning_rate": 2.0178669869531652e-05, "loss": 2.2355, "step": 78408 }, { "epoch": 0.98, "learning_rate": 2.0176879291138118e-05, "loss": 2.2329, "step": 78416 }, { "epoch": 0.98, "learning_rate": 2.0175097721494605e-05, "loss": 2.2112, "step": 78424 }, { "epoch": 0.98, "learning_rate": 2.0173325160779817e-05, "loss": 2.2422, "step": 78432 }, { "epoch": 0.98, "learning_rate": 2.0171561609171542e-05, "loss": 2.2275, "step": 78440 }, { "epoch": 0.98, "learning_rate": 2.016980706684663e-05, "loss": 2.2327, "step": 78448 }, { "epoch": 0.98, "learning_rate": 2.0168061533981074e-05, "loss": 2.2377, "step": 78456 }, { "epoch": 0.98, "learning_rate": 2.0166325010749924e-05, "loss": 2.2249, "step": 78464 }, { "epoch": 0.98, "learning_rate": 2.0164597497327343e-05, "loss": 2.2303, "step": 78472 }, { "epoch": 0.98, "learning_rate": 2.016287899388661e-05, "loss": 2.2343, "step": 78480 }, { "epoch": 0.98, "learning_rate": 2.016116950060005e-05, "loss": 2.2415, "step": 78488 }, { "epoch": 0.98, "learning_rate": 2.015946901763915e-05, "loss": 2.2523, "step": 78496 }, { "epoch": 0.98, "learning_rate": 2.0157777545174446e-05, "loss": 2.2186, "step": 78504 }, { "epoch": 0.98, "learning_rate": 2.015609508337557e-05, "loss": 2.2368, "step": 78512 }, { "epoch": 0.98, "learning_rate": 2.0154421632411277e-05, "loss": 2.2377, "step": 78520 }, { "epoch": 0.98, "learning_rate": 2.01527571924494e-05, "loss": 2.2248, "step": 78528 }, { "epoch": 0.98, "learning_rate": 2.0151101763656882e-05, "loss": 2.2348, "step": 78536 }, { "epoch": 0.98, "learning_rate": 2.0149455346199738e-05, "loss": 2.2116, "step": 78544 }, { "epoch": 0.98, "learning_rate": 2.0147817940243103e-05, "loss": 2.2268, "step": 78552 }, { "epoch": 0.98, "learning_rate": 2.0146189545951193e-05, "loss": 2.2386, "step": 78560 }, { "epoch": 0.98, "learning_rate": 2.014457016348734e-05, "loss": 2.2375, "step": 78568 }, { "epoch": 0.98, "learning_rate": 2.0142959793013947e-05, "loss": 2.2757, "step": 78576 }, { "epoch": 0.98, "learning_rate": 2.0141358434692523e-05, "loss": 2.2283, "step": 78584 }, { "epoch": 0.98, "learning_rate": 2.0139766088683692e-05, "loss": 2.2348, "step": 78592 }, { "epoch": 0.98, "learning_rate": 2.0138182755147142e-05, "loss": 2.2494, "step": 78600 }, { "epoch": 0.98, "learning_rate": 2.013660843424167e-05, "loss": 2.2272, "step": 78608 }, { "epoch": 0.98, "learning_rate": 2.013504312612519e-05, "loss": 2.2405, "step": 78616 }, { "epoch": 0.98, "learning_rate": 2.0133486830954674e-05, "loss": 2.2454, "step": 78624 }, { "epoch": 0.98, "learning_rate": 2.0131939548886213e-05, "loss": 2.2536, "step": 78632 }, { "epoch": 0.98, "learning_rate": 2.0130401280075004e-05, "loss": 2.2421, "step": 78640 }, { "epoch": 0.98, "learning_rate": 2.012887202467531e-05, "loss": 2.2443, "step": 78648 }, { "epoch": 0.98, "learning_rate": 2.012735178284051e-05, "loss": 2.2466, "step": 78656 }, { "epoch": 0.98, "learning_rate": 2.0125840554723096e-05, "loss": 2.237, "step": 78664 }, { "epoch": 0.98, "learning_rate": 2.0124338340474614e-05, "loss": 2.2343, "step": 78672 }, { "epoch": 0.98, "learning_rate": 2.0122845140245718e-05, "loss": 2.2003, "step": 78680 }, { "epoch": 0.98, "learning_rate": 2.0121360954186197e-05, "loss": 2.2468, "step": 78688 }, { "epoch": 0.98, "learning_rate": 2.0119885782444885e-05, "loss": 2.2313, "step": 78696 }, { "epoch": 0.98, "learning_rate": 2.011841962516975e-05, "loss": 2.2486, "step": 78704 }, { "epoch": 0.98, "learning_rate": 2.011696248250782e-05, "loss": 2.2223, "step": 78712 }, { "epoch": 0.98, "learning_rate": 2.0115514354605253e-05, "loss": 2.2464, "step": 78720 }, { "epoch": 0.98, "learning_rate": 2.0114075241607274e-05, "loss": 2.2285, "step": 78728 }, { "epoch": 0.98, "learning_rate": 2.0112645143658232e-05, "loss": 2.2374, "step": 78736 }, { "epoch": 0.98, "learning_rate": 2.011122406090155e-05, "loss": 2.2452, "step": 78744 }, { "epoch": 0.98, "learning_rate": 2.0109811993479772e-05, "loss": 2.233, "step": 78752 }, { "epoch": 0.98, "learning_rate": 2.0108408941534486e-05, "loss": 2.2334, "step": 78760 }, { "epoch": 0.98, "learning_rate": 2.0107014905206432e-05, "loss": 2.2396, "step": 78768 }, { "epoch": 0.98, "learning_rate": 2.010562988463543e-05, "loss": 2.2313, "step": 78776 }, { "epoch": 0.98, "learning_rate": 2.010425387996038e-05, "loss": 2.2481, "step": 78784 }, { "epoch": 0.98, "learning_rate": 2.0102886891319288e-05, "loss": 2.2329, "step": 78792 }, { "epoch": 0.98, "learning_rate": 2.0101528918849243e-05, "loss": 2.2414, "step": 78800 }, { "epoch": 0.99, "learning_rate": 2.010017996268647e-05, "loss": 2.2341, "step": 78808 }, { "epoch": 0.99, "learning_rate": 2.0098840022966242e-05, "loss": 2.2519, "step": 78816 }, { "epoch": 0.99, "learning_rate": 2.0097509099822948e-05, "loss": 2.2226, "step": 78824 }, { "epoch": 0.99, "learning_rate": 2.009618719339008e-05, "loss": 2.2493, "step": 78832 }, { "epoch": 0.99, "learning_rate": 2.0094874303800207e-05, "loss": 2.2458, "step": 78840 }, { "epoch": 0.99, "learning_rate": 2.009357043118502e-05, "loss": 2.2471, "step": 78848 }, { "epoch": 0.99, "learning_rate": 2.0092275575675272e-05, "loss": 2.2533, "step": 78856 }, { "epoch": 0.99, "learning_rate": 2.009098973740084e-05, "loss": 2.2366, "step": 78864 }, { "epoch": 0.99, "learning_rate": 2.0089712916490687e-05, "loss": 2.2184, "step": 78872 }, { "epoch": 0.99, "learning_rate": 2.0088445113072866e-05, "loss": 2.2289, "step": 78880 }, { "epoch": 0.99, "learning_rate": 2.0087186327274542e-05, "loss": 2.231, "step": 78888 }, { "epoch": 0.99, "learning_rate": 2.0085936559221945e-05, "loss": 2.239, "step": 78896 }, { "epoch": 0.99, "learning_rate": 2.0084695809040437e-05, "loss": 2.2492, "step": 78904 }, { "epoch": 0.99, "learning_rate": 2.0083464076854454e-05, "loss": 2.2466, "step": 78912 }, { "epoch": 0.99, "learning_rate": 2.0082241362787516e-05, "loss": 2.2354, "step": 78920 }, { "epoch": 0.99, "learning_rate": 2.0081027666962274e-05, "loss": 2.2462, "step": 78928 }, { "epoch": 0.99, "learning_rate": 2.007982298950045e-05, "loss": 2.2307, "step": 78936 }, { "epoch": 0.99, "learning_rate": 2.0078627330522863e-05, "loss": 2.2384, "step": 78944 }, { "epoch": 0.99, "learning_rate": 2.007744069014944e-05, "loss": 2.2423, "step": 78952 }, { "epoch": 0.99, "learning_rate": 2.0076263068499173e-05, "loss": 2.2155, "step": 78960 }, { "epoch": 0.99, "learning_rate": 2.0075094465690194e-05, "loss": 2.2197, "step": 78968 }, { "epoch": 0.99, "learning_rate": 2.0073934881839693e-05, "loss": 2.2277, "step": 78976 }, { "epoch": 0.99, "learning_rate": 2.007278431706397e-05, "loss": 2.2463, "step": 78984 }, { "epoch": 0.99, "learning_rate": 2.007164277147843e-05, "loss": 2.2526, "step": 78992 }, { "epoch": 0.99, "learning_rate": 2.0070510245197554e-05, "loss": 2.2248, "step": 79000 }, { "epoch": 0.99, "learning_rate": 2.006938673833494e-05, "loss": 2.229, "step": 79008 }, { "epoch": 0.99, "learning_rate": 2.006827225100325e-05, "loss": 2.2295, "step": 79016 }, { "epoch": 0.99, "learning_rate": 2.006716678331428e-05, "loss": 2.2329, "step": 79024 }, { "epoch": 0.99, "learning_rate": 2.0066070335378896e-05, "loss": 2.2316, "step": 79032 }, { "epoch": 0.99, "learning_rate": 2.0064982907307055e-05, "loss": 2.2535, "step": 79040 }, { "epoch": 0.99, "learning_rate": 2.0063904499207836e-05, "loss": 2.2423, "step": 79048 }, { "epoch": 0.99, "learning_rate": 2.006283511118939e-05, "loss": 2.2355, "step": 79056 }, { "epoch": 0.99, "learning_rate": 2.0061774743358958e-05, "loss": 2.2312, "step": 79064 }, { "epoch": 0.99, "learning_rate": 2.006072339582292e-05, "loss": 2.2442, "step": 79072 }, { "epoch": 0.99, "learning_rate": 2.0059681068686686e-05, "loss": 2.2277, "step": 79080 }, { "epoch": 0.99, "learning_rate": 2.0058647762054817e-05, "loss": 2.2309, "step": 79088 }, { "epoch": 0.99, "learning_rate": 2.005762347603094e-05, "loss": 2.2382, "step": 79096 }, { "epoch": 0.99, "learning_rate": 2.0056608210717788e-05, "loss": 2.2268, "step": 79104 }, { "epoch": 0.99, "learning_rate": 2.0055601966217186e-05, "loss": 2.2441, "step": 79112 }, { "epoch": 0.99, "learning_rate": 2.005460474263005e-05, "loss": 2.2518, "step": 79120 }, { "epoch": 0.99, "learning_rate": 2.0053616540056407e-05, "loss": 2.2292, "step": 79128 }, { "epoch": 0.99, "learning_rate": 2.0052637358595355e-05, "loss": 2.2464, "step": 79136 }, { "epoch": 0.99, "learning_rate": 2.0051667198345107e-05, "loss": 2.2307, "step": 79144 }, { "epoch": 0.99, "learning_rate": 2.0050706059402963e-05, "loss": 2.2525, "step": 79152 }, { "epoch": 0.99, "learning_rate": 2.0049753941865323e-05, "loss": 2.2297, "step": 79160 }, { "epoch": 0.99, "learning_rate": 2.0048810845827668e-05, "loss": 2.238, "step": 79168 }, { "epoch": 0.99, "learning_rate": 2.0047876771384603e-05, "loss": 2.2423, "step": 79176 }, { "epoch": 0.99, "learning_rate": 2.00469517186298e-05, "loss": 2.2368, "step": 79184 }, { "epoch": 0.99, "learning_rate": 2.0046035687656034e-05, "loss": 2.2312, "step": 79192 }, { "epoch": 0.99, "learning_rate": 2.004512867855519e-05, "loss": 2.2288, "step": 79200 }, { "epoch": 0.99, "learning_rate": 2.0044230691418218e-05, "loss": 2.2322, "step": 79208 }, { "epoch": 0.99, "learning_rate": 2.0043341726335195e-05, "loss": 2.2314, "step": 79216 }, { "epoch": 0.99, "learning_rate": 2.004246178339527e-05, "loss": 2.2284, "step": 79224 }, { "epoch": 0.99, "learning_rate": 2.00415908626867e-05, "loss": 2.2363, "step": 79232 }, { "epoch": 0.99, "learning_rate": 2.004072896429684e-05, "loss": 2.2534, "step": 79240 }, { "epoch": 0.99, "learning_rate": 2.0039876088312115e-05, "loss": 2.2355, "step": 79248 }, { "epoch": 0.99, "learning_rate": 2.0039032234818092e-05, "loss": 2.236, "step": 79256 }, { "epoch": 0.99, "learning_rate": 2.003819740389938e-05, "loss": 2.2601, "step": 79264 }, { "epoch": 0.99, "learning_rate": 2.0037371595639714e-05, "loss": 2.2406, "step": 79272 }, { "epoch": 0.99, "learning_rate": 2.0036554810121933e-05, "loss": 2.214, "step": 79280 }, { "epoch": 0.99, "learning_rate": 2.003574704742793e-05, "loss": 2.2247, "step": 79288 }, { "epoch": 0.99, "learning_rate": 2.003494830763874e-05, "loss": 2.2331, "step": 79296 }, { "epoch": 0.99, "learning_rate": 2.003415859083446e-05, "loss": 2.2412, "step": 79304 }, { "epoch": 0.99, "learning_rate": 2.0033377897094306e-05, "loss": 2.22, "step": 79312 }, { "epoch": 0.99, "learning_rate": 2.0032606226496564e-05, "loss": 2.231, "step": 79320 }, { "epoch": 0.99, "learning_rate": 2.0031843579118633e-05, "loss": 2.2411, "step": 79328 }, { "epoch": 0.99, "learning_rate": 2.0031089955037012e-05, "loss": 2.214, "step": 79336 }, { "epoch": 0.99, "learning_rate": 2.0030345354327265e-05, "loss": 2.2529, "step": 79344 }, { "epoch": 0.99, "learning_rate": 2.0029609777064096e-05, "loss": 2.2182, "step": 79352 }, { "epoch": 0.99, "learning_rate": 2.0028883223321254e-05, "loss": 2.2367, "step": 79360 }, { "epoch": 0.99, "learning_rate": 2.0028165693171628e-05, "loss": 2.2448, "step": 79368 }, { "epoch": 0.99, "learning_rate": 2.002745718668717e-05, "loss": 2.2383, "step": 79376 }, { "epoch": 0.99, "learning_rate": 2.0026757703938943e-05, "loss": 2.2237, "step": 79384 }, { "epoch": 0.99, "learning_rate": 2.0026067244997105e-05, "loss": 2.2053, "step": 79392 }, { "epoch": 0.99, "learning_rate": 2.00253858099309e-05, "loss": 2.2349, "step": 79400 }, { "epoch": 0.99, "learning_rate": 2.0024713398808675e-05, "loss": 2.2406, "step": 79408 }, { "epoch": 0.99, "learning_rate": 2.0024050011697874e-05, "loss": 2.2394, "step": 79416 }, { "epoch": 0.99, "learning_rate": 2.0023395648665012e-05, "loss": 2.2366, "step": 79424 }, { "epoch": 0.99, "learning_rate": 2.0022750309775738e-05, "loss": 2.2293, "step": 79432 }, { "epoch": 0.99, "learning_rate": 2.0022113995094772e-05, "loss": 2.2284, "step": 79440 }, { "epoch": 0.99, "learning_rate": 2.0021486704685923e-05, "loss": 2.2304, "step": 79448 }, { "epoch": 0.99, "learning_rate": 2.0020868438612118e-05, "loss": 2.2389, "step": 79456 }, { "epoch": 0.99, "learning_rate": 2.0020259196935346e-05, "loss": 2.2463, "step": 79464 }, { "epoch": 0.99, "learning_rate": 2.001965897971674e-05, "loss": 2.238, "step": 79472 }, { "epoch": 0.99, "learning_rate": 2.0019067787016464e-05, "loss": 2.2463, "step": 79480 }, { "epoch": 0.99, "learning_rate": 2.001848561889385e-05, "loss": 2.2288, "step": 79488 }, { "epoch": 0.99, "learning_rate": 2.0017912475407247e-05, "loss": 2.221, "step": 79496 }, { "epoch": 0.99, "learning_rate": 2.001734835661417e-05, "loss": 2.2409, "step": 79504 }, { "epoch": 0.99, "learning_rate": 2.001679326257117e-05, "loss": 2.2415, "step": 79512 }, { "epoch": 0.99, "learning_rate": 2.001624719333394e-05, "loss": 2.246, "step": 79520 }, { "epoch": 0.99, "learning_rate": 2.001571014895724e-05, "loss": 2.2236, "step": 79528 }, { "epoch": 0.99, "learning_rate": 2.0015182129494924e-05, "loss": 2.242, "step": 79536 }, { "epoch": 0.99, "learning_rate": 2.0014663134999974e-05, "loss": 2.2388, "step": 79544 }, { "epoch": 0.99, "learning_rate": 2.0014153165524418e-05, "loss": 2.2419, "step": 79552 }, { "epoch": 0.99, "learning_rate": 2.001365222111941e-05, "loss": 2.2431, "step": 79560 }, { "epoch": 0.99, "learning_rate": 2.0013160301835194e-05, "loss": 2.2318, "step": 79568 }, { "epoch": 0.99, "learning_rate": 2.0012677407721108e-05, "loss": 2.2461, "step": 79576 }, { "epoch": 0.99, "learning_rate": 2.0012203538825586e-05, "loss": 2.2449, "step": 79584 }, { "epoch": 0.99, "learning_rate": 2.0011738695196146e-05, "loss": 2.2485, "step": 79592 }, { "epoch": 0.99, "learning_rate": 2.0011282876879414e-05, "loss": 2.2389, "step": 79600 }, { "epoch": 1.0, "learning_rate": 2.0010836083921104e-05, "loss": 2.244, "step": 79608 }, { "epoch": 1.0, "learning_rate": 2.001039831636603e-05, "loss": 2.2274, "step": 79616 }, { "epoch": 1.0, "learning_rate": 2.000996957425809e-05, "loss": 2.2348, "step": 79624 }, { "epoch": 1.0, "learning_rate": 2.00095498576403e-05, "loss": 2.2384, "step": 79632 }, { "epoch": 1.0, "learning_rate": 2.000913916655473e-05, "loss": 2.2064, "step": 79640 }, { "epoch": 1.0, "learning_rate": 2.0008737501042602e-05, "loss": 2.2263, "step": 79648 }, { "epoch": 1.0, "learning_rate": 2.0008344861144177e-05, "loss": 2.2422, "step": 79656 }, { "epoch": 1.0, "learning_rate": 2.0007961246898837e-05, "loss": 2.2516, "step": 79664 }, { "epoch": 1.0, "learning_rate": 2.0007586658345072e-05, "loss": 2.2487, "step": 79672 }, { "epoch": 1.0, "learning_rate": 2.000722109552043e-05, "loss": 2.2108, "step": 79680 }, { "epoch": 1.0, "learning_rate": 2.0006864558461583e-05, "loss": 2.2362, "step": 79688 }, { "epoch": 1.0, "learning_rate": 2.0006517047204305e-05, "loss": 2.242, "step": 79696 }, { "epoch": 1.0, "learning_rate": 2.000617856178342e-05, "loss": 2.2201, "step": 79704 }, { "epoch": 1.0, "learning_rate": 2.0005849102232897e-05, "loss": 2.236, "step": 79712 }, { "epoch": 1.0, "learning_rate": 2.0005528668585782e-05, "loss": 2.2307, "step": 79720 }, { "epoch": 1.0, "learning_rate": 2.0005217260874207e-05, "loss": 2.2414, "step": 79728 }, { "epoch": 1.0, "learning_rate": 2.0004914879129394e-05, "loss": 2.2384, "step": 79736 }, { "epoch": 1.0, "learning_rate": 2.0004621523381677e-05, "loss": 2.2263, "step": 79744 }, { "epoch": 1.0, "learning_rate": 2.0004337193660482e-05, "loss": 2.2403, "step": 79752 }, { "epoch": 1.0, "learning_rate": 2.000406188999432e-05, "loss": 2.2434, "step": 79760 }, { "epoch": 1.0, "learning_rate": 2.0003795612410807e-05, "loss": 2.2473, "step": 79768 }, { "epoch": 1.0, "learning_rate": 2.0003538360936653e-05, "loss": 2.2207, "step": 79776 }, { "epoch": 1.0, "learning_rate": 2.000329013559765e-05, "loss": 2.2414, "step": 79784 }, { "epoch": 1.0, "learning_rate": 2.0003050936418692e-05, "loss": 2.2256, "step": 79792 }, { "epoch": 1.0, "learning_rate": 2.000282076342378e-05, "loss": 2.2544, "step": 79800 }, { "epoch": 1.0, "learning_rate": 2.000259961663599e-05, "loss": 2.2385, "step": 79808 }, { "epoch": 1.0, "learning_rate": 2.0002387496077508e-05, "loss": 2.2498, "step": 79816 }, { "epoch": 1.0, "learning_rate": 2.00021844017696e-05, "loss": 2.216, "step": 79824 }, { "epoch": 1.0, "learning_rate": 2.0001990333732647e-05, "loss": 2.2405, "step": 79832 }, { "epoch": 1.0, "learning_rate": 2.0001805291986103e-05, "loss": 2.2351, "step": 79840 }, { "epoch": 1.0, "learning_rate": 2.000162927654854e-05, "loss": 2.2393, "step": 79848 }, { "epoch": 1.0, "learning_rate": 2.000146228743759e-05, "loss": 2.2303, "step": 79856 }, { "epoch": 1.0, "learning_rate": 2.000130432467001e-05, "loss": 2.2186, "step": 79864 }, { "epoch": 1.0, "learning_rate": 2.0001155388261656e-05, "loss": 2.2078, "step": 79872 }, { "epoch": 1.0, "learning_rate": 2.0001015478227448e-05, "loss": 2.244, "step": 79880 }, { "epoch": 1.0, "learning_rate": 2.0000884594581425e-05, "loss": 2.2441, "step": 79888 }, { "epoch": 1.0, "learning_rate": 2.000076273733672e-05, "loss": 2.2301, "step": 79896 }, { "epoch": 1.0, "learning_rate": 2.0000649906505543e-05, "loss": 2.2391, "step": 79904 }, { "epoch": 1.0, "learning_rate": 2.0000546102099226e-05, "loss": 2.2307, "step": 79912 }, { "epoch": 1.0, "learning_rate": 2.000045132412816e-05, "loss": 2.2252, "step": 79920 }, { "epoch": 1.0, "learning_rate": 2.0000365572601862e-05, "loss": 2.2481, "step": 79928 }, { "epoch": 1.0, "learning_rate": 2.000028884752893e-05, "loss": 2.235, "step": 79936 }, { "epoch": 1.0, "learning_rate": 2.0000221148917062e-05, "loss": 2.2301, "step": 79944 }, { "epoch": 1.0, "learning_rate": 2.0000162476773048e-05, "loss": 2.2623, "step": 79952 }, { "epoch": 1.0, "learning_rate": 2.0000112831102773e-05, "loss": 2.2336, "step": 79960 }, { "epoch": 1.0, "learning_rate": 2.0000072211911203e-05, "loss": 2.2275, "step": 79968 }, { "epoch": 1.0, "learning_rate": 2.0000040619202434e-05, "loss": 2.2352, "step": 79976 }, { "epoch": 1.0, "learning_rate": 2.0000018052979615e-05, "loss": 2.2677, "step": 79984 }, { "epoch": 1.0, "learning_rate": 2.0000004513245018e-05, "loss": 2.2489, "step": 79992 }, { "epoch": 1.0, "learning_rate": 2e-05, "loss": 2.2439, "step": 80000 }, { "epoch": 0.5, "learning_rate": 7.38147229679313e-05, "loss": 2.2966, "step": 80008 }, { "epoch": 0.5, "learning_rate": 7.380880403687231e-05, "loss": 2.3107, "step": 80016 }, { "epoch": 0.5, "learning_rate": 7.380288476252493e-05, "loss": 2.286, "step": 80024 }, { "epoch": 0.5, "learning_rate": 7.379696514503625e-05, "loss": 2.2986, "step": 80032 }, { "epoch": 0.5, "learning_rate": 7.379104518455349e-05, "loss": 2.2907, "step": 80040 }, { "epoch": 0.5, "learning_rate": 7.378512488122382e-05, "loss": 2.3108, "step": 80048 }, { "epoch": 0.5, "learning_rate": 7.377920423519435e-05, "loss": 2.2866, "step": 80056 }, { "epoch": 0.5, "learning_rate": 7.377328324661236e-05, "loss": 2.3207, "step": 80064 }, { "epoch": 0.5, "learning_rate": 7.376736191562496e-05, "loss": 2.2933, "step": 80072 }, { "epoch": 0.5, "learning_rate": 7.376144024237946e-05, "loss": 2.3103, "step": 80080 }, { "epoch": 0.5, "learning_rate": 7.375551822702295e-05, "loss": 2.2943, "step": 80088 }, { "epoch": 0.5, "learning_rate": 7.374959586970274e-05, "loss": 2.2651, "step": 80096 }, { "epoch": 0.5, "learning_rate": 7.374367317056606e-05, "loss": 2.2916, "step": 80104 }, { "epoch": 0.5, "learning_rate": 7.373775012976008e-05, "loss": 2.2736, "step": 80112 }, { "epoch": 0.5, "learning_rate": 7.373182674743209e-05, "loss": 2.2699, "step": 80120 }, { "epoch": 0.5, "learning_rate": 7.372590302372936e-05, "loss": 2.2665, "step": 80128 }, { "epoch": 0.5, "learning_rate": 7.371997895879916e-05, "loss": 2.2664, "step": 80136 }, { "epoch": 0.5, "learning_rate": 7.371405455278872e-05, "loss": 2.2644, "step": 80144 }, { "epoch": 0.5, "learning_rate": 7.370812980584536e-05, "loss": 2.2634, "step": 80152 }, { "epoch": 0.5, "learning_rate": 7.370220471811635e-05, "loss": 2.2723, "step": 80160 }, { "epoch": 0.5, "learning_rate": 7.369627928974898e-05, "loss": 2.2508, "step": 80168 }, { "epoch": 0.5, "learning_rate": 7.36903535208906e-05, "loss": 2.2603, "step": 80176 }, { "epoch": 0.5, "learning_rate": 7.368442741168846e-05, "loss": 2.2474, "step": 80184 }, { "epoch": 0.5, "learning_rate": 7.367850096228994e-05, "loss": 2.2315, "step": 80192 }, { "epoch": 0.5, "learning_rate": 7.367257417284235e-05, "loss": 2.2511, "step": 80200 }, { "epoch": 0.5, "learning_rate": 7.366664704349303e-05, "loss": 2.2528, "step": 80208 }, { "epoch": 0.5, "learning_rate": 7.366071957438931e-05, "loss": 2.247, "step": 80216 }, { "epoch": 0.5, "learning_rate": 7.36547917656786e-05, "loss": 2.2485, "step": 80224 }, { "epoch": 0.5, "learning_rate": 7.364886361750822e-05, "loss": 2.2404, "step": 80232 }, { "epoch": 0.5, "learning_rate": 7.364293513002556e-05, "loss": 2.2477, "step": 80240 }, { "epoch": 0.5, "learning_rate": 7.363700630337803e-05, "loss": 2.2476, "step": 80248 }, { "epoch": 0.5, "learning_rate": 7.363107713771295e-05, "loss": 2.25, "step": 80256 }, { "epoch": 0.5, "learning_rate": 7.362514763317778e-05, "loss": 2.2357, "step": 80264 }, { "epoch": 0.5, "learning_rate": 7.361921778991992e-05, "loss": 2.2522, "step": 80272 }, { "epoch": 0.5, "learning_rate": 7.361328760808676e-05, "loss": 2.2628, "step": 80280 }, { "epoch": 0.5, "learning_rate": 7.360735708782575e-05, "loss": 2.2491, "step": 80288 }, { "epoch": 0.5, "learning_rate": 7.360142622928432e-05, "loss": 2.2538, "step": 80296 }, { "epoch": 0.5, "learning_rate": 7.359549503260992e-05, "loss": 2.2652, "step": 80304 }, { "epoch": 0.5, "learning_rate": 7.358956349794996e-05, "loss": 2.2593, "step": 80312 }, { "epoch": 0.5, "learning_rate": 7.358363162545194e-05, "loss": 2.2539, "step": 80320 }, { "epoch": 0.5, "learning_rate": 7.357769941526334e-05, "loss": 2.2555, "step": 80328 }, { "epoch": 0.5, "learning_rate": 7.357176686753156e-05, "loss": 2.2586, "step": 80336 }, { "epoch": 0.5, "learning_rate": 7.356583398240415e-05, "loss": 2.2395, "step": 80344 }, { "epoch": 0.5, "learning_rate": 7.355990076002861e-05, "loss": 2.2513, "step": 80352 }, { "epoch": 0.5, "learning_rate": 7.355396720055241e-05, "loss": 2.2422, "step": 80360 }, { "epoch": 0.5, "learning_rate": 7.354803330412303e-05, "loss": 2.2432, "step": 80368 }, { "epoch": 0.5, "learning_rate": 7.354209907088804e-05, "loss": 2.2373, "step": 80376 }, { "epoch": 0.5, "learning_rate": 7.353616450099496e-05, "loss": 2.2376, "step": 80384 }, { "epoch": 0.5, "learning_rate": 7.35302295945913e-05, "loss": 2.2508, "step": 80392 }, { "epoch": 0.5, "learning_rate": 7.352429435182462e-05, "loss": 2.2441, "step": 80400 }, { "epoch": 0.5, "learning_rate": 7.351835877284246e-05, "loss": 2.2479, "step": 80408 }, { "epoch": 0.5, "learning_rate": 7.351242285779241e-05, "loss": 2.2488, "step": 80416 }, { "epoch": 0.5, "learning_rate": 7.350648660682197e-05, "loss": 2.243, "step": 80424 }, { "epoch": 0.5, "learning_rate": 7.350055002007878e-05, "loss": 2.2452, "step": 80432 }, { "epoch": 0.5, "learning_rate": 7.34946130977104e-05, "loss": 2.2454, "step": 80440 }, { "epoch": 0.5, "learning_rate": 7.348867583986443e-05, "loss": 2.2646, "step": 80448 }, { "epoch": 0.5, "learning_rate": 7.348273824668846e-05, "loss": 2.2679, "step": 80456 }, { "epoch": 0.5, "learning_rate": 7.347680031833008e-05, "loss": 2.255, "step": 80464 }, { "epoch": 0.5, "learning_rate": 7.347086205493696e-05, "loss": 2.2689, "step": 80472 }, { "epoch": 0.5, "learning_rate": 7.34649234566567e-05, "loss": 2.2683, "step": 80480 }, { "epoch": 0.5, "learning_rate": 7.345898452363693e-05, "loss": 2.2572, "step": 80488 }, { "epoch": 0.5, "learning_rate": 7.345304525602528e-05, "loss": 2.2435, "step": 80496 }, { "epoch": 0.5, "learning_rate": 7.344710565396942e-05, "loss": 2.2718, "step": 80504 }, { "epoch": 0.5, "learning_rate": 7.344116571761701e-05, "loss": 2.252, "step": 80512 }, { "epoch": 0.5, "learning_rate": 7.343522544711572e-05, "loss": 2.2653, "step": 80520 }, { "epoch": 0.5, "learning_rate": 7.34292848426132e-05, "loss": 2.2687, "step": 80528 }, { "epoch": 0.5, "learning_rate": 7.342334390425715e-05, "loss": 2.2641, "step": 80536 }, { "epoch": 0.5, "learning_rate": 7.34174026321953e-05, "loss": 2.2609, "step": 80544 }, { "epoch": 0.5, "learning_rate": 7.341146102657528e-05, "loss": 2.2604, "step": 80552 }, { "epoch": 0.5, "learning_rate": 7.340551908754485e-05, "loss": 2.2573, "step": 80560 }, { "epoch": 0.5, "learning_rate": 7.339957681525171e-05, "loss": 2.2714, "step": 80568 }, { "epoch": 0.5, "learning_rate": 7.33936342098436e-05, "loss": 2.2757, "step": 80576 }, { "epoch": 0.5, "learning_rate": 7.33876912714682e-05, "loss": 2.2602, "step": 80584 }, { "epoch": 0.5, "learning_rate": 7.338174800027333e-05, "loss": 2.263, "step": 80592 }, { "epoch": 0.5, "learning_rate": 7.337580439640668e-05, "loss": 2.2645, "step": 80600 }, { "epoch": 0.5, "learning_rate": 7.336986046001603e-05, "loss": 2.2812, "step": 80608 }, { "epoch": 0.5, "learning_rate": 7.336391619124918e-05, "loss": 2.2673, "step": 80616 }, { "epoch": 0.5, "learning_rate": 7.335797159025386e-05, "loss": 2.2672, "step": 80624 }, { "epoch": 0.5, "learning_rate": 7.335202665717786e-05, "loss": 2.2697, "step": 80632 }, { "epoch": 0.5, "learning_rate": 7.334608139216899e-05, "loss": 2.2499, "step": 80640 }, { "epoch": 0.5, "learning_rate": 7.334013579537503e-05, "loss": 2.2636, "step": 80648 }, { "epoch": 0.5, "learning_rate": 7.333418986694381e-05, "loss": 2.2493, "step": 80656 }, { "epoch": 0.5, "learning_rate": 7.33282436070231e-05, "loss": 2.2479, "step": 80664 }, { "epoch": 0.5, "learning_rate": 7.332229701576078e-05, "loss": 2.2426, "step": 80672 }, { "epoch": 0.5, "learning_rate": 7.331635009330466e-05, "loss": 2.259, "step": 80680 }, { "epoch": 0.5, "learning_rate": 7.33104028398026e-05, "loss": 2.2529, "step": 80688 }, { "epoch": 0.5, "learning_rate": 7.330445525540242e-05, "loss": 2.2591, "step": 80696 }, { "epoch": 0.5, "learning_rate": 7.329850734025199e-05, "loss": 2.2717, "step": 80704 }, { "epoch": 0.5, "learning_rate": 7.329255909449917e-05, "loss": 2.2394, "step": 80712 }, { "epoch": 0.5, "learning_rate": 7.328661051829182e-05, "loss": 2.2555, "step": 80720 }, { "epoch": 0.5, "learning_rate": 7.328066161177789e-05, "loss": 2.2517, "step": 80728 }, { "epoch": 0.5, "learning_rate": 7.327471237510517e-05, "loss": 2.2377, "step": 80736 }, { "epoch": 0.5, "learning_rate": 7.326876280842166e-05, "loss": 2.2513, "step": 80744 }, { "epoch": 0.5, "learning_rate": 7.32628129118752e-05, "loss": 2.2567, "step": 80752 }, { "epoch": 0.5, "learning_rate": 7.325686268561372e-05, "loss": 2.2512, "step": 80760 }, { "epoch": 0.5, "learning_rate": 7.325091212978512e-05, "loss": 2.2509, "step": 80768 }, { "epoch": 0.5, "learning_rate": 7.32449612445374e-05, "loss": 2.2414, "step": 80776 }, { "epoch": 0.5, "learning_rate": 7.323901003001842e-05, "loss": 2.2325, "step": 80784 }, { "epoch": 0.5, "learning_rate": 7.32330584863762e-05, "loss": 2.2383, "step": 80792 }, { "epoch": 0.51, "learning_rate": 7.322710661375864e-05, "loss": 2.2356, "step": 80800 }, { "epoch": 0.51, "learning_rate": 7.322115441231374e-05, "loss": 2.2269, "step": 80808 }, { "epoch": 0.51, "learning_rate": 7.321520188218944e-05, "loss": 2.2349, "step": 80816 }, { "epoch": 0.51, "learning_rate": 7.320924902353374e-05, "loss": 2.231, "step": 80824 }, { "epoch": 0.51, "learning_rate": 7.320329583649466e-05, "loss": 2.248, "step": 80832 }, { "epoch": 0.51, "learning_rate": 7.319734232122011e-05, "loss": 2.2198, "step": 80840 }, { "epoch": 0.51, "learning_rate": 7.319138847785818e-05, "loss": 2.2308, "step": 80848 }, { "epoch": 0.51, "learning_rate": 7.318543430655686e-05, "loss": 2.2546, "step": 80856 }, { "epoch": 0.51, "learning_rate": 7.317947980746416e-05, "loss": 2.2496, "step": 80864 }, { "epoch": 0.51, "learning_rate": 7.317352498072809e-05, "loss": 2.2337, "step": 80872 }, { "epoch": 0.51, "learning_rate": 7.316756982649675e-05, "loss": 2.2613, "step": 80880 }, { "epoch": 0.51, "learning_rate": 7.316161434491813e-05, "loss": 2.2481, "step": 80888 }, { "epoch": 0.51, "learning_rate": 7.315565853614028e-05, "loss": 2.2504, "step": 80896 }, { "epoch": 0.51, "learning_rate": 7.314970240031131e-05, "loss": 2.2487, "step": 80904 }, { "epoch": 0.51, "learning_rate": 7.314374593757924e-05, "loss": 2.2561, "step": 80912 }, { "epoch": 0.51, "learning_rate": 7.31377891480922e-05, "loss": 2.2646, "step": 80920 }, { "epoch": 0.51, "learning_rate": 7.313183203199823e-05, "loss": 2.2603, "step": 80928 }, { "epoch": 0.51, "learning_rate": 7.312587458944542e-05, "loss": 2.2585, "step": 80936 }, { "epoch": 0.51, "learning_rate": 7.311991682058193e-05, "loss": 2.241, "step": 80944 }, { "epoch": 0.51, "learning_rate": 7.311395872555582e-05, "loss": 2.2645, "step": 80952 }, { "epoch": 0.51, "learning_rate": 7.310800030451523e-05, "loss": 2.2588, "step": 80960 }, { "epoch": 0.51, "learning_rate": 7.310204155760829e-05, "loss": 2.2659, "step": 80968 }, { "epoch": 0.51, "learning_rate": 7.309608248498312e-05, "loss": 2.2607, "step": 80976 }, { "epoch": 0.51, "learning_rate": 7.309012308678787e-05, "loss": 2.2587, "step": 80984 }, { "epoch": 0.51, "learning_rate": 7.308416336317068e-05, "loss": 2.255, "step": 80992 }, { "epoch": 0.51, "learning_rate": 7.307820331427973e-05, "loss": 2.2608, "step": 81000 }, { "epoch": 0.51, "learning_rate": 7.307224294026318e-05, "loss": 2.2463, "step": 81008 }, { "epoch": 0.51, "learning_rate": 7.306628224126921e-05, "loss": 2.2428, "step": 81016 }, { "epoch": 0.51, "learning_rate": 7.306032121744597e-05, "loss": 2.2431, "step": 81024 }, { "epoch": 0.51, "learning_rate": 7.305435986894169e-05, "loss": 2.2466, "step": 81032 }, { "epoch": 0.51, "learning_rate": 7.304839819590459e-05, "loss": 2.2468, "step": 81040 }, { "epoch": 0.51, "learning_rate": 7.304243619848281e-05, "loss": 2.2519, "step": 81048 }, { "epoch": 0.51, "learning_rate": 7.303647387682462e-05, "loss": 2.2492, "step": 81056 }, { "epoch": 0.51, "learning_rate": 7.303051123107822e-05, "loss": 2.2464, "step": 81064 }, { "epoch": 0.51, "learning_rate": 7.302454826139185e-05, "loss": 2.2334, "step": 81072 }, { "epoch": 0.51, "learning_rate": 7.301858496791376e-05, "loss": 2.2378, "step": 81080 }, { "epoch": 0.51, "learning_rate": 7.301262135079216e-05, "loss": 2.2409, "step": 81088 }, { "epoch": 0.51, "learning_rate": 7.300665741017535e-05, "loss": 2.2441, "step": 81096 }, { "epoch": 0.51, "learning_rate": 7.300069314621161e-05, "loss": 2.2521, "step": 81104 }, { "epoch": 0.51, "learning_rate": 7.299472855904914e-05, "loss": 2.258, "step": 81112 }, { "epoch": 0.51, "learning_rate": 7.298876364883626e-05, "loss": 2.2478, "step": 81120 }, { "epoch": 0.51, "learning_rate": 7.298279841572126e-05, "loss": 2.2501, "step": 81128 }, { "epoch": 0.51, "learning_rate": 7.297683285985246e-05, "loss": 2.2488, "step": 81136 }, { "epoch": 0.51, "learning_rate": 7.297086698137812e-05, "loss": 2.2596, "step": 81144 }, { "epoch": 0.51, "learning_rate": 7.296490078044656e-05, "loss": 2.2385, "step": 81152 }, { "epoch": 0.51, "learning_rate": 7.295893425720615e-05, "loss": 2.2482, "step": 81160 }, { "epoch": 0.51, "learning_rate": 7.295296741180513e-05, "loss": 2.2539, "step": 81168 }, { "epoch": 0.51, "learning_rate": 7.294700024439191e-05, "loss": 2.2507, "step": 81176 }, { "epoch": 0.51, "learning_rate": 7.294103275511484e-05, "loss": 2.2616, "step": 81184 }, { "epoch": 0.51, "learning_rate": 7.293506494412222e-05, "loss": 2.2651, "step": 81192 }, { "epoch": 0.51, "learning_rate": 7.292909681156241e-05, "loss": 2.2529, "step": 81200 }, { "epoch": 0.51, "learning_rate": 7.292312835758382e-05, "loss": 2.2598, "step": 81208 }, { "epoch": 0.51, "learning_rate": 7.291715958233482e-05, "loss": 2.2445, "step": 81216 }, { "epoch": 0.51, "learning_rate": 7.291119048596377e-05, "loss": 2.2491, "step": 81224 }, { "epoch": 0.51, "learning_rate": 7.29052210686191e-05, "loss": 2.258, "step": 81232 }, { "epoch": 0.51, "learning_rate": 7.289925133044915e-05, "loss": 2.2497, "step": 81240 }, { "epoch": 0.51, "learning_rate": 7.28932812716024e-05, "loss": 2.2516, "step": 81248 }, { "epoch": 0.51, "learning_rate": 7.28873108922272e-05, "loss": 2.2635, "step": 81256 }, { "epoch": 0.51, "learning_rate": 7.288134019247203e-05, "loss": 2.2599, "step": 81264 }, { "epoch": 0.51, "learning_rate": 7.287536917248528e-05, "loss": 2.2758, "step": 81272 }, { "epoch": 0.51, "learning_rate": 7.286939783241542e-05, "loss": 2.2603, "step": 81280 }, { "epoch": 0.51, "learning_rate": 7.286342617241089e-05, "loss": 2.2543, "step": 81288 }, { "epoch": 0.51, "learning_rate": 7.285745419262012e-05, "loss": 2.2551, "step": 81296 }, { "epoch": 0.51, "learning_rate": 7.28514818931916e-05, "loss": 2.2465, "step": 81304 }, { "epoch": 0.51, "learning_rate": 7.284550927427383e-05, "loss": 2.2359, "step": 81312 }, { "epoch": 0.51, "learning_rate": 7.283953633601523e-05, "loss": 2.2736, "step": 81320 }, { "epoch": 0.51, "learning_rate": 7.283356307856432e-05, "loss": 2.248, "step": 81328 }, { "epoch": 0.51, "learning_rate": 7.282758950206958e-05, "loss": 2.2566, "step": 81336 }, { "epoch": 0.51, "learning_rate": 7.282161560667955e-05, "loss": 2.2479, "step": 81344 }, { "epoch": 0.51, "learning_rate": 7.281564139254271e-05, "loss": 2.2379, "step": 81352 }, { "epoch": 0.51, "learning_rate": 7.28096668598076e-05, "loss": 2.2586, "step": 81360 }, { "epoch": 0.51, "learning_rate": 7.280369200862269e-05, "loss": 2.2411, "step": 81368 }, { "epoch": 0.51, "learning_rate": 7.279771683913661e-05, "loss": 2.2503, "step": 81376 }, { "epoch": 0.51, "learning_rate": 7.279174135149782e-05, "loss": 2.2509, "step": 81384 }, { "epoch": 0.51, "learning_rate": 7.278576554585493e-05, "loss": 2.2578, "step": 81392 }, { "epoch": 0.51, "learning_rate": 7.277978942235644e-05, "loss": 2.2582, "step": 81400 }, { "epoch": 0.51, "learning_rate": 7.277381298115098e-05, "loss": 2.2685, "step": 81408 }, { "epoch": 0.51, "learning_rate": 7.27678362223871e-05, "loss": 2.2655, "step": 81416 }, { "epoch": 0.51, "learning_rate": 7.276185914621334e-05, "loss": 2.2534, "step": 81424 }, { "epoch": 0.51, "learning_rate": 7.275588175277837e-05, "loss": 2.2563, "step": 81432 }, { "epoch": 0.51, "learning_rate": 7.274990404223074e-05, "loss": 2.2573, "step": 81440 }, { "epoch": 0.51, "learning_rate": 7.274392601471907e-05, "loss": 2.2627, "step": 81448 }, { "epoch": 0.51, "learning_rate": 7.273794767039195e-05, "loss": 2.2621, "step": 81456 }, { "epoch": 0.51, "learning_rate": 7.273196900939802e-05, "loss": 2.2709, "step": 81464 }, { "epoch": 0.51, "learning_rate": 7.272599003188593e-05, "loss": 2.255, "step": 81472 }, { "epoch": 0.51, "learning_rate": 7.27200107380043e-05, "loss": 2.2664, "step": 81480 }, { "epoch": 0.51, "learning_rate": 7.271403112790177e-05, "loss": 2.2685, "step": 81488 }, { "epoch": 0.51, "learning_rate": 7.270805120172702e-05, "loss": 2.2815, "step": 81496 }, { "epoch": 0.51, "learning_rate": 7.270207095962864e-05, "loss": 2.2348, "step": 81504 }, { "epoch": 0.51, "learning_rate": 7.26960904017554e-05, "loss": 2.2584, "step": 81512 }, { "epoch": 0.51, "learning_rate": 7.26901095282559e-05, "loss": 2.2523, "step": 81520 }, { "epoch": 0.51, "learning_rate": 7.268412833927887e-05, "loss": 2.2553, "step": 81528 }, { "epoch": 0.51, "learning_rate": 7.267814683497298e-05, "loss": 2.2599, "step": 81536 }, { "epoch": 0.51, "learning_rate": 7.267216501548692e-05, "loss": 2.261, "step": 81544 }, { "epoch": 0.51, "learning_rate": 7.266618288096944e-05, "loss": 2.2645, "step": 81552 }, { "epoch": 0.51, "learning_rate": 7.266020043156922e-05, "loss": 2.277, "step": 81560 }, { "epoch": 0.51, "learning_rate": 7.2654217667435e-05, "loss": 2.2653, "step": 81568 }, { "epoch": 0.51, "learning_rate": 7.264823458871552e-05, "loss": 2.2611, "step": 81576 }, { "epoch": 0.51, "learning_rate": 7.26422511955595e-05, "loss": 2.2761, "step": 81584 }, { "epoch": 0.51, "learning_rate": 7.26362674881157e-05, "loss": 2.2728, "step": 81592 }, { "epoch": 0.51, "learning_rate": 7.263028346653287e-05, "loss": 2.2616, "step": 81600 }, { "epoch": 0.51, "learning_rate": 7.262429913095976e-05, "loss": 2.2612, "step": 81608 }, { "epoch": 0.51, "learning_rate": 7.261831448154516e-05, "loss": 2.2662, "step": 81616 }, { "epoch": 0.51, "learning_rate": 7.261232951843789e-05, "loss": 2.2677, "step": 81624 }, { "epoch": 0.51, "learning_rate": 7.260634424178665e-05, "loss": 2.2633, "step": 81632 }, { "epoch": 0.51, "learning_rate": 7.260035865174028e-05, "loss": 2.2668, "step": 81640 }, { "epoch": 0.51, "learning_rate": 7.25943727484476e-05, "loss": 2.2859, "step": 81648 }, { "epoch": 0.51, "learning_rate": 7.258838653205737e-05, "loss": 2.2493, "step": 81656 }, { "epoch": 0.51, "learning_rate": 7.258240000271848e-05, "loss": 2.2704, "step": 81664 }, { "epoch": 0.51, "learning_rate": 7.257641316057969e-05, "loss": 2.2799, "step": 81672 }, { "epoch": 0.51, "learning_rate": 7.257042600578985e-05, "loss": 2.2558, "step": 81680 }, { "epoch": 0.51, "learning_rate": 7.256443853849784e-05, "loss": 2.2631, "step": 81688 }, { "epoch": 0.51, "learning_rate": 7.255845075885244e-05, "loss": 2.2643, "step": 81696 }, { "epoch": 0.51, "learning_rate": 7.255246266700258e-05, "loss": 2.2586, "step": 81704 }, { "epoch": 0.51, "learning_rate": 7.254647426309706e-05, "loss": 2.2551, "step": 81712 }, { "epoch": 0.51, "learning_rate": 7.254048554728479e-05, "loss": 2.2583, "step": 81720 }, { "epoch": 0.51, "learning_rate": 7.253449651971467e-05, "loss": 2.2445, "step": 81728 }, { "epoch": 0.51, "learning_rate": 7.252850718053552e-05, "loss": 2.253, "step": 81736 }, { "epoch": 0.51, "learning_rate": 7.252251752989629e-05, "loss": 2.2464, "step": 81744 }, { "epoch": 0.51, "learning_rate": 7.251652756794587e-05, "loss": 2.2358, "step": 81752 }, { "epoch": 0.51, "learning_rate": 7.251053729483317e-05, "loss": 2.2483, "step": 81760 }, { "epoch": 0.51, "learning_rate": 7.250454671070712e-05, "loss": 2.2392, "step": 81768 }, { "epoch": 0.51, "learning_rate": 7.249855581571662e-05, "loss": 2.2474, "step": 81776 }, { "epoch": 0.51, "learning_rate": 7.249256461001064e-05, "loss": 2.2435, "step": 81784 }, { "epoch": 0.51, "learning_rate": 7.248657309373807e-05, "loss": 2.2508, "step": 81792 }, { "epoch": 0.51, "learning_rate": 7.24805812670479e-05, "loss": 2.2451, "step": 81800 }, { "epoch": 0.51, "learning_rate": 7.247458913008911e-05, "loss": 2.2468, "step": 81808 }, { "epoch": 0.51, "learning_rate": 7.246859668301063e-05, "loss": 2.2458, "step": 81816 }, { "epoch": 0.51, "learning_rate": 7.24626039259614e-05, "loss": 2.2378, "step": 81824 }, { "epoch": 0.51, "learning_rate": 7.245661085909048e-05, "loss": 2.2381, "step": 81832 }, { "epoch": 0.51, "learning_rate": 7.24506174825468e-05, "loss": 2.2402, "step": 81840 }, { "epoch": 0.51, "learning_rate": 7.244462379647936e-05, "loss": 2.2334, "step": 81848 }, { "epoch": 0.51, "learning_rate": 7.24386298010372e-05, "loss": 2.2462, "step": 81856 }, { "epoch": 0.51, "learning_rate": 7.243263549636927e-05, "loss": 2.239, "step": 81864 }, { "epoch": 0.51, "learning_rate": 7.242664088262465e-05, "loss": 2.2508, "step": 81872 }, { "epoch": 0.51, "learning_rate": 7.242064595995234e-05, "loss": 2.2407, "step": 81880 }, { "epoch": 0.51, "learning_rate": 7.24146507285014e-05, "loss": 2.2584, "step": 81888 }, { "epoch": 0.51, "learning_rate": 7.240865518842081e-05, "loss": 2.2453, "step": 81896 }, { "epoch": 0.51, "learning_rate": 7.24026593398597e-05, "loss": 2.2648, "step": 81904 }, { "epoch": 0.51, "learning_rate": 7.239666318296707e-05, "loss": 2.2606, "step": 81912 }, { "epoch": 0.51, "learning_rate": 7.239066671789198e-05, "loss": 2.243, "step": 81920 }, { "epoch": 0.51, "learning_rate": 7.238466994478357e-05, "loss": 2.2477, "step": 81928 }, { "epoch": 0.51, "learning_rate": 7.237867286379085e-05, "loss": 2.2656, "step": 81936 }, { "epoch": 0.51, "learning_rate": 7.237267547506295e-05, "loss": 2.2684, "step": 81944 }, { "epoch": 0.51, "learning_rate": 7.23666777787489e-05, "loss": 2.2658, "step": 81952 }, { "epoch": 0.51, "learning_rate": 7.23606797749979e-05, "loss": 2.2537, "step": 81960 }, { "epoch": 0.51, "learning_rate": 7.235468146395901e-05, "loss": 2.2549, "step": 81968 }, { "epoch": 0.51, "learning_rate": 7.234868284578136e-05, "loss": 2.2607, "step": 81976 }, { "epoch": 0.51, "learning_rate": 7.234268392061402e-05, "loss": 2.2431, "step": 81984 }, { "epoch": 0.51, "learning_rate": 7.233668468860622e-05, "loss": 2.2528, "step": 81992 }, { "epoch": 0.51, "learning_rate": 7.233068514990704e-05, "loss": 2.2399, "step": 82000 }, { "epoch": 0.51, "learning_rate": 7.232468530466566e-05, "loss": 2.2587, "step": 82008 }, { "epoch": 0.51, "learning_rate": 7.23186851530312e-05, "loss": 2.2555, "step": 82016 }, { "epoch": 0.51, "learning_rate": 7.231268469515284e-05, "loss": 2.253, "step": 82024 }, { "epoch": 0.51, "learning_rate": 7.230668393117979e-05, "loss": 2.2544, "step": 82032 }, { "epoch": 0.51, "learning_rate": 7.230068286126117e-05, "loss": 2.258, "step": 82040 }, { "epoch": 0.51, "learning_rate": 7.229468148554619e-05, "loss": 2.2482, "step": 82048 }, { "epoch": 0.51, "learning_rate": 7.228867980418405e-05, "loss": 2.2572, "step": 82056 }, { "epoch": 0.51, "learning_rate": 7.228267781732397e-05, "loss": 2.2559, "step": 82064 }, { "epoch": 0.51, "learning_rate": 7.227667552511512e-05, "loss": 2.2448, "step": 82072 }, { "epoch": 0.51, "learning_rate": 7.227067292770675e-05, "loss": 2.2496, "step": 82080 }, { "epoch": 0.51, "learning_rate": 7.226467002524806e-05, "loss": 2.2634, "step": 82088 }, { "epoch": 0.51, "learning_rate": 7.225866681788833e-05, "loss": 2.2274, "step": 82096 }, { "epoch": 0.51, "learning_rate": 7.225266330577673e-05, "loss": 2.2452, "step": 82104 }, { "epoch": 0.51, "learning_rate": 7.224665948906258e-05, "loss": 2.2395, "step": 82112 }, { "epoch": 0.51, "learning_rate": 7.224065536789508e-05, "loss": 2.2495, "step": 82120 }, { "epoch": 0.51, "learning_rate": 7.22346509424235e-05, "loss": 2.2621, "step": 82128 }, { "epoch": 0.51, "learning_rate": 7.222864621279714e-05, "loss": 2.2444, "step": 82136 }, { "epoch": 0.51, "learning_rate": 7.222264117916529e-05, "loss": 2.2538, "step": 82144 }, { "epoch": 0.51, "learning_rate": 7.221663584167718e-05, "loss": 2.246, "step": 82152 }, { "epoch": 0.51, "learning_rate": 7.221063020048213e-05, "loss": 2.2546, "step": 82160 }, { "epoch": 0.51, "learning_rate": 7.220462425572947e-05, "loss": 2.2229, "step": 82168 }, { "epoch": 0.51, "learning_rate": 7.219861800756844e-05, "loss": 2.2587, "step": 82176 }, { "epoch": 0.51, "learning_rate": 7.219261145614841e-05, "loss": 2.2364, "step": 82184 }, { "epoch": 0.51, "learning_rate": 7.218660460161872e-05, "loss": 2.2613, "step": 82192 }, { "epoch": 0.51, "learning_rate": 7.218059744412864e-05, "loss": 2.2516, "step": 82200 }, { "epoch": 0.51, "learning_rate": 7.217458998382756e-05, "loss": 2.2416, "step": 82208 }, { "epoch": 0.51, "learning_rate": 7.21685822208648e-05, "loss": 2.254, "step": 82216 }, { "epoch": 0.51, "learning_rate": 7.216257415538971e-05, "loss": 2.26, "step": 82224 }, { "epoch": 0.51, "learning_rate": 7.21565657875517e-05, "loss": 2.2307, "step": 82232 }, { "epoch": 0.51, "learning_rate": 7.215055711750007e-05, "loss": 2.2419, "step": 82240 }, { "epoch": 0.51, "learning_rate": 7.214454814538423e-05, "loss": 2.2425, "step": 82248 }, { "epoch": 0.51, "learning_rate": 7.213853887135355e-05, "loss": 2.2364, "step": 82256 }, { "epoch": 0.51, "learning_rate": 7.213252929555745e-05, "loss": 2.2425, "step": 82264 }, { "epoch": 0.51, "learning_rate": 7.21265194181453e-05, "loss": 2.2477, "step": 82272 }, { "epoch": 0.51, "learning_rate": 7.212050923926653e-05, "loss": 2.253, "step": 82280 }, { "epoch": 0.51, "learning_rate": 7.211449875907052e-05, "loss": 2.2556, "step": 82288 }, { "epoch": 0.51, "learning_rate": 7.210848797770673e-05, "loss": 2.2464, "step": 82296 }, { "epoch": 0.51, "learning_rate": 7.210247689532456e-05, "loss": 2.2655, "step": 82304 }, { "epoch": 0.51, "learning_rate": 7.209646551207348e-05, "loss": 2.254, "step": 82312 }, { "epoch": 0.51, "learning_rate": 7.209045382810286e-05, "loss": 2.2426, "step": 82320 }, { "epoch": 0.51, "learning_rate": 7.208444184356225e-05, "loss": 2.2469, "step": 82328 }, { "epoch": 0.51, "learning_rate": 7.207842955860105e-05, "loss": 2.2529, "step": 82336 }, { "epoch": 0.51, "learning_rate": 7.207241697336871e-05, "loss": 2.2771, "step": 82344 }, { "epoch": 0.51, "learning_rate": 7.206640408801476e-05, "loss": 2.2681, "step": 82352 }, { "epoch": 0.51, "learning_rate": 7.206039090268861e-05, "loss": 2.2641, "step": 82360 }, { "epoch": 0.51, "learning_rate": 7.205437741753985e-05, "loss": 2.2525, "step": 82368 }, { "epoch": 0.51, "learning_rate": 7.204836363271788e-05, "loss": 2.252, "step": 82376 }, { "epoch": 0.51, "learning_rate": 7.204234954837223e-05, "loss": 2.2666, "step": 82384 }, { "epoch": 0.51, "learning_rate": 7.203633516465242e-05, "loss": 2.2679, "step": 82392 }, { "epoch": 0.52, "learning_rate": 7.203032048170797e-05, "loss": 2.2674, "step": 82400 }, { "epoch": 0.52, "learning_rate": 7.202430549968841e-05, "loss": 2.2706, "step": 82408 }, { "epoch": 0.52, "learning_rate": 7.201829021874327e-05, "loss": 2.2649, "step": 82416 }, { "epoch": 0.52, "learning_rate": 7.201227463902207e-05, "loss": 2.2745, "step": 82424 }, { "epoch": 0.52, "learning_rate": 7.200625876067439e-05, "loss": 2.281, "step": 82432 }, { "epoch": 0.52, "learning_rate": 7.200024258384977e-05, "loss": 2.2768, "step": 82440 }, { "epoch": 0.52, "learning_rate": 7.199422610869777e-05, "loss": 2.2875, "step": 82448 }, { "epoch": 0.52, "learning_rate": 7.198820933536796e-05, "loss": 2.2823, "step": 82456 }, { "epoch": 0.52, "learning_rate": 7.198219226400993e-05, "loss": 2.2704, "step": 82464 }, { "epoch": 0.52, "learning_rate": 7.197617489477327e-05, "loss": 2.2702, "step": 82472 }, { "epoch": 0.52, "learning_rate": 7.19701572278075e-05, "loss": 2.2734, "step": 82480 }, { "epoch": 0.52, "learning_rate": 7.196413926326233e-05, "loss": 2.2815, "step": 82488 }, { "epoch": 0.52, "learning_rate": 7.19581210012873e-05, "loss": 2.2658, "step": 82496 }, { "epoch": 0.52, "learning_rate": 7.195210244203205e-05, "loss": 2.271, "step": 82504 }, { "epoch": 0.52, "learning_rate": 7.194608358564618e-05, "loss": 2.2777, "step": 82512 }, { "epoch": 0.52, "learning_rate": 7.194006443227934e-05, "loss": 2.2748, "step": 82520 }, { "epoch": 0.52, "learning_rate": 7.193404498208116e-05, "loss": 2.2643, "step": 82528 }, { "epoch": 0.52, "learning_rate": 7.192802523520128e-05, "loss": 2.2604, "step": 82536 }, { "epoch": 0.52, "learning_rate": 7.192200519178933e-05, "loss": 2.2815, "step": 82544 }, { "epoch": 0.52, "learning_rate": 7.191598485199505e-05, "loss": 2.2765, "step": 82552 }, { "epoch": 0.52, "learning_rate": 7.190996421596798e-05, "loss": 2.2724, "step": 82560 }, { "epoch": 0.52, "learning_rate": 7.190394328385792e-05, "loss": 2.2564, "step": 82568 }, { "epoch": 0.52, "learning_rate": 7.189792205581445e-05, "loss": 2.2486, "step": 82576 }, { "epoch": 0.52, "learning_rate": 7.189190053198734e-05, "loss": 2.2341, "step": 82584 }, { "epoch": 0.52, "learning_rate": 7.188587871252624e-05, "loss": 2.2757, "step": 82592 }, { "epoch": 0.52, "learning_rate": 7.187985659758085e-05, "loss": 2.2657, "step": 82600 }, { "epoch": 0.52, "learning_rate": 7.18738341873009e-05, "loss": 2.2527, "step": 82608 }, { "epoch": 0.52, "learning_rate": 7.18678114818361e-05, "loss": 2.262, "step": 82616 }, { "epoch": 0.52, "learning_rate": 7.186178848133618e-05, "loss": 2.2693, "step": 82624 }, { "epoch": 0.52, "learning_rate": 7.185576518595085e-05, "loss": 2.2448, "step": 82632 }, { "epoch": 0.52, "learning_rate": 7.184974159582987e-05, "loss": 2.2549, "step": 82640 }, { "epoch": 0.52, "learning_rate": 7.184371771112299e-05, "loss": 2.2588, "step": 82648 }, { "epoch": 0.52, "learning_rate": 7.183769353197998e-05, "loss": 2.2652, "step": 82656 }, { "epoch": 0.52, "learning_rate": 7.183166905855054e-05, "loss": 2.2532, "step": 82664 }, { "epoch": 0.52, "learning_rate": 7.182564429098451e-05, "loss": 2.2644, "step": 82672 }, { "epoch": 0.52, "learning_rate": 7.181961922943162e-05, "loss": 2.2583, "step": 82680 }, { "epoch": 0.52, "learning_rate": 7.18135938740417e-05, "loss": 2.2663, "step": 82688 }, { "epoch": 0.52, "learning_rate": 7.180756822496449e-05, "loss": 2.2569, "step": 82696 }, { "epoch": 0.52, "learning_rate": 7.180154228234979e-05, "loss": 2.2576, "step": 82704 }, { "epoch": 0.52, "learning_rate": 7.179551604634742e-05, "loss": 2.2575, "step": 82712 }, { "epoch": 0.52, "learning_rate": 7.178948951710724e-05, "loss": 2.2486, "step": 82720 }, { "epoch": 0.52, "learning_rate": 7.1783462694779e-05, "loss": 2.239, "step": 82728 }, { "epoch": 0.52, "learning_rate": 7.177743557951255e-05, "loss": 2.2637, "step": 82736 }, { "epoch": 0.52, "learning_rate": 7.177140817145775e-05, "loss": 2.2522, "step": 82744 }, { "epoch": 0.52, "learning_rate": 7.176538047076442e-05, "loss": 2.2419, "step": 82752 }, { "epoch": 0.52, "learning_rate": 7.175935247758242e-05, "loss": 2.252, "step": 82760 }, { "epoch": 0.52, "learning_rate": 7.175332419206157e-05, "loss": 2.2455, "step": 82768 }, { "epoch": 0.52, "learning_rate": 7.174729561435178e-05, "loss": 2.2605, "step": 82776 }, { "epoch": 0.52, "learning_rate": 7.17412667446029e-05, "loss": 2.2584, "step": 82784 }, { "epoch": 0.52, "learning_rate": 7.173523758296481e-05, "loss": 2.2553, "step": 82792 }, { "epoch": 0.52, "learning_rate": 7.17292081295874e-05, "loss": 2.25, "step": 82800 }, { "epoch": 0.52, "learning_rate": 7.172317838462054e-05, "loss": 2.2651, "step": 82808 }, { "epoch": 0.52, "learning_rate": 7.171714834821417e-05, "loss": 2.2611, "step": 82816 }, { "epoch": 0.52, "learning_rate": 7.171111802051818e-05, "loss": 2.2599, "step": 82824 }, { "epoch": 0.52, "learning_rate": 7.170508740168247e-05, "loss": 2.2501, "step": 82832 }, { "epoch": 0.52, "learning_rate": 7.1699056491857e-05, "loss": 2.2524, "step": 82840 }, { "epoch": 0.52, "learning_rate": 7.169302529119165e-05, "loss": 2.2522, "step": 82848 }, { "epoch": 0.52, "learning_rate": 7.168699379983636e-05, "loss": 2.2737, "step": 82856 }, { "epoch": 0.52, "learning_rate": 7.168096201794112e-05, "loss": 2.2611, "step": 82864 }, { "epoch": 0.52, "learning_rate": 7.167492994565586e-05, "loss": 2.2644, "step": 82872 }, { "epoch": 0.52, "learning_rate": 7.166889758313053e-05, "loss": 2.2417, "step": 82880 }, { "epoch": 0.52, "learning_rate": 7.166286493051509e-05, "loss": 2.2413, "step": 82888 }, { "epoch": 0.52, "learning_rate": 7.165683198795952e-05, "loss": 2.2536, "step": 82896 }, { "epoch": 0.52, "learning_rate": 7.16507987556138e-05, "loss": 2.2655, "step": 82904 }, { "epoch": 0.52, "learning_rate": 7.164476523362791e-05, "loss": 2.2566, "step": 82912 }, { "epoch": 0.52, "learning_rate": 7.163873142215186e-05, "loss": 2.258, "step": 82920 }, { "epoch": 0.52, "learning_rate": 7.163269732133562e-05, "loss": 2.2585, "step": 82928 }, { "epoch": 0.52, "learning_rate": 7.162666293132922e-05, "loss": 2.2676, "step": 82936 }, { "epoch": 0.52, "learning_rate": 7.162062825228268e-05, "loss": 2.2548, "step": 82944 }, { "epoch": 0.52, "learning_rate": 7.161459328434603e-05, "loss": 2.2558, "step": 82952 }, { "epoch": 0.52, "learning_rate": 7.160855802766928e-05, "loss": 2.2521, "step": 82960 }, { "epoch": 0.52, "learning_rate": 7.160252248240249e-05, "loss": 2.2601, "step": 82968 }, { "epoch": 0.52, "learning_rate": 7.159648664869568e-05, "loss": 2.2397, "step": 82976 }, { "epoch": 0.52, "learning_rate": 7.15904505266989e-05, "loss": 2.2479, "step": 82984 }, { "epoch": 0.52, "learning_rate": 7.158441411656222e-05, "loss": 2.2351, "step": 82992 }, { "epoch": 0.52, "learning_rate": 7.157837741843574e-05, "loss": 2.2545, "step": 83000 }, { "epoch": 0.52, "learning_rate": 7.157234043246946e-05, "loss": 2.2335, "step": 83008 }, { "epoch": 0.52, "learning_rate": 7.15663031588135e-05, "loss": 2.2452, "step": 83016 }, { "epoch": 0.52, "learning_rate": 7.156026559761795e-05, "loss": 2.2375, "step": 83024 }, { "epoch": 0.52, "learning_rate": 7.15542277490329e-05, "loss": 2.249, "step": 83032 }, { "epoch": 0.52, "learning_rate": 7.154818961320849e-05, "loss": 2.2578, "step": 83040 }, { "epoch": 0.52, "learning_rate": 7.154215119029475e-05, "loss": 2.2398, "step": 83048 }, { "epoch": 0.52, "learning_rate": 7.153611248044183e-05, "loss": 2.2569, "step": 83056 }, { "epoch": 0.52, "learning_rate": 7.153007348379987e-05, "loss": 2.2575, "step": 83064 }, { "epoch": 0.52, "learning_rate": 7.152403420051899e-05, "loss": 2.2509, "step": 83072 }, { "epoch": 0.52, "learning_rate": 7.151799463074936e-05, "loss": 2.2492, "step": 83080 }, { "epoch": 0.52, "learning_rate": 7.151195477464104e-05, "loss": 2.2289, "step": 83088 }, { "epoch": 0.52, "learning_rate": 7.150591463234426e-05, "loss": 2.2448, "step": 83096 }, { "epoch": 0.52, "learning_rate": 7.149987420400914e-05, "loss": 2.2501, "step": 83104 }, { "epoch": 0.52, "learning_rate": 7.149383348978587e-05, "loss": 2.2479, "step": 83112 }, { "epoch": 0.52, "learning_rate": 7.14877924898246e-05, "loss": 2.2367, "step": 83120 }, { "epoch": 0.52, "learning_rate": 7.148175120427552e-05, "loss": 2.2548, "step": 83128 }, { "epoch": 0.52, "learning_rate": 7.147570963328882e-05, "loss": 2.2445, "step": 83136 }, { "epoch": 0.52, "learning_rate": 7.146966777701469e-05, "loss": 2.2582, "step": 83144 }, { "epoch": 0.52, "learning_rate": 7.146362563560333e-05, "loss": 2.262, "step": 83152 }, { "epoch": 0.52, "learning_rate": 7.145758320920495e-05, "loss": 2.2427, "step": 83160 }, { "epoch": 0.52, "learning_rate": 7.145154049796976e-05, "loss": 2.2685, "step": 83168 }, { "epoch": 0.52, "learning_rate": 7.144549750204801e-05, "loss": 2.256, "step": 83176 }, { "epoch": 0.52, "learning_rate": 7.143945422158988e-05, "loss": 2.2506, "step": 83184 }, { "epoch": 0.52, "learning_rate": 7.143341065674567e-05, "loss": 2.264, "step": 83192 }, { "epoch": 0.52, "learning_rate": 7.142736680766555e-05, "loss": 2.2491, "step": 83200 }, { "epoch": 0.52, "learning_rate": 7.142132267449984e-05, "loss": 2.2572, "step": 83208 }, { "epoch": 0.52, "learning_rate": 7.141527825739875e-05, "loss": 2.2794, "step": 83216 }, { "epoch": 0.52, "learning_rate": 7.140923355651257e-05, "loss": 2.2724, "step": 83224 }, { "epoch": 0.52, "learning_rate": 7.140318857199155e-05, "loss": 2.263, "step": 83232 }, { "epoch": 0.52, "learning_rate": 7.1397143303986e-05, "loss": 2.262, "step": 83240 }, { "epoch": 0.52, "learning_rate": 7.139109775264617e-05, "loss": 2.2444, "step": 83248 }, { "epoch": 0.52, "learning_rate": 7.13850519181224e-05, "loss": 2.2507, "step": 83256 }, { "epoch": 0.52, "learning_rate": 7.137900580056494e-05, "loss": 2.2522, "step": 83264 }, { "epoch": 0.52, "learning_rate": 7.137295940012412e-05, "loss": 2.2545, "step": 83272 }, { "epoch": 0.52, "learning_rate": 7.136691271695024e-05, "loss": 2.2658, "step": 83280 }, { "epoch": 0.52, "learning_rate": 7.136086575119366e-05, "loss": 2.2469, "step": 83288 }, { "epoch": 0.52, "learning_rate": 7.135481850300467e-05, "loss": 2.2468, "step": 83296 }, { "epoch": 0.52, "learning_rate": 7.134877097253363e-05, "loss": 2.269, "step": 83304 }, { "epoch": 0.52, "learning_rate": 7.134272315993087e-05, "loss": 2.2697, "step": 83312 }, { "epoch": 0.52, "learning_rate": 7.133667506534672e-05, "loss": 2.2593, "step": 83320 }, { "epoch": 0.52, "learning_rate": 7.133062668893155e-05, "loss": 2.2559, "step": 83328 }, { "epoch": 0.52, "learning_rate": 7.132457803083576e-05, "loss": 2.2667, "step": 83336 }, { "epoch": 0.52, "learning_rate": 7.131852909120968e-05, "loss": 2.269, "step": 83344 }, { "epoch": 0.52, "learning_rate": 7.131247987020368e-05, "loss": 2.2502, "step": 83352 }, { "epoch": 0.52, "learning_rate": 7.130643036796818e-05, "loss": 2.2697, "step": 83360 }, { "epoch": 0.52, "learning_rate": 7.130038058465355e-05, "loss": 2.2432, "step": 83368 }, { "epoch": 0.52, "learning_rate": 7.12943305204102e-05, "loss": 2.257, "step": 83376 }, { "epoch": 0.52, "learning_rate": 7.128828017538849e-05, "loss": 2.254, "step": 83384 }, { "epoch": 0.52, "learning_rate": 7.12822295497389e-05, "loss": 2.2448, "step": 83392 }, { "epoch": 0.52, "learning_rate": 7.127617864361183e-05, "loss": 2.2589, "step": 83400 }, { "epoch": 0.52, "learning_rate": 7.127012745715766e-05, "loss": 2.2354, "step": 83408 }, { "epoch": 0.52, "learning_rate": 7.126407599052687e-05, "loss": 2.2514, "step": 83416 }, { "epoch": 0.52, "learning_rate": 7.125802424386989e-05, "loss": 2.2562, "step": 83424 }, { "epoch": 0.52, "learning_rate": 7.125197221733717e-05, "loss": 2.2517, "step": 83432 }, { "epoch": 0.52, "learning_rate": 7.124591991107914e-05, "loss": 2.26, "step": 83440 }, { "epoch": 0.52, "learning_rate": 7.123986732524628e-05, "loss": 2.2482, "step": 83448 }, { "epoch": 0.52, "learning_rate": 7.123381445998906e-05, "loss": 2.2492, "step": 83456 }, { "epoch": 0.52, "learning_rate": 7.122776131545797e-05, "loss": 2.2308, "step": 83464 }, { "epoch": 0.52, "learning_rate": 7.122170789180347e-05, "loss": 2.2531, "step": 83472 }, { "epoch": 0.52, "learning_rate": 7.121565418917604e-05, "loss": 2.2589, "step": 83480 }, { "epoch": 0.52, "learning_rate": 7.12096002077262e-05, "loss": 2.2524, "step": 83488 }, { "epoch": 0.52, "learning_rate": 7.120354594760443e-05, "loss": 2.2568, "step": 83496 }, { "epoch": 0.52, "learning_rate": 7.119749140896124e-05, "loss": 2.2542, "step": 83504 }, { "epoch": 0.52, "learning_rate": 7.119143659194718e-05, "loss": 2.2605, "step": 83512 }, { "epoch": 0.52, "learning_rate": 7.118538149671275e-05, "loss": 2.2524, "step": 83520 }, { "epoch": 0.52, "learning_rate": 7.117932612340847e-05, "loss": 2.2628, "step": 83528 }, { "epoch": 0.52, "learning_rate": 7.11732704721849e-05, "loss": 2.2435, "step": 83536 }, { "epoch": 0.52, "learning_rate": 7.116721454319256e-05, "loss": 2.2373, "step": 83544 }, { "epoch": 0.52, "learning_rate": 7.116115833658201e-05, "loss": 2.2498, "step": 83552 }, { "epoch": 0.52, "learning_rate": 7.115510185250383e-05, "loss": 2.2364, "step": 83560 }, { "epoch": 0.52, "learning_rate": 7.114904509110856e-05, "loss": 2.2681, "step": 83568 }, { "epoch": 0.52, "learning_rate": 7.114298805254675e-05, "loss": 2.2619, "step": 83576 }, { "epoch": 0.52, "learning_rate": 7.113693073696905e-05, "loss": 2.2579, "step": 83584 }, { "epoch": 0.52, "learning_rate": 7.113087314452598e-05, "loss": 2.2558, "step": 83592 }, { "epoch": 0.52, "learning_rate": 7.112481527536816e-05, "loss": 2.248, "step": 83600 }, { "epoch": 0.52, "learning_rate": 7.11187571296462e-05, "loss": 2.263, "step": 83608 }, { "epoch": 0.52, "learning_rate": 7.111269870751065e-05, "loss": 2.2614, "step": 83616 }, { "epoch": 0.52, "learning_rate": 7.11066400091122e-05, "loss": 2.2429, "step": 83624 }, { "epoch": 0.52, "learning_rate": 7.11005810346014e-05, "loss": 2.2571, "step": 83632 }, { "epoch": 0.52, "learning_rate": 7.109452178412895e-05, "loss": 2.2657, "step": 83640 }, { "epoch": 0.52, "learning_rate": 7.108846225784543e-05, "loss": 2.2684, "step": 83648 }, { "epoch": 0.52, "learning_rate": 7.108240245590147e-05, "loss": 2.2455, "step": 83656 }, { "epoch": 0.52, "learning_rate": 7.107634237844776e-05, "loss": 2.2543, "step": 83664 }, { "epoch": 0.52, "learning_rate": 7.107028202563492e-05, "loss": 2.2591, "step": 83672 }, { "epoch": 0.52, "learning_rate": 7.106422139761366e-05, "loss": 2.2517, "step": 83680 }, { "epoch": 0.52, "learning_rate": 7.10581604945346e-05, "loss": 2.2556, "step": 83688 }, { "epoch": 0.52, "learning_rate": 7.105209931654842e-05, "loss": 2.2418, "step": 83696 }, { "epoch": 0.52, "learning_rate": 7.104603786380581e-05, "loss": 2.2615, "step": 83704 }, { "epoch": 0.52, "learning_rate": 7.103997613645748e-05, "loss": 2.2365, "step": 83712 }, { "epoch": 0.52, "learning_rate": 7.103391413465408e-05, "loss": 2.2385, "step": 83720 }, { "epoch": 0.52, "learning_rate": 7.102785185854634e-05, "loss": 2.258, "step": 83728 }, { "epoch": 0.52, "learning_rate": 7.102178930828497e-05, "loss": 2.2485, "step": 83736 }, { "epoch": 0.52, "learning_rate": 7.101572648402071e-05, "loss": 2.2472, "step": 83744 }, { "epoch": 0.52, "learning_rate": 7.10096633859042e-05, "loss": 2.2491, "step": 83752 }, { "epoch": 0.52, "learning_rate": 7.100360001408625e-05, "loss": 2.2468, "step": 83760 }, { "epoch": 0.52, "learning_rate": 7.099753636871757e-05, "loss": 2.2475, "step": 83768 }, { "epoch": 0.52, "learning_rate": 7.09914724499489e-05, "loss": 2.2511, "step": 83776 }, { "epoch": 0.52, "learning_rate": 7.098540825793101e-05, "loss": 2.2716, "step": 83784 }, { "epoch": 0.52, "learning_rate": 7.097934379281461e-05, "loss": 2.2544, "step": 83792 }, { "epoch": 0.52, "learning_rate": 7.097327905475051e-05, "loss": 2.2428, "step": 83800 }, { "epoch": 0.52, "learning_rate": 7.096721404388944e-05, "loss": 2.2555, "step": 83808 }, { "epoch": 0.52, "learning_rate": 7.096114876038223e-05, "loss": 2.2446, "step": 83816 }, { "epoch": 0.52, "learning_rate": 7.09550832043796e-05, "loss": 2.2555, "step": 83824 }, { "epoch": 0.52, "learning_rate": 7.094901737603239e-05, "loss": 2.2544, "step": 83832 }, { "epoch": 0.52, "learning_rate": 7.09429512754914e-05, "loss": 2.2544, "step": 83840 }, { "epoch": 0.52, "learning_rate": 7.093688490290738e-05, "loss": 2.255, "step": 83848 }, { "epoch": 0.52, "learning_rate": 7.093081825843117e-05, "loss": 2.2317, "step": 83856 }, { "epoch": 0.52, "learning_rate": 7.092475134221361e-05, "loss": 2.2404, "step": 83864 }, { "epoch": 0.52, "learning_rate": 7.09186841544055e-05, "loss": 2.2733, "step": 83872 }, { "epoch": 0.52, "learning_rate": 7.091261669515767e-05, "loss": 2.2654, "step": 83880 }, { "epoch": 0.52, "learning_rate": 7.090654896462098e-05, "loss": 2.2284, "step": 83888 }, { "epoch": 0.52, "learning_rate": 7.090048096294626e-05, "loss": 2.2625, "step": 83896 }, { "epoch": 0.52, "learning_rate": 7.089441269028433e-05, "loss": 2.2347, "step": 83904 }, { "epoch": 0.52, "learning_rate": 7.088834414678612e-05, "loss": 2.2376, "step": 83912 }, { "epoch": 0.52, "learning_rate": 7.088227533260244e-05, "loss": 2.2321, "step": 83920 }, { "epoch": 0.52, "learning_rate": 7.087620624788416e-05, "loss": 2.254, "step": 83928 }, { "epoch": 0.52, "learning_rate": 7.087013689278219e-05, "loss": 2.2453, "step": 83936 }, { "epoch": 0.52, "learning_rate": 7.086406726744737e-05, "loss": 2.2339, "step": 83944 }, { "epoch": 0.52, "learning_rate": 7.085799737203064e-05, "loss": 2.2417, "step": 83952 }, { "epoch": 0.52, "learning_rate": 7.085192720668288e-05, "loss": 2.2462, "step": 83960 }, { "epoch": 0.52, "learning_rate": 7.084585677155498e-05, "loss": 2.2567, "step": 83968 }, { "epoch": 0.52, "learning_rate": 7.083978606679787e-05, "loss": 2.2476, "step": 83976 }, { "epoch": 0.52, "learning_rate": 7.083371509256247e-05, "loss": 2.2514, "step": 83984 }, { "epoch": 0.52, "learning_rate": 7.082764384899969e-05, "loss": 2.2555, "step": 83992 }, { "epoch": 0.53, "learning_rate": 7.082157233626046e-05, "loss": 2.2408, "step": 84000 }, { "epoch": 0.53, "learning_rate": 7.081550055449573e-05, "loss": 2.2528, "step": 84008 }, { "epoch": 0.53, "learning_rate": 7.080942850385645e-05, "loss": 2.2587, "step": 84016 }, { "epoch": 0.53, "learning_rate": 7.080335618449357e-05, "loss": 2.2437, "step": 84024 }, { "epoch": 0.53, "learning_rate": 7.079728359655804e-05, "loss": 2.2539, "step": 84032 }, { "epoch": 0.53, "learning_rate": 7.079121074020081e-05, "loss": 2.2458, "step": 84040 }, { "epoch": 0.53, "learning_rate": 7.078513761557289e-05, "loss": 2.2379, "step": 84048 }, { "epoch": 0.53, "learning_rate": 7.077906422282523e-05, "loss": 2.2446, "step": 84056 }, { "epoch": 0.53, "learning_rate": 7.077299056210884e-05, "loss": 2.2356, "step": 84064 }, { "epoch": 0.53, "learning_rate": 7.076691663357469e-05, "loss": 2.2438, "step": 84072 }, { "epoch": 0.53, "learning_rate": 7.076084243737376e-05, "loss": 2.2507, "step": 84080 }, { "epoch": 0.53, "learning_rate": 7.07547679736571e-05, "loss": 2.2628, "step": 84088 }, { "epoch": 0.53, "learning_rate": 7.07486932425757e-05, "loss": 2.2429, "step": 84096 }, { "epoch": 0.53, "learning_rate": 7.074261824428057e-05, "loss": 2.2451, "step": 84104 }, { "epoch": 0.53, "learning_rate": 7.073654297892276e-05, "loss": 2.2418, "step": 84112 }, { "epoch": 0.53, "learning_rate": 7.073046744665328e-05, "loss": 2.2519, "step": 84120 }, { "epoch": 0.53, "learning_rate": 7.072439164762317e-05, "loss": 2.2551, "step": 84128 }, { "epoch": 0.53, "learning_rate": 7.07183155819835e-05, "loss": 2.2412, "step": 84136 }, { "epoch": 0.53, "learning_rate": 7.071223924988528e-05, "loss": 2.2539, "step": 84144 }, { "epoch": 0.53, "learning_rate": 7.07061626514796e-05, "loss": 2.2493, "step": 84152 }, { "epoch": 0.53, "learning_rate": 7.070008578691751e-05, "loss": 2.2277, "step": 84160 }, { "epoch": 0.53, "learning_rate": 7.06940086563501e-05, "loss": 2.2482, "step": 84168 }, { "epoch": 0.53, "learning_rate": 7.068793125992843e-05, "loss": 2.259, "step": 84176 }, { "epoch": 0.53, "learning_rate": 7.068185359780358e-05, "loss": 2.2385, "step": 84184 }, { "epoch": 0.53, "learning_rate": 7.067577567012664e-05, "loss": 2.2575, "step": 84192 }, { "epoch": 0.53, "learning_rate": 7.066969747704874e-05, "loss": 2.2397, "step": 84200 }, { "epoch": 0.53, "learning_rate": 7.066361901872098e-05, "loss": 2.2625, "step": 84208 }, { "epoch": 0.53, "learning_rate": 7.065754029529444e-05, "loss": 2.2415, "step": 84216 }, { "epoch": 0.53, "learning_rate": 7.065146130692022e-05, "loss": 2.2456, "step": 84224 }, { "epoch": 0.53, "learning_rate": 7.064538205374953e-05, "loss": 2.2505, "step": 84232 }, { "epoch": 0.53, "learning_rate": 7.063930253593341e-05, "loss": 2.2584, "step": 84240 }, { "epoch": 0.53, "learning_rate": 7.063322275362306e-05, "loss": 2.2596, "step": 84248 }, { "epoch": 0.53, "learning_rate": 7.062714270696957e-05, "loss": 2.2395, "step": 84256 }, { "epoch": 0.53, "learning_rate": 7.062106239612414e-05, "loss": 2.2464, "step": 84264 }, { "epoch": 0.53, "learning_rate": 7.061498182123792e-05, "loss": 2.248, "step": 84272 }, { "epoch": 0.53, "learning_rate": 7.060890098246202e-05, "loss": 2.2727, "step": 84280 }, { "epoch": 0.53, "learning_rate": 7.060281987994768e-05, "loss": 2.243, "step": 84288 }, { "epoch": 0.53, "learning_rate": 7.059673851384602e-05, "loss": 2.2448, "step": 84296 }, { "epoch": 0.53, "learning_rate": 7.05906568843083e-05, "loss": 2.2532, "step": 84304 }, { "epoch": 0.53, "learning_rate": 7.058457499148563e-05, "loss": 2.2555, "step": 84312 }, { "epoch": 0.53, "learning_rate": 7.057849283552924e-05, "loss": 2.2436, "step": 84320 }, { "epoch": 0.53, "learning_rate": 7.057241041659035e-05, "loss": 2.251, "step": 84328 }, { "epoch": 0.53, "learning_rate": 7.056632773482012e-05, "loss": 2.255, "step": 84336 }, { "epoch": 0.53, "learning_rate": 7.056024479036982e-05, "loss": 2.2623, "step": 84344 }, { "epoch": 0.53, "learning_rate": 7.055416158339066e-05, "loss": 2.2664, "step": 84352 }, { "epoch": 0.53, "learning_rate": 7.054807811403384e-05, "loss": 2.2647, "step": 84360 }, { "epoch": 0.53, "learning_rate": 7.054199438245062e-05, "loss": 2.2485, "step": 84368 }, { "epoch": 0.53, "learning_rate": 7.053591038879221e-05, "loss": 2.2654, "step": 84376 }, { "epoch": 0.53, "learning_rate": 7.052982613320993e-05, "loss": 2.2678, "step": 84384 }, { "epoch": 0.53, "learning_rate": 7.052374161585495e-05, "loss": 2.2547, "step": 84392 }, { "epoch": 0.53, "learning_rate": 7.05176568368786e-05, "loss": 2.2511, "step": 84400 }, { "epoch": 0.53, "learning_rate": 7.051157179643213e-05, "loss": 2.2734, "step": 84408 }, { "epoch": 0.53, "learning_rate": 7.050548649466677e-05, "loss": 2.2698, "step": 84416 }, { "epoch": 0.53, "learning_rate": 7.049940093173389e-05, "loss": 2.2446, "step": 84424 }, { "epoch": 0.53, "learning_rate": 7.049331510778468e-05, "loss": 2.2431, "step": 84432 }, { "epoch": 0.53, "learning_rate": 7.048722902297049e-05, "loss": 2.2504, "step": 84440 }, { "epoch": 0.53, "learning_rate": 7.048114267744262e-05, "loss": 2.2524, "step": 84448 }, { "epoch": 0.53, "learning_rate": 7.047505607135235e-05, "loss": 2.2543, "step": 84456 }, { "epoch": 0.53, "learning_rate": 7.0468969204851e-05, "loss": 2.26, "step": 84464 }, { "epoch": 0.53, "learning_rate": 7.046288207808991e-05, "loss": 2.2542, "step": 84472 }, { "epoch": 0.53, "learning_rate": 7.045679469122041e-05, "loss": 2.2705, "step": 84480 }, { "epoch": 0.53, "learning_rate": 7.045070704439385e-05, "loss": 2.2524, "step": 84488 }, { "epoch": 0.53, "learning_rate": 7.044461913776148e-05, "loss": 2.2632, "step": 84496 }, { "epoch": 0.53, "learning_rate": 7.043853097147475e-05, "loss": 2.256, "step": 84504 }, { "epoch": 0.53, "learning_rate": 7.043244254568495e-05, "loss": 2.2507, "step": 84512 }, { "epoch": 0.53, "learning_rate": 7.042635386054345e-05, "loss": 2.2633, "step": 84520 }, { "epoch": 0.53, "learning_rate": 7.042026491620164e-05, "loss": 2.2486, "step": 84528 }, { "epoch": 0.53, "learning_rate": 7.041417571281089e-05, "loss": 2.2547, "step": 84536 }, { "epoch": 0.53, "learning_rate": 7.040808625052253e-05, "loss": 2.2653, "step": 84544 }, { "epoch": 0.53, "learning_rate": 7.0401996529488e-05, "loss": 2.2391, "step": 84552 }, { "epoch": 0.53, "learning_rate": 7.039590654985867e-05, "loss": 2.2689, "step": 84560 }, { "epoch": 0.53, "learning_rate": 7.03898163117859e-05, "loss": 2.2586, "step": 84568 }, { "epoch": 0.53, "learning_rate": 7.038372581542116e-05, "loss": 2.2485, "step": 84576 }, { "epoch": 0.53, "learning_rate": 7.037763506091584e-05, "loss": 2.2616, "step": 84584 }, { "epoch": 0.53, "learning_rate": 7.037154404842133e-05, "loss": 2.2692, "step": 84592 }, { "epoch": 0.53, "learning_rate": 7.036545277808908e-05, "loss": 2.2605, "step": 84600 }, { "epoch": 0.53, "learning_rate": 7.03593612500705e-05, "loss": 2.2522, "step": 84608 }, { "epoch": 0.53, "learning_rate": 7.035326946451706e-05, "loss": 2.2671, "step": 84616 }, { "epoch": 0.53, "learning_rate": 7.034717742158015e-05, "loss": 2.2599, "step": 84624 }, { "epoch": 0.53, "learning_rate": 7.034108512141127e-05, "loss": 2.2649, "step": 84632 }, { "epoch": 0.53, "learning_rate": 7.033499256416185e-05, "loss": 2.253, "step": 84640 }, { "epoch": 0.53, "learning_rate": 7.032889974998336e-05, "loss": 2.2673, "step": 84648 }, { "epoch": 0.53, "learning_rate": 7.032280667902724e-05, "loss": 2.2588, "step": 84656 }, { "epoch": 0.53, "learning_rate": 7.031671335144501e-05, "loss": 2.2557, "step": 84664 }, { "epoch": 0.53, "learning_rate": 7.031061976738814e-05, "loss": 2.2702, "step": 84672 }, { "epoch": 0.53, "learning_rate": 7.030452592700806e-05, "loss": 2.2631, "step": 84680 }, { "epoch": 0.53, "learning_rate": 7.029843183045635e-05, "loss": 2.2538, "step": 84688 }, { "epoch": 0.53, "learning_rate": 7.029233747788446e-05, "loss": 2.2537, "step": 84696 }, { "epoch": 0.53, "learning_rate": 7.02862428694439e-05, "loss": 2.2692, "step": 84704 }, { "epoch": 0.53, "learning_rate": 7.028014800528619e-05, "loss": 2.2571, "step": 84712 }, { "epoch": 0.53, "learning_rate": 7.027405288556286e-05, "loss": 2.26, "step": 84720 }, { "epoch": 0.53, "learning_rate": 7.026795751042541e-05, "loss": 2.2572, "step": 84728 }, { "epoch": 0.53, "learning_rate": 7.026186188002537e-05, "loss": 2.2563, "step": 84736 }, { "epoch": 0.53, "learning_rate": 7.025576599451432e-05, "loss": 2.27, "step": 84744 }, { "epoch": 0.53, "learning_rate": 7.024966985404376e-05, "loss": 2.2609, "step": 84752 }, { "epoch": 0.53, "learning_rate": 7.024357345876527e-05, "loss": 2.2706, "step": 84760 }, { "epoch": 0.53, "learning_rate": 7.023747680883037e-05, "loss": 2.2646, "step": 84768 }, { "epoch": 0.53, "learning_rate": 7.023137990439066e-05, "loss": 2.265, "step": 84776 }, { "epoch": 0.53, "learning_rate": 7.02252827455977e-05, "loss": 2.272, "step": 84784 }, { "epoch": 0.53, "learning_rate": 7.021918533260308e-05, "loss": 2.2684, "step": 84792 }, { "epoch": 0.53, "learning_rate": 7.021308766555834e-05, "loss": 2.2523, "step": 84800 }, { "epoch": 0.53, "learning_rate": 7.020698974461511e-05, "loss": 2.2656, "step": 84808 }, { "epoch": 0.53, "learning_rate": 7.020089156992497e-05, "loss": 2.2766, "step": 84816 }, { "epoch": 0.53, "learning_rate": 7.019479314163951e-05, "loss": 2.264, "step": 84824 }, { "epoch": 0.53, "learning_rate": 7.018869445991037e-05, "loss": 2.2779, "step": 84832 }, { "epoch": 0.53, "learning_rate": 7.01825955248891e-05, "loss": 2.2599, "step": 84840 }, { "epoch": 0.53, "learning_rate": 7.01764963367274e-05, "loss": 2.2503, "step": 84848 }, { "epoch": 0.53, "learning_rate": 7.017039689557686e-05, "loss": 2.2519, "step": 84856 }, { "epoch": 0.53, "learning_rate": 7.01642972015891e-05, "loss": 2.2594, "step": 84864 }, { "epoch": 0.53, "learning_rate": 7.015819725491577e-05, "loss": 2.2694, "step": 84872 }, { "epoch": 0.53, "learning_rate": 7.015209705570851e-05, "loss": 2.2895, "step": 84880 }, { "epoch": 0.53, "learning_rate": 7.0145996604119e-05, "loss": 2.2595, "step": 84888 }, { "epoch": 0.53, "learning_rate": 7.013989590029885e-05, "loss": 2.267, "step": 84896 }, { "epoch": 0.53, "learning_rate": 7.013379494439978e-05, "loss": 2.2637, "step": 84904 }, { "epoch": 0.53, "learning_rate": 7.012769373657342e-05, "loss": 2.2559, "step": 84912 }, { "epoch": 0.53, "learning_rate": 7.012159227697143e-05, "loss": 2.2916, "step": 84920 }, { "epoch": 0.53, "learning_rate": 7.011549056574555e-05, "loss": 2.2583, "step": 84928 }, { "epoch": 0.53, "learning_rate": 7.010938860304743e-05, "loss": 2.2785, "step": 84936 }, { "epoch": 0.53, "learning_rate": 7.010328638902876e-05, "loss": 2.2617, "step": 84944 }, { "epoch": 0.53, "learning_rate": 7.00971839238413e-05, "loss": 2.2486, "step": 84952 }, { "epoch": 0.53, "learning_rate": 7.009108120763667e-05, "loss": 2.2561, "step": 84960 }, { "epoch": 0.53, "learning_rate": 7.008497824056665e-05, "loss": 2.2801, "step": 84968 }, { "epoch": 0.53, "learning_rate": 7.007887502278297e-05, "loss": 2.2679, "step": 84976 }, { "epoch": 0.53, "learning_rate": 7.007277155443727e-05, "loss": 2.2672, "step": 84984 }, { "epoch": 0.53, "learning_rate": 7.006666783568137e-05, "loss": 2.2623, "step": 84992 }, { "epoch": 0.53, "learning_rate": 7.006056386666694e-05, "loss": 2.2533, "step": 85000 }, { "epoch": 0.53, "learning_rate": 7.005445964754582e-05, "loss": 2.2587, "step": 85008 }, { "epoch": 0.53, "learning_rate": 7.004835517846969e-05, "loss": 2.2697, "step": 85016 }, { "epoch": 0.53, "learning_rate": 7.00422504595903e-05, "loss": 2.2482, "step": 85024 }, { "epoch": 0.53, "learning_rate": 7.003614549105946e-05, "loss": 2.2414, "step": 85032 }, { "epoch": 0.53, "learning_rate": 7.003004027302888e-05, "loss": 2.2542, "step": 85040 }, { "epoch": 0.53, "learning_rate": 7.002393480565041e-05, "loss": 2.266, "step": 85048 }, { "epoch": 0.53, "learning_rate": 7.00178290890758e-05, "loss": 2.2651, "step": 85056 }, { "epoch": 0.53, "learning_rate": 7.00117231234568e-05, "loss": 2.2467, "step": 85064 }, { "epoch": 0.53, "learning_rate": 7.000561690894527e-05, "loss": 2.2784, "step": 85072 }, { "epoch": 0.53, "learning_rate": 6.999951044569298e-05, "loss": 2.2382, "step": 85080 }, { "epoch": 0.53, "learning_rate": 6.999340373385172e-05, "loss": 2.2536, "step": 85088 }, { "epoch": 0.53, "learning_rate": 6.998729677357332e-05, "loss": 2.2561, "step": 85096 }, { "epoch": 0.53, "learning_rate": 6.998118956500962e-05, "loss": 2.2468, "step": 85104 }, { "epoch": 0.53, "learning_rate": 6.997508210831242e-05, "loss": 2.259, "step": 85112 }, { "epoch": 0.53, "learning_rate": 6.996897440363356e-05, "loss": 2.2539, "step": 85120 }, { "epoch": 0.53, "learning_rate": 6.996286645112488e-05, "loss": 2.2511, "step": 85128 }, { "epoch": 0.53, "learning_rate": 6.995675825093821e-05, "loss": 2.2517, "step": 85136 }, { "epoch": 0.53, "learning_rate": 6.995064980322543e-05, "loss": 2.258, "step": 85144 }, { "epoch": 0.53, "learning_rate": 6.994454110813838e-05, "loss": 2.2453, "step": 85152 }, { "epoch": 0.53, "learning_rate": 6.993843216582891e-05, "loss": 2.2408, "step": 85160 }, { "epoch": 0.53, "learning_rate": 6.993232297644891e-05, "loss": 2.2653, "step": 85168 }, { "epoch": 0.53, "learning_rate": 6.992621354015024e-05, "loss": 2.2579, "step": 85176 }, { "epoch": 0.53, "learning_rate": 6.992010385708478e-05, "loss": 2.2491, "step": 85184 }, { "epoch": 0.53, "learning_rate": 6.991399392740446e-05, "loss": 2.251, "step": 85192 }, { "epoch": 0.53, "learning_rate": 6.990788375126109e-05, "loss": 2.2546, "step": 85200 }, { "epoch": 0.53, "learning_rate": 6.990177332880665e-05, "loss": 2.2506, "step": 85208 }, { "epoch": 0.53, "learning_rate": 6.9895662660193e-05, "loss": 2.2566, "step": 85216 }, { "epoch": 0.53, "learning_rate": 6.988955174557208e-05, "loss": 2.2691, "step": 85224 }, { "epoch": 0.53, "learning_rate": 6.98834405850958e-05, "loss": 2.2405, "step": 85232 }, { "epoch": 0.53, "learning_rate": 6.987732917891605e-05, "loss": 2.2535, "step": 85240 }, { "epoch": 0.53, "learning_rate": 6.987121752718479e-05, "loss": 2.2466, "step": 85248 }, { "epoch": 0.53, "learning_rate": 6.986510563005398e-05, "loss": 2.2283, "step": 85256 }, { "epoch": 0.53, "learning_rate": 6.985899348767553e-05, "loss": 2.2585, "step": 85264 }, { "epoch": 0.53, "learning_rate": 6.985288110020138e-05, "loss": 2.2503, "step": 85272 }, { "epoch": 0.53, "learning_rate": 6.98467684677835e-05, "loss": 2.2437, "step": 85280 }, { "epoch": 0.53, "learning_rate": 6.984065559057389e-05, "loss": 2.2509, "step": 85288 }, { "epoch": 0.53, "learning_rate": 6.983454246872444e-05, "loss": 2.2397, "step": 85296 }, { "epoch": 0.53, "learning_rate": 6.982842910238718e-05, "loss": 2.2499, "step": 85304 }, { "epoch": 0.53, "learning_rate": 6.982231549171405e-05, "loss": 2.2451, "step": 85312 }, { "epoch": 0.53, "learning_rate": 6.981620163685707e-05, "loss": 2.2509, "step": 85320 }, { "epoch": 0.53, "learning_rate": 6.98100875379682e-05, "loss": 2.2524, "step": 85328 }, { "epoch": 0.53, "learning_rate": 6.980397319519947e-05, "loss": 2.25, "step": 85336 }, { "epoch": 0.53, "learning_rate": 6.979785860870288e-05, "loss": 2.2464, "step": 85344 }, { "epoch": 0.53, "learning_rate": 6.979174377863038e-05, "loss": 2.2609, "step": 85352 }, { "epoch": 0.53, "learning_rate": 6.978562870513408e-05, "loss": 2.2505, "step": 85360 }, { "epoch": 0.53, "learning_rate": 6.977951338836591e-05, "loss": 2.2403, "step": 85368 }, { "epoch": 0.53, "learning_rate": 6.977339782847796e-05, "loss": 2.2497, "step": 85376 }, { "epoch": 0.53, "learning_rate": 6.976728202562225e-05, "loss": 2.2443, "step": 85384 }, { "epoch": 0.53, "learning_rate": 6.976116597995081e-05, "loss": 2.2443, "step": 85392 }, { "epoch": 0.53, "learning_rate": 6.975504969161568e-05, "loss": 2.2356, "step": 85400 }, { "epoch": 0.53, "learning_rate": 6.974893316076891e-05, "loss": 2.2571, "step": 85408 }, { "epoch": 0.53, "learning_rate": 6.97428163875626e-05, "loss": 2.2249, "step": 85416 }, { "epoch": 0.53, "learning_rate": 6.973669937214877e-05, "loss": 2.2403, "step": 85424 }, { "epoch": 0.53, "learning_rate": 6.973058211467948e-05, "loss": 2.2618, "step": 85432 }, { "epoch": 0.53, "learning_rate": 6.972446461530685e-05, "loss": 2.2554, "step": 85440 }, { "epoch": 0.53, "learning_rate": 6.971834687418293e-05, "loss": 2.2349, "step": 85448 }, { "epoch": 0.53, "learning_rate": 6.971222889145984e-05, "loss": 2.2491, "step": 85456 }, { "epoch": 0.53, "learning_rate": 6.970611066728961e-05, "loss": 2.2639, "step": 85464 }, { "epoch": 0.53, "learning_rate": 6.969999220182439e-05, "loss": 2.2479, "step": 85472 }, { "epoch": 0.53, "learning_rate": 6.96938734952163e-05, "loss": 2.2498, "step": 85480 }, { "epoch": 0.53, "learning_rate": 6.96877545476174e-05, "loss": 2.2486, "step": 85488 }, { "epoch": 0.53, "learning_rate": 6.968163535917985e-05, "loss": 2.2561, "step": 85496 }, { "epoch": 0.53, "learning_rate": 6.967551593005574e-05, "loss": 2.2497, "step": 85504 }, { "epoch": 0.53, "learning_rate": 6.966939626039723e-05, "loss": 2.2605, "step": 85512 }, { "epoch": 0.53, "learning_rate": 6.966327635035646e-05, "loss": 2.2325, "step": 85520 }, { "epoch": 0.53, "learning_rate": 6.965715620008553e-05, "loss": 2.2499, "step": 85528 }, { "epoch": 0.53, "learning_rate": 6.965103580973665e-05, "loss": 2.2493, "step": 85536 }, { "epoch": 0.53, "learning_rate": 6.96449151794619e-05, "loss": 2.2485, "step": 85544 }, { "epoch": 0.53, "learning_rate": 6.963879430941349e-05, "loss": 2.2778, "step": 85552 }, { "epoch": 0.53, "learning_rate": 6.963267319974356e-05, "loss": 2.2639, "step": 85560 }, { "epoch": 0.53, "learning_rate": 6.96265518506043e-05, "loss": 2.2475, "step": 85568 }, { "epoch": 0.53, "learning_rate": 6.962043026214789e-05, "loss": 2.2642, "step": 85576 }, { "epoch": 0.53, "learning_rate": 6.96143084345265e-05, "loss": 2.2556, "step": 85584 }, { "epoch": 0.53, "learning_rate": 6.960818636789233e-05, "loss": 2.2386, "step": 85592 }, { "epoch": 0.54, "learning_rate": 6.960206406239756e-05, "loss": 2.2641, "step": 85600 }, { "epoch": 0.54, "learning_rate": 6.95959415181944e-05, "loss": 2.2567, "step": 85608 }, { "epoch": 0.54, "learning_rate": 6.958981873543507e-05, "loss": 2.268, "step": 85616 }, { "epoch": 0.54, "learning_rate": 6.958369571427174e-05, "loss": 2.2621, "step": 85624 }, { "epoch": 0.54, "learning_rate": 6.957757245485669e-05, "loss": 2.2506, "step": 85632 }, { "epoch": 0.54, "learning_rate": 6.957144895734212e-05, "loss": 2.2544, "step": 85640 }, { "epoch": 0.54, "learning_rate": 6.956532522188022e-05, "loss": 2.2599, "step": 85648 }, { "epoch": 0.54, "learning_rate": 6.955920124862328e-05, "loss": 2.2657, "step": 85656 }, { "epoch": 0.54, "learning_rate": 6.955307703772352e-05, "loss": 2.2414, "step": 85664 }, { "epoch": 0.54, "learning_rate": 6.954695258933321e-05, "loss": 2.2801, "step": 85672 }, { "epoch": 0.54, "learning_rate": 6.954082790360456e-05, "loss": 2.2534, "step": 85680 }, { "epoch": 0.54, "learning_rate": 6.953470298068988e-05, "loss": 2.2643, "step": 85688 }, { "epoch": 0.54, "learning_rate": 6.95285778207414e-05, "loss": 2.253, "step": 85696 }, { "epoch": 0.54, "learning_rate": 6.952245242391142e-05, "loss": 2.251, "step": 85704 }, { "epoch": 0.54, "learning_rate": 6.95163267903522e-05, "loss": 2.2628, "step": 85712 }, { "epoch": 0.54, "learning_rate": 6.951020092021603e-05, "loss": 2.2504, "step": 85720 }, { "epoch": 0.54, "learning_rate": 6.95040748136552e-05, "loss": 2.2648, "step": 85728 }, { "epoch": 0.54, "learning_rate": 6.9497948470822e-05, "loss": 2.2517, "step": 85736 }, { "epoch": 0.54, "learning_rate": 6.949182189186871e-05, "loss": 2.2465, "step": 85744 }, { "epoch": 0.54, "learning_rate": 6.948569507694769e-05, "loss": 2.2647, "step": 85752 }, { "epoch": 0.54, "learning_rate": 6.947956802621122e-05, "loss": 2.245, "step": 85760 }, { "epoch": 0.54, "learning_rate": 6.947344073981163e-05, "loss": 2.2408, "step": 85768 }, { "epoch": 0.54, "learning_rate": 6.946731321790123e-05, "loss": 2.2398, "step": 85776 }, { "epoch": 0.54, "learning_rate": 6.946118546063237e-05, "loss": 2.2501, "step": 85784 }, { "epoch": 0.54, "learning_rate": 6.94550574681574e-05, "loss": 2.2558, "step": 85792 }, { "epoch": 0.54, "learning_rate": 6.944892924062861e-05, "loss": 2.2527, "step": 85800 }, { "epoch": 0.54, "learning_rate": 6.944280077819838e-05, "loss": 2.2496, "step": 85808 }, { "epoch": 0.54, "learning_rate": 6.943667208101907e-05, "loss": 2.2476, "step": 85816 }, { "epoch": 0.54, "learning_rate": 6.943054314924303e-05, "loss": 2.2456, "step": 85824 }, { "epoch": 0.54, "learning_rate": 6.942441398302264e-05, "loss": 2.2518, "step": 85832 }, { "epoch": 0.54, "learning_rate": 6.941828458251023e-05, "loss": 2.2498, "step": 85840 }, { "epoch": 0.54, "learning_rate": 6.941215494785825e-05, "loss": 2.2535, "step": 85848 }, { "epoch": 0.54, "learning_rate": 6.940602507921902e-05, "loss": 2.2658, "step": 85856 }, { "epoch": 0.54, "learning_rate": 6.939989497674495e-05, "loss": 2.2591, "step": 85864 }, { "epoch": 0.54, "learning_rate": 6.939376464058844e-05, "loss": 2.2579, "step": 85872 }, { "epoch": 0.54, "learning_rate": 6.938763407090188e-05, "loss": 2.2475, "step": 85880 }, { "epoch": 0.54, "learning_rate": 6.93815032678377e-05, "loss": 2.2563, "step": 85888 }, { "epoch": 0.54, "learning_rate": 6.937537223154828e-05, "loss": 2.2421, "step": 85896 }, { "epoch": 0.54, "learning_rate": 6.936924096218607e-05, "loss": 2.253, "step": 85904 }, { "epoch": 0.54, "learning_rate": 6.936310945990347e-05, "loss": 2.2453, "step": 85912 }, { "epoch": 0.54, "learning_rate": 6.935697772485292e-05, "loss": 2.2574, "step": 85920 }, { "epoch": 0.54, "learning_rate": 6.935084575718685e-05, "loss": 2.2359, "step": 85928 }, { "epoch": 0.54, "learning_rate": 6.934471355705771e-05, "loss": 2.2653, "step": 85936 }, { "epoch": 0.54, "learning_rate": 6.933858112461794e-05, "loss": 2.2693, "step": 85944 }, { "epoch": 0.54, "learning_rate": 6.933244846002001e-05, "loss": 2.2528, "step": 85952 }, { "epoch": 0.54, "learning_rate": 6.932631556341635e-05, "loss": 2.2348, "step": 85960 }, { "epoch": 0.54, "learning_rate": 6.932018243495944e-05, "loss": 2.2594, "step": 85968 }, { "epoch": 0.54, "learning_rate": 6.931404907480173e-05, "loss": 2.2535, "step": 85976 }, { "epoch": 0.54, "learning_rate": 6.930791548309574e-05, "loss": 2.2578, "step": 85984 }, { "epoch": 0.54, "learning_rate": 6.930178165999393e-05, "loss": 2.2678, "step": 85992 }, { "epoch": 0.54, "learning_rate": 6.929564760564875e-05, "loss": 2.249, "step": 86000 }, { "epoch": 0.54, "learning_rate": 6.928951332021276e-05, "loss": 2.2441, "step": 86008 }, { "epoch": 0.54, "learning_rate": 6.928337880383842e-05, "loss": 2.2651, "step": 86016 }, { "epoch": 0.54, "learning_rate": 6.927724405667824e-05, "loss": 2.2483, "step": 86024 }, { "epoch": 0.54, "learning_rate": 6.927110907888473e-05, "loss": 2.2611, "step": 86032 }, { "epoch": 0.54, "learning_rate": 6.926497387061042e-05, "loss": 2.2646, "step": 86040 }, { "epoch": 0.54, "learning_rate": 6.92588384320078e-05, "loss": 2.2505, "step": 86048 }, { "epoch": 0.54, "learning_rate": 6.925270276322941e-05, "loss": 2.2559, "step": 86056 }, { "epoch": 0.54, "learning_rate": 6.924656686442783e-05, "loss": 2.2602, "step": 86064 }, { "epoch": 0.54, "learning_rate": 6.924043073575554e-05, "loss": 2.2747, "step": 86072 }, { "epoch": 0.54, "learning_rate": 6.92342943773651e-05, "loss": 2.2624, "step": 86080 }, { "epoch": 0.54, "learning_rate": 6.922815778940907e-05, "loss": 2.2588, "step": 86088 }, { "epoch": 0.54, "learning_rate": 6.922202097204e-05, "loss": 2.2466, "step": 86096 }, { "epoch": 0.54, "learning_rate": 6.921588392541047e-05, "loss": 2.2552, "step": 86104 }, { "epoch": 0.54, "learning_rate": 6.920974664967302e-05, "loss": 2.2554, "step": 86112 }, { "epoch": 0.54, "learning_rate": 6.92036091449802e-05, "loss": 2.262, "step": 86120 }, { "epoch": 0.54, "learning_rate": 6.919747141148467e-05, "loss": 2.2657, "step": 86128 }, { "epoch": 0.54, "learning_rate": 6.919133344933896e-05, "loss": 2.263, "step": 86136 }, { "epoch": 0.54, "learning_rate": 6.918519525869567e-05, "loss": 2.2634, "step": 86144 }, { "epoch": 0.54, "learning_rate": 6.917905683970738e-05, "loss": 2.2628, "step": 86152 }, { "epoch": 0.54, "learning_rate": 6.917291819252671e-05, "loss": 2.2493, "step": 86160 }, { "epoch": 0.54, "learning_rate": 6.916677931730628e-05, "loss": 2.2679, "step": 86168 }, { "epoch": 0.54, "learning_rate": 6.916064021419868e-05, "loss": 2.2683, "step": 86176 }, { "epoch": 0.54, "learning_rate": 6.915450088335653e-05, "loss": 2.2533, "step": 86184 }, { "epoch": 0.54, "learning_rate": 6.914836132493247e-05, "loss": 2.2612, "step": 86192 }, { "epoch": 0.54, "learning_rate": 6.914222153907912e-05, "loss": 2.2513, "step": 86200 }, { "epoch": 0.54, "learning_rate": 6.913608152594911e-05, "loss": 2.2554, "step": 86208 }, { "epoch": 0.54, "learning_rate": 6.912994128569508e-05, "loss": 2.2486, "step": 86216 }, { "epoch": 0.54, "learning_rate": 6.912380081846972e-05, "loss": 2.2574, "step": 86224 }, { "epoch": 0.54, "learning_rate": 6.911766012442562e-05, "loss": 2.2671, "step": 86232 }, { "epoch": 0.54, "learning_rate": 6.911151920371547e-05, "loss": 2.2621, "step": 86240 }, { "epoch": 0.54, "learning_rate": 6.910537805649194e-05, "loss": 2.2553, "step": 86248 }, { "epoch": 0.54, "learning_rate": 6.909923668290767e-05, "loss": 2.2658, "step": 86256 }, { "epoch": 0.54, "learning_rate": 6.909309508311538e-05, "loss": 2.2468, "step": 86264 }, { "epoch": 0.54, "learning_rate": 6.90869532572677e-05, "loss": 2.2458, "step": 86272 }, { "epoch": 0.54, "learning_rate": 6.908081120551737e-05, "loss": 2.2633, "step": 86280 }, { "epoch": 0.54, "learning_rate": 6.907466892801703e-05, "loss": 2.2664, "step": 86288 }, { "epoch": 0.54, "learning_rate": 6.906852642491941e-05, "loss": 2.2457, "step": 86296 }, { "epoch": 0.54, "learning_rate": 6.906238369637721e-05, "loss": 2.2417, "step": 86304 }, { "epoch": 0.54, "learning_rate": 6.905624074254313e-05, "loss": 2.2494, "step": 86312 }, { "epoch": 0.54, "learning_rate": 6.90500975635699e-05, "loss": 2.2431, "step": 86320 }, { "epoch": 0.54, "learning_rate": 6.904395415961022e-05, "loss": 2.2505, "step": 86328 }, { "epoch": 0.54, "learning_rate": 6.903781053081682e-05, "loss": 2.2415, "step": 86336 }, { "epoch": 0.54, "learning_rate": 6.903166667734244e-05, "loss": 2.2583, "step": 86344 }, { "epoch": 0.54, "learning_rate": 6.902552259933983e-05, "loss": 2.2459, "step": 86352 }, { "epoch": 0.54, "learning_rate": 6.90193782969617e-05, "loss": 2.2451, "step": 86360 }, { "epoch": 0.54, "learning_rate": 6.90132337703608e-05, "loss": 2.2529, "step": 86368 }, { "epoch": 0.54, "learning_rate": 6.90070890196899e-05, "loss": 2.2494, "step": 86376 }, { "epoch": 0.54, "learning_rate": 6.900094404510179e-05, "loss": 2.2391, "step": 86384 }, { "epoch": 0.54, "learning_rate": 6.899479884674918e-05, "loss": 2.2596, "step": 86392 }, { "epoch": 0.54, "learning_rate": 6.898865342478484e-05, "loss": 2.2585, "step": 86400 }, { "epoch": 0.54, "learning_rate": 6.898250777936159e-05, "loss": 2.2482, "step": 86408 }, { "epoch": 0.54, "learning_rate": 6.89763619106322e-05, "loss": 2.2564, "step": 86416 }, { "epoch": 0.54, "learning_rate": 6.897021581874943e-05, "loss": 2.2446, "step": 86424 }, { "epoch": 0.54, "learning_rate": 6.89640695038661e-05, "loss": 2.2573, "step": 86432 }, { "epoch": 0.54, "learning_rate": 6.895792296613498e-05, "loss": 2.2605, "step": 86440 }, { "epoch": 0.54, "learning_rate": 6.895177620570889e-05, "loss": 2.2488, "step": 86448 }, { "epoch": 0.54, "learning_rate": 6.894562922274065e-05, "loss": 2.2668, "step": 86456 }, { "epoch": 0.54, "learning_rate": 6.893948201738305e-05, "loss": 2.2546, "step": 86464 }, { "epoch": 0.54, "learning_rate": 6.893333458978894e-05, "loss": 2.2544, "step": 86472 }, { "epoch": 0.54, "learning_rate": 6.892718694011114e-05, "loss": 2.2479, "step": 86480 }, { "epoch": 0.54, "learning_rate": 6.892103906850245e-05, "loss": 2.2491, "step": 86488 }, { "epoch": 0.54, "learning_rate": 6.891489097511572e-05, "loss": 2.2567, "step": 86496 }, { "epoch": 0.54, "learning_rate": 6.890874266010381e-05, "loss": 2.2584, "step": 86504 }, { "epoch": 0.54, "learning_rate": 6.890259412361956e-05, "loss": 2.2493, "step": 86512 }, { "epoch": 0.54, "learning_rate": 6.889644536581583e-05, "loss": 2.2556, "step": 86520 }, { "epoch": 0.54, "learning_rate": 6.889029638684546e-05, "loss": 2.2456, "step": 86528 }, { "epoch": 0.54, "learning_rate": 6.888414718686133e-05, "loss": 2.26, "step": 86536 }, { "epoch": 0.54, "learning_rate": 6.88779977660163e-05, "loss": 2.2661, "step": 86544 }, { "epoch": 0.54, "learning_rate": 6.887184812446325e-05, "loss": 2.265, "step": 86552 }, { "epoch": 0.54, "learning_rate": 6.886569826235507e-05, "loss": 2.2602, "step": 86560 }, { "epoch": 0.54, "learning_rate": 6.885954817984462e-05, "loss": 2.2508, "step": 86568 }, { "epoch": 0.54, "learning_rate": 6.885339787708482e-05, "loss": 2.2718, "step": 86576 }, { "epoch": 0.54, "learning_rate": 6.884724735422854e-05, "loss": 2.2637, "step": 86584 }, { "epoch": 0.54, "learning_rate": 6.884109661142871e-05, "loss": 2.2613, "step": 86592 }, { "epoch": 0.54, "learning_rate": 6.883494564883823e-05, "loss": 2.2637, "step": 86600 }, { "epoch": 0.54, "learning_rate": 6.882879446661001e-05, "loss": 2.2509, "step": 86608 }, { "epoch": 0.54, "learning_rate": 6.882264306489696e-05, "loss": 2.2473, "step": 86616 }, { "epoch": 0.54, "learning_rate": 6.881649144385202e-05, "loss": 2.2441, "step": 86624 }, { "epoch": 0.54, "learning_rate": 6.881033960362811e-05, "loss": 2.2658, "step": 86632 }, { "epoch": 0.54, "learning_rate": 6.880418754437817e-05, "loss": 2.25, "step": 86640 }, { "epoch": 0.54, "learning_rate": 6.879803526625514e-05, "loss": 2.2593, "step": 86648 }, { "epoch": 0.54, "learning_rate": 6.879188276941197e-05, "loss": 2.2412, "step": 86656 }, { "epoch": 0.54, "learning_rate": 6.87857300540016e-05, "loss": 2.2632, "step": 86664 }, { "epoch": 0.54, "learning_rate": 6.877957712017699e-05, "loss": 2.2218, "step": 86672 }, { "epoch": 0.54, "learning_rate": 6.877342396809112e-05, "loss": 2.2558, "step": 86680 }, { "epoch": 0.54, "learning_rate": 6.876727059789694e-05, "loss": 2.2527, "step": 86688 }, { "epoch": 0.54, "learning_rate": 6.876111700974743e-05, "loss": 2.2569, "step": 86696 }, { "epoch": 0.54, "learning_rate": 6.875496320379557e-05, "loss": 2.2607, "step": 86704 }, { "epoch": 0.54, "learning_rate": 6.874880918019435e-05, "loss": 2.226, "step": 86712 }, { "epoch": 0.54, "learning_rate": 6.874265493909674e-05, "loss": 2.2544, "step": 86720 }, { "epoch": 0.54, "learning_rate": 6.873650048065577e-05, "loss": 2.2478, "step": 86728 }, { "epoch": 0.54, "learning_rate": 6.873034580502437e-05, "loss": 2.2394, "step": 86736 }, { "epoch": 0.54, "learning_rate": 6.872419091235564e-05, "loss": 2.2506, "step": 86744 }, { "epoch": 0.54, "learning_rate": 6.871803580280252e-05, "loss": 2.2536, "step": 86752 }, { "epoch": 0.54, "learning_rate": 6.871188047651807e-05, "loss": 2.2457, "step": 86760 }, { "epoch": 0.54, "learning_rate": 6.870572493365527e-05, "loss": 2.253, "step": 86768 }, { "epoch": 0.54, "learning_rate": 6.86995691743672e-05, "loss": 2.255, "step": 86776 }, { "epoch": 0.54, "learning_rate": 6.869341319880685e-05, "loss": 2.2341, "step": 86784 }, { "epoch": 0.54, "learning_rate": 6.868725700712727e-05, "loss": 2.2402, "step": 86792 }, { "epoch": 0.54, "learning_rate": 6.86811005994815e-05, "loss": 2.2486, "step": 86800 }, { "epoch": 0.54, "learning_rate": 6.867494397602261e-05, "loss": 2.2389, "step": 86808 }, { "epoch": 0.54, "learning_rate": 6.866878713690363e-05, "loss": 2.2519, "step": 86816 }, { "epoch": 0.54, "learning_rate": 6.866263008227764e-05, "loss": 2.2613, "step": 86824 }, { "epoch": 0.54, "learning_rate": 6.865647281229768e-05, "loss": 2.2289, "step": 86832 }, { "epoch": 0.54, "learning_rate": 6.865031532711684e-05, "loss": 2.2466, "step": 86840 }, { "epoch": 0.54, "learning_rate": 6.864415762688819e-05, "loss": 2.2364, "step": 86848 }, { "epoch": 0.54, "learning_rate": 6.863799971176481e-05, "loss": 2.2486, "step": 86856 }, { "epoch": 0.54, "learning_rate": 6.863184158189979e-05, "loss": 2.2349, "step": 86864 }, { "epoch": 0.54, "learning_rate": 6.862568323744622e-05, "loss": 2.2382, "step": 86872 }, { "epoch": 0.54, "learning_rate": 6.861952467855721e-05, "loss": 2.2398, "step": 86880 }, { "epoch": 0.54, "learning_rate": 6.861336590538583e-05, "loss": 2.2427, "step": 86888 }, { "epoch": 0.54, "learning_rate": 6.860720691808521e-05, "loss": 2.2481, "step": 86896 }, { "epoch": 0.54, "learning_rate": 6.860104771680847e-05, "loss": 2.2425, "step": 86904 }, { "epoch": 0.54, "learning_rate": 6.859488830170872e-05, "loss": 2.2498, "step": 86912 }, { "epoch": 0.54, "learning_rate": 6.858872867293907e-05, "loss": 2.2347, "step": 86920 }, { "epoch": 0.54, "learning_rate": 6.858256883065267e-05, "loss": 2.2499, "step": 86928 }, { "epoch": 0.54, "learning_rate": 6.857640877500265e-05, "loss": 2.2391, "step": 86936 }, { "epoch": 0.54, "learning_rate": 6.857024850614213e-05, "loss": 2.2527, "step": 86944 }, { "epoch": 0.54, "learning_rate": 6.856408802422429e-05, "loss": 2.2606, "step": 86952 }, { "epoch": 0.54, "learning_rate": 6.855792732940223e-05, "loss": 2.2492, "step": 86960 }, { "epoch": 0.54, "learning_rate": 6.855176642182916e-05, "loss": 2.2404, "step": 86968 }, { "epoch": 0.54, "learning_rate": 6.854560530165822e-05, "loss": 2.2579, "step": 86976 }, { "epoch": 0.54, "learning_rate": 6.853944396904258e-05, "loss": 2.252, "step": 86984 }, { "epoch": 0.54, "learning_rate": 6.853328242413536e-05, "loss": 2.2406, "step": 86992 }, { "epoch": 0.54, "learning_rate": 6.852712066708984e-05, "loss": 2.2518, "step": 87000 }, { "epoch": 0.54, "learning_rate": 6.852095869805912e-05, "loss": 2.2404, "step": 87008 }, { "epoch": 0.54, "learning_rate": 6.85147965171964e-05, "loss": 2.2545, "step": 87016 }, { "epoch": 0.54, "learning_rate": 6.850863412465489e-05, "loss": 2.2682, "step": 87024 }, { "epoch": 0.54, "learning_rate": 6.850247152058777e-05, "loss": 2.2581, "step": 87032 }, { "epoch": 0.54, "learning_rate": 6.849630870514828e-05, "loss": 2.2619, "step": 87040 }, { "epoch": 0.54, "learning_rate": 6.849014567848958e-05, "loss": 2.2613, "step": 87048 }, { "epoch": 0.54, "learning_rate": 6.848398244076492e-05, "loss": 2.2589, "step": 87056 }, { "epoch": 0.54, "learning_rate": 6.847781899212751e-05, "loss": 2.257, "step": 87064 }, { "epoch": 0.54, "learning_rate": 6.847165533273055e-05, "loss": 2.2504, "step": 87072 }, { "epoch": 0.54, "learning_rate": 6.846549146272729e-05, "loss": 2.2604, "step": 87080 }, { "epoch": 0.54, "learning_rate": 6.845932738227097e-05, "loss": 2.2576, "step": 87088 }, { "epoch": 0.54, "learning_rate": 6.845316309151481e-05, "loss": 2.27, "step": 87096 }, { "epoch": 0.54, "learning_rate": 6.84469985906121e-05, "loss": 2.263, "step": 87104 }, { "epoch": 0.54, "learning_rate": 6.844083387971603e-05, "loss": 2.2453, "step": 87112 }, { "epoch": 0.54, "learning_rate": 6.843466895897987e-05, "loss": 2.2737, "step": 87120 }, { "epoch": 0.54, "learning_rate": 6.842850382855692e-05, "loss": 2.2543, "step": 87128 }, { "epoch": 0.54, "learning_rate": 6.842233848860042e-05, "loss": 2.2581, "step": 87136 }, { "epoch": 0.54, "learning_rate": 6.841617293926362e-05, "loss": 2.2553, "step": 87144 }, { "epoch": 0.54, "learning_rate": 6.841000718069982e-05, "loss": 2.259, "step": 87152 }, { "epoch": 0.54, "learning_rate": 6.840384121306232e-05, "loss": 2.2735, "step": 87160 }, { "epoch": 0.54, "learning_rate": 6.839767503650436e-05, "loss": 2.2684, "step": 87168 }, { "epoch": 0.54, "learning_rate": 6.839150865117927e-05, "loss": 2.2514, "step": 87176 }, { "epoch": 0.54, "learning_rate": 6.838534205724034e-05, "loss": 2.2442, "step": 87184 }, { "epoch": 0.54, "learning_rate": 6.837917525484085e-05, "loss": 2.2626, "step": 87192 }, { "epoch": 0.55, "learning_rate": 6.837300824413413e-05, "loss": 2.2447, "step": 87200 }, { "epoch": 0.55, "learning_rate": 6.836684102527346e-05, "loss": 2.2562, "step": 87208 }, { "epoch": 0.55, "learning_rate": 6.836067359841223e-05, "loss": 2.2434, "step": 87216 }, { "epoch": 0.55, "learning_rate": 6.835450596370369e-05, "loss": 2.2603, "step": 87224 }, { "epoch": 0.55, "learning_rate": 6.83483381213012e-05, "loss": 2.2493, "step": 87232 }, { "epoch": 0.55, "learning_rate": 6.834217007135807e-05, "loss": 2.2486, "step": 87240 }, { "epoch": 0.55, "learning_rate": 6.833600181402767e-05, "loss": 2.2475, "step": 87248 }, { "epoch": 0.55, "learning_rate": 6.832983334946335e-05, "loss": 2.2502, "step": 87256 }, { "epoch": 0.55, "learning_rate": 6.83236646778184e-05, "loss": 2.2601, "step": 87264 }, { "epoch": 0.55, "learning_rate": 6.831749579924623e-05, "loss": 2.2715, "step": 87272 }, { "epoch": 0.55, "learning_rate": 6.831132671390019e-05, "loss": 2.2622, "step": 87280 }, { "epoch": 0.55, "learning_rate": 6.830515742193362e-05, "loss": 2.246, "step": 87288 }, { "epoch": 0.55, "learning_rate": 6.829898792349993e-05, "loss": 2.2582, "step": 87296 }, { "epoch": 0.55, "learning_rate": 6.829281821875244e-05, "loss": 2.2445, "step": 87304 }, { "epoch": 0.55, "learning_rate": 6.828664830784457e-05, "loss": 2.2518, "step": 87312 }, { "epoch": 0.55, "learning_rate": 6.82804781909297e-05, "loss": 2.2444, "step": 87320 }, { "epoch": 0.55, "learning_rate": 6.82743078681612e-05, "loss": 2.2591, "step": 87328 }, { "epoch": 0.55, "learning_rate": 6.826813733969248e-05, "loss": 2.2639, "step": 87336 }, { "epoch": 0.55, "learning_rate": 6.826196660567694e-05, "loss": 2.2773, "step": 87344 }, { "epoch": 0.55, "learning_rate": 6.825579566626798e-05, "loss": 2.2602, "step": 87352 }, { "epoch": 0.55, "learning_rate": 6.824962452161902e-05, "loss": 2.2586, "step": 87360 }, { "epoch": 0.55, "learning_rate": 6.824345317188347e-05, "loss": 2.2518, "step": 87368 }, { "epoch": 0.55, "learning_rate": 6.823728161721477e-05, "loss": 2.258, "step": 87376 }, { "epoch": 0.55, "learning_rate": 6.823110985776628e-05, "loss": 2.2805, "step": 87384 }, { "epoch": 0.55, "learning_rate": 6.822493789369149e-05, "loss": 2.259, "step": 87392 }, { "epoch": 0.55, "learning_rate": 6.821876572514386e-05, "loss": 2.2629, "step": 87400 }, { "epoch": 0.55, "learning_rate": 6.821259335227674e-05, "loss": 2.2583, "step": 87408 }, { "epoch": 0.55, "learning_rate": 6.820642077524366e-05, "loss": 2.2437, "step": 87416 }, { "epoch": 0.55, "learning_rate": 6.820024799419802e-05, "loss": 2.2739, "step": 87424 }, { "epoch": 0.55, "learning_rate": 6.81940750092933e-05, "loss": 2.2644, "step": 87432 }, { "epoch": 0.55, "learning_rate": 6.818790182068295e-05, "loss": 2.2552, "step": 87440 }, { "epoch": 0.55, "learning_rate": 6.818172842852047e-05, "loss": 2.2479, "step": 87448 }, { "epoch": 0.55, "learning_rate": 6.817555483295927e-05, "loss": 2.2538, "step": 87456 }, { "epoch": 0.55, "learning_rate": 6.816938103415287e-05, "loss": 2.2618, "step": 87464 }, { "epoch": 0.55, "learning_rate": 6.816320703225475e-05, "loss": 2.2665, "step": 87472 }, { "epoch": 0.55, "learning_rate": 6.815703282741839e-05, "loss": 2.2471, "step": 87480 }, { "epoch": 0.55, "learning_rate": 6.815085841979724e-05, "loss": 2.247, "step": 87488 }, { "epoch": 0.55, "learning_rate": 6.814468380954488e-05, "loss": 2.2584, "step": 87496 }, { "epoch": 0.55, "learning_rate": 6.813850899681475e-05, "loss": 2.2551, "step": 87504 }, { "epoch": 0.55, "learning_rate": 6.813233398176038e-05, "loss": 2.26, "step": 87512 }, { "epoch": 0.55, "learning_rate": 6.812615876453527e-05, "loss": 2.2602, "step": 87520 }, { "epoch": 0.55, "learning_rate": 6.811998334529295e-05, "loss": 2.2588, "step": 87528 }, { "epoch": 0.55, "learning_rate": 6.811380772418692e-05, "loss": 2.2545, "step": 87536 }, { "epoch": 0.55, "learning_rate": 6.810763190137072e-05, "loss": 2.2586, "step": 87544 }, { "epoch": 0.55, "learning_rate": 6.810145587699787e-05, "loss": 2.2626, "step": 87552 }, { "epoch": 0.55, "learning_rate": 6.809527965122194e-05, "loss": 2.2654, "step": 87560 }, { "epoch": 0.55, "learning_rate": 6.808910322419646e-05, "loss": 2.2233, "step": 87568 }, { "epoch": 0.55, "learning_rate": 6.808292659607494e-05, "loss": 2.2642, "step": 87576 }, { "epoch": 0.55, "learning_rate": 6.807674976701096e-05, "loss": 2.2767, "step": 87584 }, { "epoch": 0.55, "learning_rate": 6.807057273715809e-05, "loss": 2.2532, "step": 87592 }, { "epoch": 0.55, "learning_rate": 6.806439550666986e-05, "loss": 2.2507, "step": 87600 }, { "epoch": 0.55, "learning_rate": 6.805821807569986e-05, "loss": 2.2574, "step": 87608 }, { "epoch": 0.55, "learning_rate": 6.805204044440166e-05, "loss": 2.2561, "step": 87616 }, { "epoch": 0.55, "learning_rate": 6.804586261292882e-05, "loss": 2.2508, "step": 87624 }, { "epoch": 0.55, "learning_rate": 6.803968458143495e-05, "loss": 2.2578, "step": 87632 }, { "epoch": 0.55, "learning_rate": 6.80335063500736e-05, "loss": 2.2566, "step": 87640 }, { "epoch": 0.55, "learning_rate": 6.80273279189984e-05, "loss": 2.2482, "step": 87648 }, { "epoch": 0.55, "learning_rate": 6.802114928836291e-05, "loss": 2.2651, "step": 87656 }, { "epoch": 0.55, "learning_rate": 6.801497045832075e-05, "loss": 2.2618, "step": 87664 }, { "epoch": 0.55, "learning_rate": 6.800879142902552e-05, "loss": 2.2705, "step": 87672 }, { "epoch": 0.55, "learning_rate": 6.800261220063085e-05, "loss": 2.2571, "step": 87680 }, { "epoch": 0.55, "learning_rate": 6.799643277329035e-05, "loss": 2.2548, "step": 87688 }, { "epoch": 0.55, "learning_rate": 6.79902531471576e-05, "loss": 2.2441, "step": 87696 }, { "epoch": 0.55, "learning_rate": 6.79840733223863e-05, "loss": 2.2634, "step": 87704 }, { "epoch": 0.55, "learning_rate": 6.797789329913002e-05, "loss": 2.2756, "step": 87712 }, { "epoch": 0.55, "learning_rate": 6.797171307754242e-05, "loss": 2.2519, "step": 87720 }, { "epoch": 0.55, "learning_rate": 6.796553265777717e-05, "loss": 2.2561, "step": 87728 }, { "epoch": 0.55, "learning_rate": 6.795935203998782e-05, "loss": 2.2539, "step": 87736 }, { "epoch": 0.55, "learning_rate": 6.795317122432814e-05, "loss": 2.2528, "step": 87744 }, { "epoch": 0.55, "learning_rate": 6.794699021095172e-05, "loss": 2.2647, "step": 87752 }, { "epoch": 0.55, "learning_rate": 6.794080900001222e-05, "loss": 2.2424, "step": 87760 }, { "epoch": 0.55, "learning_rate": 6.793462759166331e-05, "loss": 2.2518, "step": 87768 }, { "epoch": 0.55, "learning_rate": 6.792844598605868e-05, "loss": 2.2465, "step": 87776 }, { "epoch": 0.55, "learning_rate": 6.7922264183352e-05, "loss": 2.2465, "step": 87784 }, { "epoch": 0.55, "learning_rate": 6.791608218369693e-05, "loss": 2.2642, "step": 87792 }, { "epoch": 0.55, "learning_rate": 6.790989998724717e-05, "loss": 2.2429, "step": 87800 }, { "epoch": 0.55, "learning_rate": 6.790371759415642e-05, "loss": 2.2572, "step": 87808 }, { "epoch": 0.55, "learning_rate": 6.789753500457835e-05, "loss": 2.247, "step": 87816 }, { "epoch": 0.55, "learning_rate": 6.78913522186667e-05, "loss": 2.2456, "step": 87824 }, { "epoch": 0.55, "learning_rate": 6.78851692365751e-05, "loss": 2.2589, "step": 87832 }, { "epoch": 0.55, "learning_rate": 6.787898605845736e-05, "loss": 2.2388, "step": 87840 }, { "epoch": 0.55, "learning_rate": 6.787280268446712e-05, "loss": 2.2504, "step": 87848 }, { "epoch": 0.55, "learning_rate": 6.786661911475811e-05, "loss": 2.2574, "step": 87856 }, { "epoch": 0.55, "learning_rate": 6.786043534948407e-05, "loss": 2.2541, "step": 87864 }, { "epoch": 0.55, "learning_rate": 6.785425138879875e-05, "loss": 2.2582, "step": 87872 }, { "epoch": 0.55, "learning_rate": 6.784806723285584e-05, "loss": 2.2506, "step": 87880 }, { "epoch": 0.55, "learning_rate": 6.784188288180909e-05, "loss": 2.2689, "step": 87888 }, { "epoch": 0.55, "learning_rate": 6.783569833581228e-05, "loss": 2.2762, "step": 87896 }, { "epoch": 0.55, "learning_rate": 6.78295135950191e-05, "loss": 2.2427, "step": 87904 }, { "epoch": 0.55, "learning_rate": 6.782332865958334e-05, "loss": 2.2473, "step": 87912 }, { "epoch": 0.55, "learning_rate": 6.781714352965876e-05, "loss": 2.241, "step": 87920 }, { "epoch": 0.55, "learning_rate": 6.781095820539912e-05, "loss": 2.268, "step": 87928 }, { "epoch": 0.55, "learning_rate": 6.780477268695818e-05, "loss": 2.2401, "step": 87936 }, { "epoch": 0.55, "learning_rate": 6.779858697448972e-05, "loss": 2.2542, "step": 87944 }, { "epoch": 0.55, "learning_rate": 6.779240106814749e-05, "loss": 2.2429, "step": 87952 }, { "epoch": 0.55, "learning_rate": 6.77862149680853e-05, "loss": 2.2573, "step": 87960 }, { "epoch": 0.55, "learning_rate": 6.778002867445695e-05, "loss": 2.2703, "step": 87968 }, { "epoch": 0.55, "learning_rate": 6.77738421874162e-05, "loss": 2.2616, "step": 87976 }, { "epoch": 0.55, "learning_rate": 6.776765550711687e-05, "loss": 2.2723, "step": 87984 }, { "epoch": 0.55, "learning_rate": 6.776146863371275e-05, "loss": 2.2499, "step": 87992 }, { "epoch": 0.55, "learning_rate": 6.775528156735764e-05, "loss": 2.2685, "step": 88000 }, { "epoch": 0.55, "learning_rate": 6.774909430820537e-05, "loss": 2.2504, "step": 88008 }, { "epoch": 0.55, "learning_rate": 6.774290685640974e-05, "loss": 2.2546, "step": 88016 }, { "epoch": 0.55, "learning_rate": 6.773671921212459e-05, "loss": 2.2662, "step": 88024 }, { "epoch": 0.55, "learning_rate": 6.773053137550371e-05, "loss": 2.2532, "step": 88032 }, { "epoch": 0.55, "learning_rate": 6.772434334670098e-05, "loss": 2.2503, "step": 88040 }, { "epoch": 0.55, "learning_rate": 6.771815512587019e-05, "loss": 2.2742, "step": 88048 }, { "epoch": 0.55, "learning_rate": 6.77119667131652e-05, "loss": 2.2516, "step": 88056 }, { "epoch": 0.55, "learning_rate": 6.770577810873987e-05, "loss": 2.2686, "step": 88064 }, { "epoch": 0.55, "learning_rate": 6.769958931274799e-05, "loss": 2.2557, "step": 88072 }, { "epoch": 0.55, "learning_rate": 6.769340032534348e-05, "loss": 2.2564, "step": 88080 }, { "epoch": 0.55, "learning_rate": 6.768721114668017e-05, "loss": 2.2466, "step": 88088 }, { "epoch": 0.55, "learning_rate": 6.768102177691194e-05, "loss": 2.262, "step": 88096 }, { "epoch": 0.55, "learning_rate": 6.767483221619264e-05, "loss": 2.2595, "step": 88104 }, { "epoch": 0.55, "learning_rate": 6.766864246467615e-05, "loss": 2.2466, "step": 88112 }, { "epoch": 0.55, "learning_rate": 6.766245252251636e-05, "loss": 2.248, "step": 88120 }, { "epoch": 0.55, "learning_rate": 6.765626238986712e-05, "loss": 2.2568, "step": 88128 }, { "epoch": 0.55, "learning_rate": 6.765007206688236e-05, "loss": 2.2595, "step": 88136 }, { "epoch": 0.55, "learning_rate": 6.764388155371592e-05, "loss": 2.2573, "step": 88144 }, { "epoch": 0.55, "learning_rate": 6.763769085052174e-05, "loss": 2.2502, "step": 88152 }, { "epoch": 0.55, "learning_rate": 6.763149995745372e-05, "loss": 2.2472, "step": 88160 }, { "epoch": 0.55, "learning_rate": 6.762530887466576e-05, "loss": 2.2331, "step": 88168 }, { "epoch": 0.55, "learning_rate": 6.761911760231175e-05, "loss": 2.2428, "step": 88176 }, { "epoch": 0.55, "learning_rate": 6.761292614054562e-05, "loss": 2.2535, "step": 88184 }, { "epoch": 0.55, "learning_rate": 6.76067344895213e-05, "loss": 2.2409, "step": 88192 }, { "epoch": 0.55, "learning_rate": 6.76005426493927e-05, "loss": 2.2414, "step": 88200 }, { "epoch": 0.55, "learning_rate": 6.759435062031375e-05, "loss": 2.2657, "step": 88208 }, { "epoch": 0.55, "learning_rate": 6.758815840243841e-05, "loss": 2.2649, "step": 88216 }, { "epoch": 0.55, "learning_rate": 6.75819659959206e-05, "loss": 2.2678, "step": 88224 }, { "epoch": 0.55, "learning_rate": 6.757577340091425e-05, "loss": 2.2342, "step": 88232 }, { "epoch": 0.55, "learning_rate": 6.756958061757332e-05, "loss": 2.2536, "step": 88240 }, { "epoch": 0.55, "learning_rate": 6.756338764605179e-05, "loss": 2.2427, "step": 88248 }, { "epoch": 0.55, "learning_rate": 6.755719448650359e-05, "loss": 2.2434, "step": 88256 }, { "epoch": 0.55, "learning_rate": 6.755100113908266e-05, "loss": 2.2487, "step": 88264 }, { "epoch": 0.55, "learning_rate": 6.754480760394303e-05, "loss": 2.2548, "step": 88272 }, { "epoch": 0.55, "learning_rate": 6.753861388123862e-05, "loss": 2.255, "step": 88280 }, { "epoch": 0.55, "learning_rate": 6.753241997112342e-05, "loss": 2.2528, "step": 88288 }, { "epoch": 0.55, "learning_rate": 6.752622587375141e-05, "loss": 2.2342, "step": 88296 }, { "epoch": 0.55, "learning_rate": 6.75200315892766e-05, "loss": 2.2529, "step": 88304 }, { "epoch": 0.55, "learning_rate": 6.751383711785296e-05, "loss": 2.2503, "step": 88312 }, { "epoch": 0.55, "learning_rate": 6.750764245963447e-05, "loss": 2.2319, "step": 88320 }, { "epoch": 0.55, "learning_rate": 6.750144761477512e-05, "loss": 2.2568, "step": 88328 }, { "epoch": 0.55, "learning_rate": 6.749525258342899e-05, "loss": 2.2403, "step": 88336 }, { "epoch": 0.55, "learning_rate": 6.748905736575003e-05, "loss": 2.2599, "step": 88344 }, { "epoch": 0.55, "learning_rate": 6.748286196189226e-05, "loss": 2.2518, "step": 88352 }, { "epoch": 0.55, "learning_rate": 6.747666637200967e-05, "loss": 2.2575, "step": 88360 }, { "epoch": 0.55, "learning_rate": 6.747047059625636e-05, "loss": 2.2722, "step": 88368 }, { "epoch": 0.55, "learning_rate": 6.746427463478631e-05, "loss": 2.2647, "step": 88376 }, { "epoch": 0.55, "learning_rate": 6.745807848775353e-05, "loss": 2.2583, "step": 88384 }, { "epoch": 0.55, "learning_rate": 6.745188215531208e-05, "loss": 2.2584, "step": 88392 }, { "epoch": 0.55, "learning_rate": 6.744568563761602e-05, "loss": 2.2584, "step": 88400 }, { "epoch": 0.55, "learning_rate": 6.743948893481938e-05, "loss": 2.2499, "step": 88408 }, { "epoch": 0.55, "learning_rate": 6.74332920470762e-05, "loss": 2.2693, "step": 88416 }, { "epoch": 0.55, "learning_rate": 6.742709497454055e-05, "loss": 2.2669, "step": 88424 }, { "epoch": 0.55, "learning_rate": 6.742089771736651e-05, "loss": 2.259, "step": 88432 }, { "epoch": 0.55, "learning_rate": 6.741470027570808e-05, "loss": 2.2397, "step": 88440 }, { "epoch": 0.55, "learning_rate": 6.740850264971939e-05, "loss": 2.2514, "step": 88448 }, { "epoch": 0.55, "learning_rate": 6.74023048395545e-05, "loss": 2.2539, "step": 88456 }, { "epoch": 0.55, "learning_rate": 6.739610684536746e-05, "loss": 2.2582, "step": 88464 }, { "epoch": 0.55, "learning_rate": 6.73899086673124e-05, "loss": 2.2543, "step": 88472 }, { "epoch": 0.55, "learning_rate": 6.738371030554336e-05, "loss": 2.2621, "step": 88480 }, { "epoch": 0.55, "learning_rate": 6.737751176021445e-05, "loss": 2.2626, "step": 88488 }, { "epoch": 0.55, "learning_rate": 6.737131303147978e-05, "loss": 2.2467, "step": 88496 }, { "epoch": 0.55, "learning_rate": 6.736511411949344e-05, "loss": 2.2503, "step": 88504 }, { "epoch": 0.55, "learning_rate": 6.735891502440954e-05, "loss": 2.2451, "step": 88512 }, { "epoch": 0.55, "learning_rate": 6.735271574638218e-05, "loss": 2.2456, "step": 88520 }, { "epoch": 0.55, "learning_rate": 6.73465162855655e-05, "loss": 2.2509, "step": 88528 }, { "epoch": 0.55, "learning_rate": 6.734031664211357e-05, "loss": 2.2661, "step": 88536 }, { "epoch": 0.55, "learning_rate": 6.733411681618057e-05, "loss": 2.2548, "step": 88544 }, { "epoch": 0.55, "learning_rate": 6.732791680792058e-05, "loss": 2.2581, "step": 88552 }, { "epoch": 0.55, "learning_rate": 6.732171661748779e-05, "loss": 2.2503, "step": 88560 }, { "epoch": 0.55, "learning_rate": 6.731551624503626e-05, "loss": 2.2569, "step": 88568 }, { "epoch": 0.55, "learning_rate": 6.73093156907202e-05, "loss": 2.2507, "step": 88576 }, { "epoch": 0.55, "learning_rate": 6.730311495469374e-05, "loss": 2.2311, "step": 88584 }, { "epoch": 0.55, "learning_rate": 6.729691403711103e-05, "loss": 2.2592, "step": 88592 }, { "epoch": 0.55, "learning_rate": 6.729071293812619e-05, "loss": 2.2531, "step": 88600 }, { "epoch": 0.55, "learning_rate": 6.728451165789342e-05, "loss": 2.2434, "step": 88608 }, { "epoch": 0.55, "learning_rate": 6.727831019656688e-05, "loss": 2.2555, "step": 88616 }, { "epoch": 0.55, "learning_rate": 6.727210855430072e-05, "loss": 2.2447, "step": 88624 }, { "epoch": 0.55, "learning_rate": 6.726590673124913e-05, "loss": 2.2487, "step": 88632 }, { "epoch": 0.55, "learning_rate": 6.725970472756629e-05, "loss": 2.2635, "step": 88640 }, { "epoch": 0.55, "learning_rate": 6.725350254340637e-05, "loss": 2.2497, "step": 88648 }, { "epoch": 0.55, "learning_rate": 6.724730017892355e-05, "loss": 2.2646, "step": 88656 }, { "epoch": 0.55, "learning_rate": 6.724109763427206e-05, "loss": 2.2573, "step": 88664 }, { "epoch": 0.55, "learning_rate": 6.723489490960606e-05, "loss": 2.2319, "step": 88672 }, { "epoch": 0.55, "learning_rate": 6.722869200507976e-05, "loss": 2.2479, "step": 88680 }, { "epoch": 0.55, "learning_rate": 6.722248892084736e-05, "loss": 2.2436, "step": 88688 }, { "epoch": 0.55, "learning_rate": 6.721628565706308e-05, "loss": 2.2584, "step": 88696 }, { "epoch": 0.55, "learning_rate": 6.721008221388112e-05, "loss": 2.2599, "step": 88704 }, { "epoch": 0.55, "learning_rate": 6.720387859145572e-05, "loss": 2.2438, "step": 88712 }, { "epoch": 0.55, "learning_rate": 6.719767478994109e-05, "loss": 2.2467, "step": 88720 }, { "epoch": 0.55, "learning_rate": 6.719147080949144e-05, "loss": 2.2556, "step": 88728 }, { "epoch": 0.55, "learning_rate": 6.718526665026104e-05, "loss": 2.2573, "step": 88736 }, { "epoch": 0.55, "learning_rate": 6.71790623124041e-05, "loss": 2.259, "step": 88744 }, { "epoch": 0.55, "learning_rate": 6.717285779607485e-05, "loss": 2.237, "step": 88752 }, { "epoch": 0.55, "learning_rate": 6.716665310142755e-05, "loss": 2.2583, "step": 88760 }, { "epoch": 0.55, "learning_rate": 6.716044822861648e-05, "loss": 2.2594, "step": 88768 }, { "epoch": 0.55, "learning_rate": 6.715424317779585e-05, "loss": 2.2587, "step": 88776 }, { "epoch": 0.55, "learning_rate": 6.714803794911992e-05, "loss": 2.2373, "step": 88784 }, { "epoch": 0.55, "learning_rate": 6.714183254274297e-05, "loss": 2.2413, "step": 88792 }, { "epoch": 0.56, "learning_rate": 6.713562695881928e-05, "loss": 2.2512, "step": 88800 }, { "epoch": 0.56, "learning_rate": 6.712942119750308e-05, "loss": 2.2581, "step": 88808 }, { "epoch": 0.56, "learning_rate": 6.712321525894867e-05, "loss": 2.2469, "step": 88816 }, { "epoch": 0.56, "learning_rate": 6.711700914331034e-05, "loss": 2.2575, "step": 88824 }, { "epoch": 0.56, "learning_rate": 6.711080285074236e-05, "loss": 2.2496, "step": 88832 }, { "epoch": 0.56, "learning_rate": 6.710459638139903e-05, "loss": 2.2676, "step": 88840 }, { "epoch": 0.56, "learning_rate": 6.709838973543463e-05, "loss": 2.25, "step": 88848 }, { "epoch": 0.56, "learning_rate": 6.709218291300346e-05, "loss": 2.2408, "step": 88856 }, { "epoch": 0.56, "learning_rate": 6.708597591425983e-05, "loss": 2.2462, "step": 88864 }, { "epoch": 0.56, "learning_rate": 6.707976873935804e-05, "loss": 2.2594, "step": 88872 }, { "epoch": 0.56, "learning_rate": 6.707356138845242e-05, "loss": 2.2512, "step": 88880 }, { "epoch": 0.56, "learning_rate": 6.706735386169724e-05, "loss": 2.2675, "step": 88888 }, { "epoch": 0.56, "learning_rate": 6.706114615924688e-05, "loss": 2.2537, "step": 88896 }, { "epoch": 0.56, "learning_rate": 6.705493828125564e-05, "loss": 2.2515, "step": 88904 }, { "epoch": 0.56, "learning_rate": 6.704873022787783e-05, "loss": 2.2612, "step": 88912 }, { "epoch": 0.56, "learning_rate": 6.704252199926778e-05, "loss": 2.2404, "step": 88920 }, { "epoch": 0.56, "learning_rate": 6.703631359557984e-05, "loss": 2.2505, "step": 88928 }, { "epoch": 0.56, "learning_rate": 6.703010501696839e-05, "loss": 2.2547, "step": 88936 }, { "epoch": 0.56, "learning_rate": 6.702389626358772e-05, "loss": 2.2377, "step": 88944 }, { "epoch": 0.56, "learning_rate": 6.70176873355922e-05, "loss": 2.2476, "step": 88952 }, { "epoch": 0.56, "learning_rate": 6.70114782331362e-05, "loss": 2.2466, "step": 88960 }, { "epoch": 0.56, "learning_rate": 6.700526895637404e-05, "loss": 2.2431, "step": 88968 }, { "epoch": 0.56, "learning_rate": 6.699905950546012e-05, "loss": 2.2633, "step": 88976 }, { "epoch": 0.56, "learning_rate": 6.699284988054879e-05, "loss": 2.2349, "step": 88984 }, { "epoch": 0.56, "learning_rate": 6.698664008179445e-05, "loss": 2.2335, "step": 88992 }, { "epoch": 0.56, "learning_rate": 6.698043010935143e-05, "loss": 2.2598, "step": 89000 }, { "epoch": 0.56, "learning_rate": 6.697421996337413e-05, "loss": 2.2434, "step": 89008 }, { "epoch": 0.56, "learning_rate": 6.696800964401695e-05, "loss": 2.2536, "step": 89016 }, { "epoch": 0.56, "learning_rate": 6.696179915143428e-05, "loss": 2.2394, "step": 89024 }, { "epoch": 0.56, "learning_rate": 6.695558848578049e-05, "loss": 2.2605, "step": 89032 }, { "epoch": 0.56, "learning_rate": 6.694937764720998e-05, "loss": 2.2528, "step": 89040 }, { "epoch": 0.56, "learning_rate": 6.694316663587717e-05, "loss": 2.2357, "step": 89048 }, { "epoch": 0.56, "learning_rate": 6.693695545193648e-05, "loss": 2.2562, "step": 89056 }, { "epoch": 0.56, "learning_rate": 6.693074409554227e-05, "loss": 2.2192, "step": 89064 }, { "epoch": 0.56, "learning_rate": 6.692453256684899e-05, "loss": 2.2508, "step": 89072 }, { "epoch": 0.56, "learning_rate": 6.691832086601106e-05, "loss": 2.2353, "step": 89080 }, { "epoch": 0.56, "learning_rate": 6.69121089931829e-05, "loss": 2.24, "step": 89088 }, { "epoch": 0.56, "learning_rate": 6.690589694851893e-05, "loss": 2.2371, "step": 89096 }, { "epoch": 0.56, "learning_rate": 6.689968473217356e-05, "loss": 2.2313, "step": 89104 }, { "epoch": 0.56, "learning_rate": 6.68934723443013e-05, "loss": 2.2446, "step": 89112 }, { "epoch": 0.56, "learning_rate": 6.688725978505652e-05, "loss": 2.246, "step": 89120 }, { "epoch": 0.56, "learning_rate": 6.68810470545937e-05, "loss": 2.2629, "step": 89128 }, { "epoch": 0.56, "learning_rate": 6.687483415306727e-05, "loss": 2.2416, "step": 89136 }, { "epoch": 0.56, "learning_rate": 6.686862108063168e-05, "loss": 2.2382, "step": 89144 }, { "epoch": 0.56, "learning_rate": 6.686240783744142e-05, "loss": 2.2433, "step": 89152 }, { "epoch": 0.56, "learning_rate": 6.685619442365092e-05, "loss": 2.2367, "step": 89160 }, { "epoch": 0.56, "learning_rate": 6.684998083941466e-05, "loss": 2.2364, "step": 89168 }, { "epoch": 0.56, "learning_rate": 6.684376708488712e-05, "loss": 2.2636, "step": 89176 }, { "epoch": 0.56, "learning_rate": 6.683755316022274e-05, "loss": 2.2455, "step": 89184 }, { "epoch": 0.56, "learning_rate": 6.683133906557604e-05, "loss": 2.2599, "step": 89192 }, { "epoch": 0.56, "learning_rate": 6.682512480110149e-05, "loss": 2.2509, "step": 89200 }, { "epoch": 0.56, "learning_rate": 6.681891036695353e-05, "loss": 2.2545, "step": 89208 }, { "epoch": 0.56, "learning_rate": 6.681269576328674e-05, "loss": 2.2553, "step": 89216 }, { "epoch": 0.56, "learning_rate": 6.680648099025554e-05, "loss": 2.2571, "step": 89224 }, { "epoch": 0.56, "learning_rate": 6.680026604801445e-05, "loss": 2.2478, "step": 89232 }, { "epoch": 0.56, "learning_rate": 6.679405093671802e-05, "loss": 2.2516, "step": 89240 }, { "epoch": 0.56, "learning_rate": 6.678783565652072e-05, "loss": 2.2462, "step": 89248 }, { "epoch": 0.56, "learning_rate": 6.678162020757704e-05, "loss": 2.2486, "step": 89256 }, { "epoch": 0.56, "learning_rate": 6.677540459004152e-05, "loss": 2.2668, "step": 89264 }, { "epoch": 0.56, "learning_rate": 6.676918880406869e-05, "loss": 2.2289, "step": 89272 }, { "epoch": 0.56, "learning_rate": 6.676297284981306e-05, "loss": 2.25, "step": 89280 }, { "epoch": 0.56, "learning_rate": 6.675675672742918e-05, "loss": 2.2582, "step": 89288 }, { "epoch": 0.56, "learning_rate": 6.675054043707157e-05, "loss": 2.2513, "step": 89296 }, { "epoch": 0.56, "learning_rate": 6.674432397889475e-05, "loss": 2.2748, "step": 89304 }, { "epoch": 0.56, "learning_rate": 6.67381073530533e-05, "loss": 2.2593, "step": 89312 }, { "epoch": 0.56, "learning_rate": 6.673189055970173e-05, "loss": 2.2586, "step": 89320 }, { "epoch": 0.56, "learning_rate": 6.672567359899461e-05, "loss": 2.2564, "step": 89328 }, { "epoch": 0.56, "learning_rate": 6.671945647108648e-05, "loss": 2.2375, "step": 89336 }, { "epoch": 0.56, "learning_rate": 6.671323917613193e-05, "loss": 2.2498, "step": 89344 }, { "epoch": 0.56, "learning_rate": 6.670702171428549e-05, "loss": 2.252, "step": 89352 }, { "epoch": 0.56, "learning_rate": 6.670080408570172e-05, "loss": 2.2511, "step": 89360 }, { "epoch": 0.56, "learning_rate": 6.669458629053524e-05, "loss": 2.2599, "step": 89368 }, { "epoch": 0.56, "learning_rate": 6.668836832894059e-05, "loss": 2.2618, "step": 89376 }, { "epoch": 0.56, "learning_rate": 6.668215020107232e-05, "loss": 2.2562, "step": 89384 }, { "epoch": 0.56, "learning_rate": 6.667593190708508e-05, "loss": 2.2645, "step": 89392 }, { "epoch": 0.56, "learning_rate": 6.66697134471334e-05, "loss": 2.2515, "step": 89400 }, { "epoch": 0.56, "learning_rate": 6.666349482137191e-05, "loss": 2.258, "step": 89408 }, { "epoch": 0.56, "learning_rate": 6.665727602995518e-05, "loss": 2.2627, "step": 89416 }, { "epoch": 0.56, "learning_rate": 6.665105707303783e-05, "loss": 2.2532, "step": 89424 }, { "epoch": 0.56, "learning_rate": 6.664483795077448e-05, "loss": 2.2698, "step": 89432 }, { "epoch": 0.56, "learning_rate": 6.663861866331968e-05, "loss": 2.2669, "step": 89440 }, { "epoch": 0.56, "learning_rate": 6.663239921082807e-05, "loss": 2.2682, "step": 89448 }, { "epoch": 0.56, "learning_rate": 6.662617959345428e-05, "loss": 2.2668, "step": 89456 }, { "epoch": 0.56, "learning_rate": 6.661995981135293e-05, "loss": 2.2603, "step": 89464 }, { "epoch": 0.56, "learning_rate": 6.661373986467863e-05, "loss": 2.2788, "step": 89472 }, { "epoch": 0.56, "learning_rate": 6.660751975358602e-05, "loss": 2.2575, "step": 89480 }, { "epoch": 0.56, "learning_rate": 6.660129947822973e-05, "loss": 2.2544, "step": 89488 }, { "epoch": 0.56, "learning_rate": 6.659507903876438e-05, "loss": 2.2669, "step": 89496 }, { "epoch": 0.56, "learning_rate": 6.658885843534465e-05, "loss": 2.2611, "step": 89504 }, { "epoch": 0.56, "learning_rate": 6.658263766812514e-05, "loss": 2.2624, "step": 89512 }, { "epoch": 0.56, "learning_rate": 6.657641673726051e-05, "loss": 2.2461, "step": 89520 }, { "epoch": 0.56, "learning_rate": 6.657019564290545e-05, "loss": 2.2479, "step": 89528 }, { "epoch": 0.56, "learning_rate": 6.656397438521458e-05, "loss": 2.2432, "step": 89536 }, { "epoch": 0.56, "learning_rate": 6.655775296434255e-05, "loss": 2.2706, "step": 89544 }, { "epoch": 0.56, "learning_rate": 6.655153138044408e-05, "loss": 2.2487, "step": 89552 }, { "epoch": 0.56, "learning_rate": 6.654530963367377e-05, "loss": 2.2424, "step": 89560 }, { "epoch": 0.56, "learning_rate": 6.653908772418633e-05, "loss": 2.2381, "step": 89568 }, { "epoch": 0.56, "learning_rate": 6.653286565213646e-05, "loss": 2.2856, "step": 89576 }, { "epoch": 0.56, "learning_rate": 6.65266434176788e-05, "loss": 2.2515, "step": 89584 }, { "epoch": 0.56, "learning_rate": 6.652042102096806e-05, "loss": 2.2476, "step": 89592 }, { "epoch": 0.56, "learning_rate": 6.651419846215892e-05, "loss": 2.2554, "step": 89600 }, { "epoch": 0.56, "learning_rate": 6.650797574140608e-05, "loss": 2.259, "step": 89608 }, { "epoch": 0.56, "learning_rate": 6.650175285886422e-05, "loss": 2.2593, "step": 89616 }, { "epoch": 0.56, "learning_rate": 6.649552981468807e-05, "loss": 2.2597, "step": 89624 }, { "epoch": 0.56, "learning_rate": 6.648930660903229e-05, "loss": 2.2667, "step": 89632 }, { "epoch": 0.56, "learning_rate": 6.648308324205166e-05, "loss": 2.2625, "step": 89640 }, { "epoch": 0.56, "learning_rate": 6.647685971390082e-05, "loss": 2.2627, "step": 89648 }, { "epoch": 0.56, "learning_rate": 6.647063602473455e-05, "loss": 2.2546, "step": 89656 }, { "epoch": 0.56, "learning_rate": 6.646441217470752e-05, "loss": 2.2482, "step": 89664 }, { "epoch": 0.56, "learning_rate": 6.64581881639745e-05, "loss": 2.244, "step": 89672 }, { "epoch": 0.56, "learning_rate": 6.645196399269018e-05, "loss": 2.2681, "step": 89680 }, { "epoch": 0.56, "learning_rate": 6.644573966100933e-05, "loss": 2.246, "step": 89688 }, { "epoch": 0.56, "learning_rate": 6.643951516908664e-05, "loss": 2.2553, "step": 89696 }, { "epoch": 0.56, "learning_rate": 6.64332905170769e-05, "loss": 2.2591, "step": 89704 }, { "epoch": 0.56, "learning_rate": 6.642706570513482e-05, "loss": 2.2474, "step": 89712 }, { "epoch": 0.56, "learning_rate": 6.64208407334152e-05, "loss": 2.2395, "step": 89720 }, { "epoch": 0.56, "learning_rate": 6.641461560207271e-05, "loss": 2.2561, "step": 89728 }, { "epoch": 0.56, "learning_rate": 6.640839031126218e-05, "loss": 2.2521, "step": 89736 }, { "epoch": 0.56, "learning_rate": 6.640216486113835e-05, "loss": 2.2485, "step": 89744 }, { "epoch": 0.56, "learning_rate": 6.639593925185598e-05, "loss": 2.2581, "step": 89752 }, { "epoch": 0.56, "learning_rate": 6.638971348356986e-05, "loss": 2.2745, "step": 89760 }, { "epoch": 0.56, "learning_rate": 6.638348755643471e-05, "loss": 2.2711, "step": 89768 }, { "epoch": 0.56, "learning_rate": 6.637726147060539e-05, "loss": 2.2642, "step": 89776 }, { "epoch": 0.56, "learning_rate": 6.63710352262366e-05, "loss": 2.2739, "step": 89784 }, { "epoch": 0.56, "learning_rate": 6.636480882348317e-05, "loss": 2.2619, "step": 89792 }, { "epoch": 0.56, "learning_rate": 6.635858226249987e-05, "loss": 2.2484, "step": 89800 }, { "epoch": 0.56, "learning_rate": 6.635235554344151e-05, "loss": 2.2572, "step": 89808 }, { "epoch": 0.56, "learning_rate": 6.634612866646286e-05, "loss": 2.2527, "step": 89816 }, { "epoch": 0.56, "learning_rate": 6.633990163171877e-05, "loss": 2.2672, "step": 89824 }, { "epoch": 0.56, "learning_rate": 6.6333674439364e-05, "loss": 2.2598, "step": 89832 }, { "epoch": 0.56, "learning_rate": 6.632744708955337e-05, "loss": 2.2577, "step": 89840 }, { "epoch": 0.56, "learning_rate": 6.632121958244171e-05, "loss": 2.2706, "step": 89848 }, { "epoch": 0.56, "learning_rate": 6.63149919181838e-05, "loss": 2.2663, "step": 89856 }, { "epoch": 0.56, "learning_rate": 6.630876409693449e-05, "loss": 2.2628, "step": 89864 }, { "epoch": 0.56, "learning_rate": 6.63025361188486e-05, "loss": 2.273, "step": 89872 }, { "epoch": 0.56, "learning_rate": 6.629630798408095e-05, "loss": 2.259, "step": 89880 }, { "epoch": 0.56, "learning_rate": 6.629007969278638e-05, "loss": 2.2721, "step": 89888 }, { "epoch": 0.56, "learning_rate": 6.628385124511974e-05, "loss": 2.255, "step": 89896 }, { "epoch": 0.56, "learning_rate": 6.627762264123584e-05, "loss": 2.2551, "step": 89904 }, { "epoch": 0.56, "learning_rate": 6.627139388128953e-05, "loss": 2.2521, "step": 89912 }, { "epoch": 0.56, "learning_rate": 6.626516496543567e-05, "loss": 2.2647, "step": 89920 }, { "epoch": 0.56, "learning_rate": 6.62589358938291e-05, "loss": 2.2563, "step": 89928 }, { "epoch": 0.56, "learning_rate": 6.625270666662469e-05, "loss": 2.2548, "step": 89936 }, { "epoch": 0.56, "learning_rate": 6.624647728397728e-05, "loss": 2.2639, "step": 89944 }, { "epoch": 0.56, "learning_rate": 6.624024774604174e-05, "loss": 2.2726, "step": 89952 }, { "epoch": 0.56, "learning_rate": 6.623401805297295e-05, "loss": 2.2561, "step": 89960 }, { "epoch": 0.56, "learning_rate": 6.62277882049258e-05, "loss": 2.2591, "step": 89968 }, { "epoch": 0.56, "learning_rate": 6.622155820205508e-05, "loss": 2.2468, "step": 89976 }, { "epoch": 0.56, "learning_rate": 6.621532804451576e-05, "loss": 2.2632, "step": 89984 }, { "epoch": 0.56, "learning_rate": 6.620909773246268e-05, "loss": 2.2732, "step": 89992 }, { "epoch": 0.56, "learning_rate": 6.620286726605074e-05, "loss": 2.2456, "step": 90000 }, { "epoch": 0.56, "learning_rate": 6.619663664543483e-05, "loss": 2.2404, "step": 90008 }, { "epoch": 0.56, "learning_rate": 6.619040587076983e-05, "loss": 2.2602, "step": 90016 }, { "epoch": 0.56, "learning_rate": 6.618417494221064e-05, "loss": 2.2589, "step": 90024 }, { "epoch": 0.56, "learning_rate": 6.617794385991217e-05, "loss": 2.2518, "step": 90032 }, { "epoch": 0.56, "learning_rate": 6.617171262402933e-05, "loss": 2.2503, "step": 90040 }, { "epoch": 0.56, "learning_rate": 6.616548123471701e-05, "loss": 2.2544, "step": 90048 }, { "epoch": 0.56, "learning_rate": 6.615924969213015e-05, "loss": 2.2615, "step": 90056 }, { "epoch": 0.56, "learning_rate": 6.615301799642362e-05, "loss": 2.2545, "step": 90064 }, { "epoch": 0.56, "learning_rate": 6.61467861477524e-05, "loss": 2.2421, "step": 90072 }, { "epoch": 0.56, "learning_rate": 6.614055414627138e-05, "loss": 2.2549, "step": 90080 }, { "epoch": 0.56, "learning_rate": 6.61343219921355e-05, "loss": 2.2602, "step": 90088 }, { "epoch": 0.56, "learning_rate": 6.612808968549967e-05, "loss": 2.2572, "step": 90096 }, { "epoch": 0.56, "learning_rate": 6.612185722651885e-05, "loss": 2.2263, "step": 90104 }, { "epoch": 0.56, "learning_rate": 6.6115624615348e-05, "loss": 2.2541, "step": 90112 }, { "epoch": 0.56, "learning_rate": 6.6109391852142e-05, "loss": 2.2563, "step": 90120 }, { "epoch": 0.56, "learning_rate": 6.610315893705583e-05, "loss": 2.2301, "step": 90128 }, { "epoch": 0.56, "learning_rate": 6.609692587024447e-05, "loss": 2.2537, "step": 90136 }, { "epoch": 0.56, "learning_rate": 6.609069265186284e-05, "loss": 2.2483, "step": 90144 }, { "epoch": 0.56, "learning_rate": 6.608445928206592e-05, "loss": 2.2467, "step": 90152 }, { "epoch": 0.56, "learning_rate": 6.607822576100864e-05, "loss": 2.2478, "step": 90160 }, { "epoch": 0.56, "learning_rate": 6.607199208884598e-05, "loss": 2.2527, "step": 90168 }, { "epoch": 0.56, "learning_rate": 6.606575826573293e-05, "loss": 2.2425, "step": 90176 }, { "epoch": 0.56, "learning_rate": 6.605952429182445e-05, "loss": 2.2639, "step": 90184 }, { "epoch": 0.56, "learning_rate": 6.60532901672755e-05, "loss": 2.2525, "step": 90192 }, { "epoch": 0.56, "learning_rate": 6.60470558922411e-05, "loss": 2.266, "step": 90200 }, { "epoch": 0.56, "learning_rate": 6.60408214668762e-05, "loss": 2.2418, "step": 90208 }, { "epoch": 0.56, "learning_rate": 6.603458689133582e-05, "loss": 2.2467, "step": 90216 }, { "epoch": 0.56, "learning_rate": 6.60283521657749e-05, "loss": 2.2491, "step": 90224 }, { "epoch": 0.56, "learning_rate": 6.602211729034848e-05, "loss": 2.2532, "step": 90232 }, { "epoch": 0.56, "learning_rate": 6.601588226521156e-05, "loss": 2.2487, "step": 90240 }, { "epoch": 0.56, "learning_rate": 6.600964709051912e-05, "loss": 2.2591, "step": 90248 }, { "epoch": 0.56, "learning_rate": 6.60034117664262e-05, "loss": 2.2445, "step": 90256 }, { "epoch": 0.56, "learning_rate": 6.599717629308775e-05, "loss": 2.2421, "step": 90264 }, { "epoch": 0.56, "learning_rate": 6.599094067065885e-05, "loss": 2.2624, "step": 90272 }, { "epoch": 0.56, "learning_rate": 6.598470489929449e-05, "loss": 2.2557, "step": 90280 }, { "epoch": 0.56, "learning_rate": 6.59784689791497e-05, "loss": 2.2502, "step": 90288 }, { "epoch": 0.56, "learning_rate": 6.597223291037948e-05, "loss": 2.2724, "step": 90296 }, { "epoch": 0.56, "learning_rate": 6.596599669313889e-05, "loss": 2.2573, "step": 90304 }, { "epoch": 0.56, "learning_rate": 6.595976032758298e-05, "loss": 2.2646, "step": 90312 }, { "epoch": 0.56, "learning_rate": 6.595352381386672e-05, "loss": 2.2539, "step": 90320 }, { "epoch": 0.56, "learning_rate": 6.594728715214523e-05, "loss": 2.2608, "step": 90328 }, { "epoch": 0.56, "learning_rate": 6.594105034257349e-05, "loss": 2.2624, "step": 90336 }, { "epoch": 0.56, "learning_rate": 6.593481338530656e-05, "loss": 2.2394, "step": 90344 }, { "epoch": 0.56, "learning_rate": 6.592857628049953e-05, "loss": 2.2452, "step": 90352 }, { "epoch": 0.56, "learning_rate": 6.59223390283074e-05, "loss": 2.2507, "step": 90360 }, { "epoch": 0.56, "learning_rate": 6.591610162888529e-05, "loss": 2.2566, "step": 90368 }, { "epoch": 0.56, "learning_rate": 6.59098640823882e-05, "loss": 2.2519, "step": 90376 }, { "epoch": 0.56, "learning_rate": 6.590362638897125e-05, "loss": 2.2633, "step": 90384 }, { "epoch": 0.56, "learning_rate": 6.589738854878948e-05, "loss": 2.2472, "step": 90392 }, { "epoch": 0.56, "learning_rate": 6.589115056199795e-05, "loss": 2.2508, "step": 90400 }, { "epoch": 0.57, "learning_rate": 6.588491242875177e-05, "loss": 2.2558, "step": 90408 }, { "epoch": 0.57, "learning_rate": 6.5878674149206e-05, "loss": 2.2418, "step": 90416 }, { "epoch": 0.57, "learning_rate": 6.587243572351574e-05, "loss": 2.2662, "step": 90424 }, { "epoch": 0.57, "learning_rate": 6.586619715183606e-05, "loss": 2.2575, "step": 90432 }, { "epoch": 0.57, "learning_rate": 6.585995843432207e-05, "loss": 2.2446, "step": 90440 }, { "epoch": 0.57, "learning_rate": 6.585371957112886e-05, "loss": 2.2582, "step": 90448 }, { "epoch": 0.57, "learning_rate": 6.584748056241151e-05, "loss": 2.2298, "step": 90456 }, { "epoch": 0.57, "learning_rate": 6.584124140832516e-05, "loss": 2.2617, "step": 90464 }, { "epoch": 0.57, "learning_rate": 6.583500210902485e-05, "loss": 2.2464, "step": 90472 }, { "epoch": 0.57, "learning_rate": 6.582876266466578e-05, "loss": 2.264, "step": 90480 }, { "epoch": 0.57, "learning_rate": 6.5822523075403e-05, "loss": 2.2327, "step": 90488 }, { "epoch": 0.57, "learning_rate": 6.581628334139163e-05, "loss": 2.2457, "step": 90496 }, { "epoch": 0.57, "learning_rate": 6.58100434627868e-05, "loss": 2.2387, "step": 90504 }, { "epoch": 0.57, "learning_rate": 6.580380343974366e-05, "loss": 2.2358, "step": 90512 }, { "epoch": 0.57, "learning_rate": 6.579756327241731e-05, "loss": 2.2348, "step": 90520 }, { "epoch": 0.57, "learning_rate": 6.579132296096289e-05, "loss": 2.2501, "step": 90528 }, { "epoch": 0.57, "learning_rate": 6.57850825055355e-05, "loss": 2.2623, "step": 90536 }, { "epoch": 0.57, "learning_rate": 6.577884190629036e-05, "loss": 2.2646, "step": 90544 }, { "epoch": 0.57, "learning_rate": 6.577260116338254e-05, "loss": 2.2576, "step": 90552 }, { "epoch": 0.57, "learning_rate": 6.576636027696719e-05, "loss": 2.2555, "step": 90560 }, { "epoch": 0.57, "learning_rate": 6.57601192471995e-05, "loss": 2.2457, "step": 90568 }, { "epoch": 0.57, "learning_rate": 6.575387807423457e-05, "loss": 2.2519, "step": 90576 }, { "epoch": 0.57, "learning_rate": 6.574763675822761e-05, "loss": 2.2541, "step": 90584 }, { "epoch": 0.57, "learning_rate": 6.574139529933375e-05, "loss": 2.2502, "step": 90592 }, { "epoch": 0.57, "learning_rate": 6.573515369770815e-05, "loss": 2.2622, "step": 90600 }, { "epoch": 0.57, "learning_rate": 6.572891195350602e-05, "loss": 2.262, "step": 90608 }, { "epoch": 0.57, "learning_rate": 6.572267006688245e-05, "loss": 2.2409, "step": 90616 }, { "epoch": 0.57, "learning_rate": 6.571642803799268e-05, "loss": 2.2585, "step": 90624 }, { "epoch": 0.57, "learning_rate": 6.571018586699187e-05, "loss": 2.2489, "step": 90632 }, { "epoch": 0.57, "learning_rate": 6.57039435540352e-05, "loss": 2.2711, "step": 90640 }, { "epoch": 0.57, "learning_rate": 6.569770109927784e-05, "loss": 2.2616, "step": 90648 }, { "epoch": 0.57, "learning_rate": 6.569145850287501e-05, "loss": 2.2562, "step": 90656 }, { "epoch": 0.57, "learning_rate": 6.568521576498188e-05, "loss": 2.2584, "step": 90664 }, { "epoch": 0.57, "learning_rate": 6.567897288575362e-05, "loss": 2.2681, "step": 90672 }, { "epoch": 0.57, "learning_rate": 6.567272986534549e-05, "loss": 2.2672, "step": 90680 }, { "epoch": 0.57, "learning_rate": 6.566648670391265e-05, "loss": 2.2489, "step": 90688 }, { "epoch": 0.57, "learning_rate": 6.566024340161031e-05, "loss": 2.2534, "step": 90696 }, { "epoch": 0.57, "learning_rate": 6.565399995859369e-05, "loss": 2.2539, "step": 90704 }, { "epoch": 0.57, "learning_rate": 6.564775637501799e-05, "loss": 2.2631, "step": 90712 }, { "epoch": 0.57, "learning_rate": 6.564151265103845e-05, "loss": 2.2616, "step": 90720 }, { "epoch": 0.57, "learning_rate": 6.563526878681024e-05, "loss": 2.2662, "step": 90728 }, { "epoch": 0.57, "learning_rate": 6.562902478248865e-05, "loss": 2.263, "step": 90736 }, { "epoch": 0.57, "learning_rate": 6.562278063822885e-05, "loss": 2.2616, "step": 90744 }, { "epoch": 0.57, "learning_rate": 6.56165363541861e-05, "loss": 2.2581, "step": 90752 }, { "epoch": 0.57, "learning_rate": 6.561029193051563e-05, "loss": 2.2538, "step": 90760 }, { "epoch": 0.57, "learning_rate": 6.560404736737267e-05, "loss": 2.2433, "step": 90768 }, { "epoch": 0.57, "learning_rate": 6.559780266491247e-05, "loss": 2.2618, "step": 90776 }, { "epoch": 0.57, "learning_rate": 6.559155782329025e-05, "loss": 2.2618, "step": 90784 }, { "epoch": 0.57, "learning_rate": 6.558531284266127e-05, "loss": 2.2606, "step": 90792 }, { "epoch": 0.57, "learning_rate": 6.557906772318083e-05, "loss": 2.2572, "step": 90800 }, { "epoch": 0.57, "learning_rate": 6.557282246500409e-05, "loss": 2.262, "step": 90808 }, { "epoch": 0.57, "learning_rate": 6.556657706828639e-05, "loss": 2.2443, "step": 90816 }, { "epoch": 0.57, "learning_rate": 6.556033153318294e-05, "loss": 2.2463, "step": 90824 }, { "epoch": 0.57, "learning_rate": 6.555408585984903e-05, "loss": 2.2585, "step": 90832 }, { "epoch": 0.57, "learning_rate": 6.554784004843992e-05, "loss": 2.2485, "step": 90840 }, { "epoch": 0.57, "learning_rate": 6.554159409911089e-05, "loss": 2.2586, "step": 90848 }, { "epoch": 0.57, "learning_rate": 6.553534801201722e-05, "loss": 2.2453, "step": 90856 }, { "epoch": 0.57, "learning_rate": 6.552910178731418e-05, "loss": 2.2657, "step": 90864 }, { "epoch": 0.57, "learning_rate": 6.552285542515703e-05, "loss": 2.2582, "step": 90872 }, { "epoch": 0.57, "learning_rate": 6.551660892570107e-05, "loss": 2.2617, "step": 90880 }, { "epoch": 0.57, "learning_rate": 6.55103622891016e-05, "loss": 2.2413, "step": 90888 }, { "epoch": 0.57, "learning_rate": 6.550411551551392e-05, "loss": 2.2596, "step": 90896 }, { "epoch": 0.57, "learning_rate": 6.54978686050933e-05, "loss": 2.2666, "step": 90904 }, { "epoch": 0.57, "learning_rate": 6.549162155799504e-05, "loss": 2.2418, "step": 90912 }, { "epoch": 0.57, "learning_rate": 6.548537437437448e-05, "loss": 2.2597, "step": 90920 }, { "epoch": 0.57, "learning_rate": 6.547912705438687e-05, "loss": 2.251, "step": 90928 }, { "epoch": 0.57, "learning_rate": 6.547287959818755e-05, "loss": 2.243, "step": 90936 }, { "epoch": 0.57, "learning_rate": 6.546663200593184e-05, "loss": 2.2495, "step": 90944 }, { "epoch": 0.57, "learning_rate": 6.546038427777503e-05, "loss": 2.2585, "step": 90952 }, { "epoch": 0.57, "learning_rate": 6.545413641387248e-05, "loss": 2.2422, "step": 90960 }, { "epoch": 0.57, "learning_rate": 6.544788841437946e-05, "loss": 2.2587, "step": 90968 }, { "epoch": 0.57, "learning_rate": 6.544164027945134e-05, "loss": 2.237, "step": 90976 }, { "epoch": 0.57, "learning_rate": 6.543539200924343e-05, "loss": 2.2498, "step": 90984 }, { "epoch": 0.57, "learning_rate": 6.542914360391104e-05, "loss": 2.237, "step": 90992 }, { "epoch": 0.57, "learning_rate": 6.542289506360954e-05, "loss": 2.2562, "step": 91000 }, { "epoch": 0.57, "learning_rate": 6.54166463884943e-05, "loss": 2.2598, "step": 91008 }, { "epoch": 0.57, "learning_rate": 6.541039757872058e-05, "loss": 2.2562, "step": 91016 }, { "epoch": 0.57, "learning_rate": 6.54041486344438e-05, "loss": 2.2584, "step": 91024 }, { "epoch": 0.57, "learning_rate": 6.539789955581924e-05, "loss": 2.2605, "step": 91032 }, { "epoch": 0.57, "learning_rate": 6.539165034300232e-05, "loss": 2.2469, "step": 91040 }, { "epoch": 0.57, "learning_rate": 6.538540099614837e-05, "loss": 2.2469, "step": 91048 }, { "epoch": 0.57, "learning_rate": 6.537915151541274e-05, "loss": 2.2518, "step": 91056 }, { "epoch": 0.57, "learning_rate": 6.537290190095078e-05, "loss": 2.247, "step": 91064 }, { "epoch": 0.57, "learning_rate": 6.53666521529179e-05, "loss": 2.2748, "step": 91072 }, { "epoch": 0.57, "learning_rate": 6.536040227146943e-05, "loss": 2.2673, "step": 91080 }, { "epoch": 0.57, "learning_rate": 6.535415225676079e-05, "loss": 2.2672, "step": 91088 }, { "epoch": 0.57, "learning_rate": 6.534790210894729e-05, "loss": 2.2534, "step": 91096 }, { "epoch": 0.57, "learning_rate": 6.534165182818435e-05, "loss": 2.2687, "step": 91104 }, { "epoch": 0.57, "learning_rate": 6.533540141462735e-05, "loss": 2.2412, "step": 91112 }, { "epoch": 0.57, "learning_rate": 6.532915086843168e-05, "loss": 2.2615, "step": 91120 }, { "epoch": 0.57, "learning_rate": 6.532290018975272e-05, "loss": 2.2617, "step": 91128 }, { "epoch": 0.57, "learning_rate": 6.531664937874587e-05, "loss": 2.2615, "step": 91136 }, { "epoch": 0.57, "learning_rate": 6.531039843556649e-05, "loss": 2.2505, "step": 91144 }, { "epoch": 0.57, "learning_rate": 6.530414736037002e-05, "loss": 2.2545, "step": 91152 }, { "epoch": 0.57, "learning_rate": 6.529789615331187e-05, "loss": 2.2488, "step": 91160 }, { "epoch": 0.57, "learning_rate": 6.529164481454741e-05, "loss": 2.2429, "step": 91168 }, { "epoch": 0.57, "learning_rate": 6.528539334423207e-05, "loss": 2.2661, "step": 91176 }, { "epoch": 0.57, "learning_rate": 6.527914174252125e-05, "loss": 2.2543, "step": 91184 }, { "epoch": 0.57, "learning_rate": 6.52728900095704e-05, "loss": 2.2649, "step": 91192 }, { "epoch": 0.57, "learning_rate": 6.526663814553489e-05, "loss": 2.2458, "step": 91200 }, { "epoch": 0.57, "learning_rate": 6.52603861505702e-05, "loss": 2.246, "step": 91208 }, { "epoch": 0.57, "learning_rate": 6.525413402483167e-05, "loss": 2.249, "step": 91216 }, { "epoch": 0.57, "learning_rate": 6.52478817684748e-05, "loss": 2.2421, "step": 91224 }, { "epoch": 0.57, "learning_rate": 6.524162938165501e-05, "loss": 2.2598, "step": 91232 }, { "epoch": 0.57, "learning_rate": 6.523537686452772e-05, "loss": 2.2533, "step": 91240 }, { "epoch": 0.57, "learning_rate": 6.522912421724837e-05, "loss": 2.2544, "step": 91248 }, { "epoch": 0.57, "learning_rate": 6.52228714399724e-05, "loss": 2.2399, "step": 91256 }, { "epoch": 0.57, "learning_rate": 6.521661853285527e-05, "loss": 2.2487, "step": 91264 }, { "epoch": 0.57, "learning_rate": 6.521036549605242e-05, "loss": 2.2577, "step": 91272 }, { "epoch": 0.57, "learning_rate": 6.520411232971928e-05, "loss": 2.2741, "step": 91280 }, { "epoch": 0.57, "learning_rate": 6.519785903401134e-05, "loss": 2.2483, "step": 91288 }, { "epoch": 0.57, "learning_rate": 6.519160560908403e-05, "loss": 2.2651, "step": 91296 }, { "epoch": 0.57, "learning_rate": 6.518535205509284e-05, "loss": 2.2401, "step": 91304 }, { "epoch": 0.57, "learning_rate": 6.517909837219321e-05, "loss": 2.2394, "step": 91312 }, { "epoch": 0.57, "learning_rate": 6.517284456054061e-05, "loss": 2.244, "step": 91320 }, { "epoch": 0.57, "learning_rate": 6.516659062029051e-05, "loss": 2.2506, "step": 91328 }, { "epoch": 0.57, "learning_rate": 6.51603365515984e-05, "loss": 2.2694, "step": 91336 }, { "epoch": 0.57, "learning_rate": 6.515408235461973e-05, "loss": 2.2443, "step": 91344 }, { "epoch": 0.57, "learning_rate": 6.514782802951001e-05, "loss": 2.2475, "step": 91352 }, { "epoch": 0.57, "learning_rate": 6.51415735764247e-05, "loss": 2.2534, "step": 91360 }, { "epoch": 0.57, "learning_rate": 6.513531899551928e-05, "loss": 2.2592, "step": 91368 }, { "epoch": 0.57, "learning_rate": 6.512906428694926e-05, "loss": 2.2477, "step": 91376 }, { "epoch": 0.57, "learning_rate": 6.512280945087015e-05, "loss": 2.2652, "step": 91384 }, { "epoch": 0.57, "learning_rate": 6.511655448743739e-05, "loss": 2.2405, "step": 91392 }, { "epoch": 0.57, "learning_rate": 6.511029939680653e-05, "loss": 2.244, "step": 91400 }, { "epoch": 0.57, "learning_rate": 6.510404417913305e-05, "loss": 2.2566, "step": 91408 }, { "epoch": 0.57, "learning_rate": 6.509778883457245e-05, "loss": 2.2619, "step": 91416 }, { "epoch": 0.57, "learning_rate": 6.509153336328026e-05, "loss": 2.2429, "step": 91424 }, { "epoch": 0.57, "learning_rate": 6.508527776541198e-05, "loss": 2.2532, "step": 91432 }, { "epoch": 0.57, "learning_rate": 6.507902204112311e-05, "loss": 2.2421, "step": 91440 }, { "epoch": 0.57, "learning_rate": 6.507276619056919e-05, "loss": 2.2536, "step": 91448 }, { "epoch": 0.57, "learning_rate": 6.506651021390574e-05, "loss": 2.2626, "step": 91456 }, { "epoch": 0.57, "learning_rate": 6.506025411128826e-05, "loss": 2.262, "step": 91464 }, { "epoch": 0.57, "learning_rate": 6.505399788287232e-05, "loss": 2.2518, "step": 91472 }, { "epoch": 0.57, "learning_rate": 6.504774152881341e-05, "loss": 2.2454, "step": 91480 }, { "epoch": 0.57, "learning_rate": 6.504148504926708e-05, "loss": 2.2568, "step": 91488 }, { "epoch": 0.57, "learning_rate": 6.503522844438887e-05, "loss": 2.2374, "step": 91496 }, { "epoch": 0.57, "learning_rate": 6.502897171433431e-05, "loss": 2.2515, "step": 91504 }, { "epoch": 0.57, "learning_rate": 6.502271485925896e-05, "loss": 2.2617, "step": 91512 }, { "epoch": 0.57, "learning_rate": 6.501645787931835e-05, "loss": 2.256, "step": 91520 }, { "epoch": 0.57, "learning_rate": 6.501020077466801e-05, "loss": 2.2555, "step": 91528 }, { "epoch": 0.57, "learning_rate": 6.500394354546355e-05, "loss": 2.2718, "step": 91536 }, { "epoch": 0.57, "learning_rate": 6.499768619186048e-05, "loss": 2.2511, "step": 91544 }, { "epoch": 0.57, "learning_rate": 6.499142871401438e-05, "loss": 2.2437, "step": 91552 }, { "epoch": 0.57, "learning_rate": 6.49851711120808e-05, "loss": 2.2555, "step": 91560 }, { "epoch": 0.57, "learning_rate": 6.49789133862153e-05, "loss": 2.2329, "step": 91568 }, { "epoch": 0.57, "learning_rate": 6.497265553657346e-05, "loss": 2.2479, "step": 91576 }, { "epoch": 0.57, "learning_rate": 6.496639756331085e-05, "loss": 2.2549, "step": 91584 }, { "epoch": 0.57, "learning_rate": 6.4960139466583e-05, "loss": 2.255, "step": 91592 }, { "epoch": 0.57, "learning_rate": 6.495388124654557e-05, "loss": 2.241, "step": 91600 }, { "epoch": 0.57, "learning_rate": 6.494762290335407e-05, "loss": 2.2673, "step": 91608 }, { "epoch": 0.57, "learning_rate": 6.494136443716415e-05, "loss": 2.253, "step": 91616 }, { "epoch": 0.57, "learning_rate": 6.49351058481313e-05, "loss": 2.2477, "step": 91624 }, { "epoch": 0.57, "learning_rate": 6.49288471364112e-05, "loss": 2.2416, "step": 91632 }, { "epoch": 0.57, "learning_rate": 6.49225883021594e-05, "loss": 2.2253, "step": 91640 }, { "epoch": 0.57, "learning_rate": 6.49163293455315e-05, "loss": 2.2519, "step": 91648 }, { "epoch": 0.57, "learning_rate": 6.49100702666831e-05, "loss": 2.2663, "step": 91656 }, { "epoch": 0.57, "learning_rate": 6.490381106576981e-05, "loss": 2.2511, "step": 91664 }, { "epoch": 0.57, "learning_rate": 6.489755174294723e-05, "loss": 2.2608, "step": 91672 }, { "epoch": 0.57, "learning_rate": 6.489129229837095e-05, "loss": 2.2571, "step": 91680 }, { "epoch": 0.57, "learning_rate": 6.488503273219659e-05, "loss": 2.2785, "step": 91688 }, { "epoch": 0.57, "learning_rate": 6.487877304457979e-05, "loss": 2.2416, "step": 91696 }, { "epoch": 0.57, "learning_rate": 6.487251323567614e-05, "loss": 2.2478, "step": 91704 }, { "epoch": 0.57, "learning_rate": 6.486625330564125e-05, "loss": 2.2487, "step": 91712 }, { "epoch": 0.57, "learning_rate": 6.485999325463078e-05, "loss": 2.2738, "step": 91720 }, { "epoch": 0.57, "learning_rate": 6.48537330828003e-05, "loss": 2.2456, "step": 91728 }, { "epoch": 0.57, "learning_rate": 6.484747279030549e-05, "loss": 2.2492, "step": 91736 }, { "epoch": 0.57, "learning_rate": 6.484121237730197e-05, "loss": 2.2612, "step": 91744 }, { "epoch": 0.57, "learning_rate": 6.483495184394535e-05, "loss": 2.2635, "step": 91752 }, { "epoch": 0.57, "learning_rate": 6.48286911903913e-05, "loss": 2.2776, "step": 91760 }, { "epoch": 0.57, "learning_rate": 6.482243041679544e-05, "loss": 2.2642, "step": 91768 }, { "epoch": 0.57, "learning_rate": 6.481616952331342e-05, "loss": 2.2595, "step": 91776 }, { "epoch": 0.57, "learning_rate": 6.480990851010087e-05, "loss": 2.2689, "step": 91784 }, { "epoch": 0.57, "learning_rate": 6.480364737731348e-05, "loss": 2.2689, "step": 91792 }, { "epoch": 0.57, "learning_rate": 6.479738612510686e-05, "loss": 2.2621, "step": 91800 }, { "epoch": 0.57, "learning_rate": 6.479112475363668e-05, "loss": 2.2716, "step": 91808 }, { "epoch": 0.57, "learning_rate": 6.478486326305862e-05, "loss": 2.2646, "step": 91816 }, { "epoch": 0.57, "learning_rate": 6.477860165352829e-05, "loss": 2.2612, "step": 91824 }, { "epoch": 0.57, "learning_rate": 6.477233992520141e-05, "loss": 2.2553, "step": 91832 }, { "epoch": 0.57, "learning_rate": 6.476607807823363e-05, "loss": 2.2425, "step": 91840 }, { "epoch": 0.57, "learning_rate": 6.47598161127806e-05, "loss": 2.2754, "step": 91848 }, { "epoch": 0.57, "learning_rate": 6.475355402899803e-05, "loss": 2.2653, "step": 91856 }, { "epoch": 0.57, "learning_rate": 6.474729182704154e-05, "loss": 2.2531, "step": 91864 }, { "epoch": 0.57, "learning_rate": 6.474102950706687e-05, "loss": 2.2523, "step": 91872 }, { "epoch": 0.57, "learning_rate": 6.473476706922965e-05, "loss": 2.2529, "step": 91880 }, { "epoch": 0.57, "learning_rate": 6.472850451368561e-05, "loss": 2.2487, "step": 91888 }, { "epoch": 0.57, "learning_rate": 6.472224184059041e-05, "loss": 2.261, "step": 91896 }, { "epoch": 0.57, "learning_rate": 6.471597905009973e-05, "loss": 2.2708, "step": 91904 }, { "epoch": 0.57, "learning_rate": 6.470971614236932e-05, "loss": 2.2671, "step": 91912 }, { "epoch": 0.57, "learning_rate": 6.470345311755481e-05, "loss": 2.2677, "step": 91920 }, { "epoch": 0.57, "learning_rate": 6.469718997581194e-05, "loss": 2.265, "step": 91928 }, { "epoch": 0.57, "learning_rate": 6.46909267172964e-05, "loss": 2.253, "step": 91936 }, { "epoch": 0.57, "learning_rate": 6.468466334216389e-05, "loss": 2.2556, "step": 91944 }, { "epoch": 0.57, "learning_rate": 6.467839985057014e-05, "loss": 2.2702, "step": 91952 }, { "epoch": 0.57, "learning_rate": 6.467213624267081e-05, "loss": 2.2499, "step": 91960 }, { "epoch": 0.57, "learning_rate": 6.466587251862166e-05, "loss": 2.2737, "step": 91968 }, { "epoch": 0.57, "learning_rate": 6.465960867857842e-05, "loss": 2.2476, "step": 91976 }, { "epoch": 0.57, "learning_rate": 6.465334472269678e-05, "loss": 2.2559, "step": 91984 }, { "epoch": 0.57, "learning_rate": 6.464708065113244e-05, "loss": 2.2573, "step": 91992 }, { "epoch": 0.57, "learning_rate": 6.464081646404117e-05, "loss": 2.2727, "step": 92000 }, { "epoch": 0.58, "learning_rate": 6.463455216157869e-05, "loss": 2.2535, "step": 92008 }, { "epoch": 0.58, "learning_rate": 6.462828774390072e-05, "loss": 2.2541, "step": 92016 }, { "epoch": 0.58, "learning_rate": 6.462202321116299e-05, "loss": 2.2557, "step": 92024 }, { "epoch": 0.58, "learning_rate": 6.461575856352125e-05, "loss": 2.2548, "step": 92032 }, { "epoch": 0.58, "learning_rate": 6.460949380113124e-05, "loss": 2.2563, "step": 92040 }, { "epoch": 0.58, "learning_rate": 6.460322892414869e-05, "loss": 2.2596, "step": 92048 }, { "epoch": 0.58, "learning_rate": 6.459696393272935e-05, "loss": 2.2529, "step": 92056 }, { "epoch": 0.58, "learning_rate": 6.459069882702898e-05, "loss": 2.2592, "step": 92064 }, { "epoch": 0.58, "learning_rate": 6.45844336072033e-05, "loss": 2.2658, "step": 92072 }, { "epoch": 0.58, "learning_rate": 6.45781682734081e-05, "loss": 2.26, "step": 92080 }, { "epoch": 0.58, "learning_rate": 6.457190282579912e-05, "loss": 2.262, "step": 92088 }, { "epoch": 0.58, "learning_rate": 6.456563726453214e-05, "loss": 2.2519, "step": 92096 }, { "epoch": 0.58, "learning_rate": 6.455937158976288e-05, "loss": 2.263, "step": 92104 }, { "epoch": 0.58, "learning_rate": 6.455310580164715e-05, "loss": 2.2657, "step": 92112 }, { "epoch": 0.58, "learning_rate": 6.45468399003407e-05, "loss": 2.2758, "step": 92120 }, { "epoch": 0.58, "learning_rate": 6.454057388599928e-05, "loss": 2.258, "step": 92128 }, { "epoch": 0.58, "learning_rate": 6.45343077587787e-05, "loss": 2.2445, "step": 92136 }, { "epoch": 0.58, "learning_rate": 6.452804151883472e-05, "loss": 2.273, "step": 92144 }, { "epoch": 0.58, "learning_rate": 6.452177516632311e-05, "loss": 2.2591, "step": 92152 }, { "epoch": 0.58, "learning_rate": 6.451550870139966e-05, "loss": 2.251, "step": 92160 }, { "epoch": 0.58, "learning_rate": 6.450924212422018e-05, "loss": 2.2539, "step": 92168 }, { "epoch": 0.58, "learning_rate": 6.450297543494042e-05, "loss": 2.2845, "step": 92176 }, { "epoch": 0.58, "learning_rate": 6.449670863371619e-05, "loss": 2.2644, "step": 92184 }, { "epoch": 0.58, "learning_rate": 6.449044172070327e-05, "loss": 2.2863, "step": 92192 }, { "epoch": 0.58, "learning_rate": 6.448417469605748e-05, "loss": 2.2655, "step": 92200 }, { "epoch": 0.58, "learning_rate": 6.447790755993458e-05, "loss": 2.2621, "step": 92208 }, { "epoch": 0.58, "learning_rate": 6.447164031249041e-05, "loss": 2.2693, "step": 92216 }, { "epoch": 0.58, "learning_rate": 6.446537295388076e-05, "loss": 2.2672, "step": 92224 }, { "epoch": 0.58, "learning_rate": 6.445910548426144e-05, "loss": 2.2695, "step": 92232 }, { "epoch": 0.58, "learning_rate": 6.445283790378826e-05, "loss": 2.2714, "step": 92240 }, { "epoch": 0.58, "learning_rate": 6.444657021261702e-05, "loss": 2.2527, "step": 92248 }, { "epoch": 0.58, "learning_rate": 6.444030241090354e-05, "loss": 2.2721, "step": 92256 }, { "epoch": 0.58, "learning_rate": 6.443403449880366e-05, "loss": 2.2471, "step": 92264 }, { "epoch": 0.58, "learning_rate": 6.442776647647318e-05, "loss": 2.2683, "step": 92272 }, { "epoch": 0.58, "learning_rate": 6.442149834406791e-05, "loss": 2.2676, "step": 92280 }, { "epoch": 0.58, "learning_rate": 6.441523010174373e-05, "loss": 2.259, "step": 92288 }, { "epoch": 0.58, "learning_rate": 6.44089617496564e-05, "loss": 2.2781, "step": 92296 }, { "epoch": 0.58, "learning_rate": 6.440269328796183e-05, "loss": 2.2472, "step": 92304 }, { "epoch": 0.58, "learning_rate": 6.439642471681576e-05, "loss": 2.2544, "step": 92312 }, { "epoch": 0.58, "learning_rate": 6.43901560363741e-05, "loss": 2.2435, "step": 92320 }, { "epoch": 0.58, "learning_rate": 6.43838872467927e-05, "loss": 2.2627, "step": 92328 }, { "epoch": 0.58, "learning_rate": 6.437761834822731e-05, "loss": 2.259, "step": 92336 }, { "epoch": 0.58, "learning_rate": 6.437134934083389e-05, "loss": 2.267, "step": 92344 }, { "epoch": 0.58, "learning_rate": 6.436508022476819e-05, "loss": 2.2525, "step": 92352 }, { "epoch": 0.58, "learning_rate": 6.435881100018615e-05, "loss": 2.2419, "step": 92360 }, { "epoch": 0.58, "learning_rate": 6.435254166724354e-05, "loss": 2.2604, "step": 92368 }, { "epoch": 0.58, "learning_rate": 6.434627222609628e-05, "loss": 2.2699, "step": 92376 }, { "epoch": 0.58, "learning_rate": 6.434000267690022e-05, "loss": 2.2584, "step": 92384 }, { "epoch": 0.58, "learning_rate": 6.433373301981119e-05, "loss": 2.2637, "step": 92392 }, { "epoch": 0.58, "learning_rate": 6.432746325498504e-05, "loss": 2.2513, "step": 92400 }, { "epoch": 0.58, "learning_rate": 6.432119338257769e-05, "loss": 2.2522, "step": 92408 }, { "epoch": 0.58, "learning_rate": 6.431492340274501e-05, "loss": 2.2542, "step": 92416 }, { "epoch": 0.58, "learning_rate": 6.430865331564283e-05, "loss": 2.2665, "step": 92424 }, { "epoch": 0.58, "learning_rate": 6.430238312142703e-05, "loss": 2.2506, "step": 92432 }, { "epoch": 0.58, "learning_rate": 6.429611282025354e-05, "loss": 2.2626, "step": 92440 }, { "epoch": 0.58, "learning_rate": 6.428984241227818e-05, "loss": 2.2513, "step": 92448 }, { "epoch": 0.58, "learning_rate": 6.428357189765686e-05, "loss": 2.2664, "step": 92456 }, { "epoch": 0.58, "learning_rate": 6.427730127654545e-05, "loss": 2.2445, "step": 92464 }, { "epoch": 0.58, "learning_rate": 6.427103054909987e-05, "loss": 2.2516, "step": 92472 }, { "epoch": 0.58, "learning_rate": 6.426475971547599e-05, "loss": 2.2583, "step": 92480 }, { "epoch": 0.58, "learning_rate": 6.42584887758297e-05, "loss": 2.2459, "step": 92488 }, { "epoch": 0.58, "learning_rate": 6.425221773031688e-05, "loss": 2.2578, "step": 92496 }, { "epoch": 0.58, "learning_rate": 6.424594657909349e-05, "loss": 2.2714, "step": 92504 }, { "epoch": 0.58, "learning_rate": 6.423967532231537e-05, "loss": 2.2458, "step": 92512 }, { "epoch": 0.58, "learning_rate": 6.423340396013844e-05, "loss": 2.2482, "step": 92520 }, { "epoch": 0.58, "learning_rate": 6.422713249271861e-05, "loss": 2.2586, "step": 92528 }, { "epoch": 0.58, "learning_rate": 6.42208609202118e-05, "loss": 2.254, "step": 92536 }, { "epoch": 0.58, "learning_rate": 6.421458924277392e-05, "loss": 2.2448, "step": 92544 }, { "epoch": 0.58, "learning_rate": 6.420831746056087e-05, "loss": 2.2492, "step": 92552 }, { "epoch": 0.58, "learning_rate": 6.42020455737286e-05, "loss": 2.2511, "step": 92560 }, { "epoch": 0.58, "learning_rate": 6.419577358243297e-05, "loss": 2.2636, "step": 92568 }, { "epoch": 0.58, "learning_rate": 6.418950148682996e-05, "loss": 2.2476, "step": 92576 }, { "epoch": 0.58, "learning_rate": 6.418322928707547e-05, "loss": 2.2542, "step": 92584 }, { "epoch": 0.58, "learning_rate": 6.417695698332542e-05, "loss": 2.2439, "step": 92592 }, { "epoch": 0.58, "learning_rate": 6.417068457573576e-05, "loss": 2.2426, "step": 92600 }, { "epoch": 0.58, "learning_rate": 6.416441206446242e-05, "loss": 2.2564, "step": 92608 }, { "epoch": 0.58, "learning_rate": 6.415813944966131e-05, "loss": 2.2429, "step": 92616 }, { "epoch": 0.58, "learning_rate": 6.41518667314884e-05, "loss": 2.2496, "step": 92624 }, { "epoch": 0.58, "learning_rate": 6.414559391009962e-05, "loss": 2.2456, "step": 92632 }, { "epoch": 0.58, "learning_rate": 6.41393209856509e-05, "loss": 2.2406, "step": 92640 }, { "epoch": 0.58, "learning_rate": 6.41330479582982e-05, "loss": 2.2536, "step": 92648 }, { "epoch": 0.58, "learning_rate": 6.412677482819747e-05, "loss": 2.2678, "step": 92656 }, { "epoch": 0.58, "learning_rate": 6.412050159550465e-05, "loss": 2.2784, "step": 92664 }, { "epoch": 0.58, "learning_rate": 6.411422826037569e-05, "loss": 2.262, "step": 92672 }, { "epoch": 0.58, "learning_rate": 6.410795482296657e-05, "loss": 2.2598, "step": 92680 }, { "epoch": 0.58, "learning_rate": 6.410168128343321e-05, "loss": 2.2632, "step": 92688 }, { "epoch": 0.58, "learning_rate": 6.409540764193162e-05, "loss": 2.2733, "step": 92696 }, { "epoch": 0.58, "learning_rate": 6.408913389861773e-05, "loss": 2.2506, "step": 92704 }, { "epoch": 0.58, "learning_rate": 6.408286005364748e-05, "loss": 2.2571, "step": 92712 }, { "epoch": 0.58, "learning_rate": 6.407658610717691e-05, "loss": 2.2654, "step": 92720 }, { "epoch": 0.58, "learning_rate": 6.407031205936194e-05, "loss": 2.2551, "step": 92728 }, { "epoch": 0.58, "learning_rate": 6.406403791035854e-05, "loss": 2.2564, "step": 92736 }, { "epoch": 0.58, "learning_rate": 6.405776366032272e-05, "loss": 2.2469, "step": 92744 }, { "epoch": 0.58, "learning_rate": 6.405148930941045e-05, "loss": 2.2706, "step": 92752 }, { "epoch": 0.58, "learning_rate": 6.404521485777768e-05, "loss": 2.2557, "step": 92760 }, { "epoch": 0.58, "learning_rate": 6.403894030558041e-05, "loss": 2.2528, "step": 92768 }, { "epoch": 0.58, "learning_rate": 6.403266565297465e-05, "loss": 2.2461, "step": 92776 }, { "epoch": 0.58, "learning_rate": 6.402639090011635e-05, "loss": 2.2598, "step": 92784 }, { "epoch": 0.58, "learning_rate": 6.402011604716155e-05, "loss": 2.2505, "step": 92792 }, { "epoch": 0.58, "learning_rate": 6.401384109426617e-05, "loss": 2.2397, "step": 92800 }, { "epoch": 0.58, "learning_rate": 6.40075660415863e-05, "loss": 2.2677, "step": 92808 }, { "epoch": 0.58, "learning_rate": 6.400129088927786e-05, "loss": 2.2451, "step": 92816 }, { "epoch": 0.58, "learning_rate": 6.399501563749689e-05, "loss": 2.2598, "step": 92824 }, { "epoch": 0.58, "learning_rate": 6.398874028639937e-05, "loss": 2.2551, "step": 92832 }, { "epoch": 0.58, "learning_rate": 6.398246483614132e-05, "loss": 2.2553, "step": 92840 }, { "epoch": 0.58, "learning_rate": 6.397618928687876e-05, "loss": 2.2662, "step": 92848 }, { "epoch": 0.58, "learning_rate": 6.396991363876769e-05, "loss": 2.2481, "step": 92856 }, { "epoch": 0.58, "learning_rate": 6.39636378919641e-05, "loss": 2.2483, "step": 92864 }, { "epoch": 0.58, "learning_rate": 6.395736204662406e-05, "loss": 2.2477, "step": 92872 }, { "epoch": 0.58, "learning_rate": 6.395108610290352e-05, "loss": 2.2438, "step": 92880 }, { "epoch": 0.58, "learning_rate": 6.394481006095856e-05, "loss": 2.2362, "step": 92888 }, { "epoch": 0.58, "learning_rate": 6.393853392094516e-05, "loss": 2.2562, "step": 92896 }, { "epoch": 0.58, "learning_rate": 6.393225768301938e-05, "loss": 2.2567, "step": 92904 }, { "epoch": 0.58, "learning_rate": 6.392598134733724e-05, "loss": 2.246, "step": 92912 }, { "epoch": 0.58, "learning_rate": 6.391970491405475e-05, "loss": 2.2557, "step": 92920 }, { "epoch": 0.58, "learning_rate": 6.391342838332795e-05, "loss": 2.2399, "step": 92928 }, { "epoch": 0.58, "learning_rate": 6.390715175531289e-05, "loss": 2.268, "step": 92936 }, { "epoch": 0.58, "learning_rate": 6.39008750301656e-05, "loss": 2.2422, "step": 92944 }, { "epoch": 0.58, "learning_rate": 6.389459820804214e-05, "loss": 2.2472, "step": 92952 }, { "epoch": 0.58, "learning_rate": 6.388832128909848e-05, "loss": 2.2588, "step": 92960 }, { "epoch": 0.58, "learning_rate": 6.388204427349075e-05, "loss": 2.2472, "step": 92968 }, { "epoch": 0.58, "learning_rate": 6.387576716137496e-05, "loss": 2.2585, "step": 92976 }, { "epoch": 0.58, "learning_rate": 6.386948995290718e-05, "loss": 2.2456, "step": 92984 }, { "epoch": 0.58, "learning_rate": 6.386321264824342e-05, "loss": 2.2468, "step": 92992 }, { "epoch": 0.58, "learning_rate": 6.385693524753978e-05, "loss": 2.2618, "step": 93000 }, { "epoch": 0.58, "learning_rate": 6.385065775095229e-05, "loss": 2.2501, "step": 93008 }, { "epoch": 0.58, "learning_rate": 6.384438015863701e-05, "loss": 2.2313, "step": 93016 }, { "epoch": 0.58, "learning_rate": 6.383810247074999e-05, "loss": 2.2444, "step": 93024 }, { "epoch": 0.58, "learning_rate": 6.383182468744735e-05, "loss": 2.2472, "step": 93032 }, { "epoch": 0.58, "learning_rate": 6.38255468088851e-05, "loss": 2.2561, "step": 93040 }, { "epoch": 0.58, "learning_rate": 6.381926883521931e-05, "loss": 2.2559, "step": 93048 }, { "epoch": 0.58, "learning_rate": 6.381299076660609e-05, "loss": 2.2648, "step": 93056 }, { "epoch": 0.58, "learning_rate": 6.38067126032015e-05, "loss": 2.2468, "step": 93064 }, { "epoch": 0.58, "learning_rate": 6.380043434516158e-05, "loss": 2.2597, "step": 93072 }, { "epoch": 0.58, "learning_rate": 6.379415599264247e-05, "loss": 2.2305, "step": 93080 }, { "epoch": 0.58, "learning_rate": 6.37878775458002e-05, "loss": 2.2346, "step": 93088 }, { "epoch": 0.58, "learning_rate": 6.378159900479086e-05, "loss": 2.2535, "step": 93096 }, { "epoch": 0.58, "learning_rate": 6.377532036977055e-05, "loss": 2.2288, "step": 93104 }, { "epoch": 0.58, "learning_rate": 6.376904164089534e-05, "loss": 2.2459, "step": 93112 }, { "epoch": 0.58, "learning_rate": 6.376276281832136e-05, "loss": 2.2645, "step": 93120 }, { "epoch": 0.58, "learning_rate": 6.375648390220466e-05, "loss": 2.2575, "step": 93128 }, { "epoch": 0.58, "learning_rate": 6.375020489270133e-05, "loss": 2.2434, "step": 93136 }, { "epoch": 0.58, "learning_rate": 6.374392578996752e-05, "loss": 2.2589, "step": 93144 }, { "epoch": 0.58, "learning_rate": 6.373764659415927e-05, "loss": 2.2565, "step": 93152 }, { "epoch": 0.58, "learning_rate": 6.373136730543272e-05, "loss": 2.2468, "step": 93160 }, { "epoch": 0.58, "learning_rate": 6.372508792394395e-05, "loss": 2.2593, "step": 93168 }, { "epoch": 0.58, "learning_rate": 6.371880844984907e-05, "loss": 2.2508, "step": 93176 }, { "epoch": 0.58, "learning_rate": 6.371252888330422e-05, "loss": 2.2377, "step": 93184 }, { "epoch": 0.58, "learning_rate": 6.370624922446548e-05, "loss": 2.2505, "step": 93192 }, { "epoch": 0.58, "learning_rate": 6.369996947348896e-05, "loss": 2.2394, "step": 93200 }, { "epoch": 0.58, "learning_rate": 6.369368963053077e-05, "loss": 2.2491, "step": 93208 }, { "epoch": 0.58, "learning_rate": 6.368740969574707e-05, "loss": 2.2526, "step": 93216 }, { "epoch": 0.58, "learning_rate": 6.368112966929394e-05, "loss": 2.2539, "step": 93224 }, { "epoch": 0.58, "learning_rate": 6.36748495513275e-05, "loss": 2.2551, "step": 93232 }, { "epoch": 0.58, "learning_rate": 6.36685693420039e-05, "loss": 2.2473, "step": 93240 }, { "epoch": 0.58, "learning_rate": 6.366228904147924e-05, "loss": 2.262, "step": 93248 }, { "epoch": 0.58, "learning_rate": 6.365600864990969e-05, "loss": 2.2509, "step": 93256 }, { "epoch": 0.58, "learning_rate": 6.364972816745134e-05, "loss": 2.25, "step": 93264 }, { "epoch": 0.58, "learning_rate": 6.364344759426033e-05, "loss": 2.2445, "step": 93272 }, { "epoch": 0.58, "learning_rate": 6.363716693049281e-05, "loss": 2.2487, "step": 93280 }, { "epoch": 0.58, "learning_rate": 6.363088617630492e-05, "loss": 2.2505, "step": 93288 }, { "epoch": 0.58, "learning_rate": 6.362460533185278e-05, "loss": 2.2415, "step": 93296 }, { "epoch": 0.58, "learning_rate": 6.361832439729256e-05, "loss": 2.2565, "step": 93304 }, { "epoch": 0.58, "learning_rate": 6.361204337278037e-05, "loss": 2.2428, "step": 93312 }, { "epoch": 0.58, "learning_rate": 6.36057622584724e-05, "loss": 2.241, "step": 93320 }, { "epoch": 0.58, "learning_rate": 6.359948105452476e-05, "loss": 2.2369, "step": 93328 }, { "epoch": 0.58, "learning_rate": 6.359319976109361e-05, "loss": 2.255, "step": 93336 }, { "epoch": 0.58, "learning_rate": 6.358691837833513e-05, "loss": 2.2408, "step": 93344 }, { "epoch": 0.58, "learning_rate": 6.358063690640546e-05, "loss": 2.2535, "step": 93352 }, { "epoch": 0.58, "learning_rate": 6.357435534546072e-05, "loss": 2.2567, "step": 93360 }, { "epoch": 0.58, "learning_rate": 6.356807369565713e-05, "loss": 2.2423, "step": 93368 }, { "epoch": 0.58, "learning_rate": 6.356179195715083e-05, "loss": 2.259, "step": 93376 }, { "epoch": 0.58, "learning_rate": 6.355551013009798e-05, "loss": 2.235, "step": 93384 }, { "epoch": 0.58, "learning_rate": 6.354922821465475e-05, "loss": 2.2474, "step": 93392 }, { "epoch": 0.58, "learning_rate": 6.35429462109773e-05, "loss": 2.2509, "step": 93400 }, { "epoch": 0.58, "learning_rate": 6.353666411922181e-05, "loss": 2.2557, "step": 93408 }, { "epoch": 0.58, "learning_rate": 6.353038193954445e-05, "loss": 2.2517, "step": 93416 }, { "epoch": 0.58, "learning_rate": 6.352409967210142e-05, "loss": 2.2283, "step": 93424 }, { "epoch": 0.58, "learning_rate": 6.351781731704886e-05, "loss": 2.2407, "step": 93432 }, { "epoch": 0.58, "learning_rate": 6.351153487454298e-05, "loss": 2.2543, "step": 93440 }, { "epoch": 0.58, "learning_rate": 6.350525234473993e-05, "loss": 2.2546, "step": 93448 }, { "epoch": 0.58, "learning_rate": 6.349896972779591e-05, "loss": 2.2438, "step": 93456 }, { "epoch": 0.58, "learning_rate": 6.349268702386713e-05, "loss": 2.2495, "step": 93464 }, { "epoch": 0.58, "learning_rate": 6.348640423310976e-05, "loss": 2.2473, "step": 93472 }, { "epoch": 0.58, "learning_rate": 6.348012135567999e-05, "loss": 2.2201, "step": 93480 }, { "epoch": 0.58, "learning_rate": 6.3473838391734e-05, "loss": 2.228, "step": 93488 }, { "epoch": 0.58, "learning_rate": 6.3467555341428e-05, "loss": 2.2517, "step": 93496 }, { "epoch": 0.58, "learning_rate": 6.346127220491817e-05, "loss": 2.2491, "step": 93504 }, { "epoch": 0.58, "learning_rate": 6.345498898236076e-05, "loss": 2.2398, "step": 93512 }, { "epoch": 0.58, "learning_rate": 6.344870567391193e-05, "loss": 2.2496, "step": 93520 }, { "epoch": 0.58, "learning_rate": 6.344242227972786e-05, "loss": 2.2526, "step": 93528 }, { "epoch": 0.58, "learning_rate": 6.343613879996482e-05, "loss": 2.262, "step": 93536 }, { "epoch": 0.58, "learning_rate": 6.342985523477896e-05, "loss": 2.2483, "step": 93544 }, { "epoch": 0.58, "learning_rate": 6.342357158432652e-05, "loss": 2.2409, "step": 93552 }, { "epoch": 0.58, "learning_rate": 6.341728784876371e-05, "loss": 2.2528, "step": 93560 }, { "epoch": 0.58, "learning_rate": 6.341100402824674e-05, "loss": 2.2512, "step": 93568 }, { "epoch": 0.58, "learning_rate": 6.340472012293182e-05, "loss": 2.2382, "step": 93576 }, { "epoch": 0.58, "learning_rate": 6.339843613297519e-05, "loss": 2.248, "step": 93584 }, { "epoch": 0.58, "learning_rate": 6.339215205853303e-05, "loss": 2.2456, "step": 93592 }, { "epoch": 0.58, "learning_rate": 6.338586789976161e-05, "loss": 2.2446, "step": 93600 }, { "epoch": 0.59, "learning_rate": 6.337958365681715e-05, "loss": 2.2424, "step": 93608 }, { "epoch": 0.59, "learning_rate": 6.337329932985583e-05, "loss": 2.2385, "step": 93616 }, { "epoch": 0.59, "learning_rate": 6.336701491903392e-05, "loss": 2.2684, "step": 93624 }, { "epoch": 0.59, "learning_rate": 6.336073042450765e-05, "loss": 2.2276, "step": 93632 }, { "epoch": 0.59, "learning_rate": 6.335444584643324e-05, "loss": 2.2486, "step": 93640 }, { "epoch": 0.59, "learning_rate": 6.334816118496691e-05, "loss": 2.2474, "step": 93648 }, { "epoch": 0.59, "learning_rate": 6.334187644026494e-05, "loss": 2.2491, "step": 93656 }, { "epoch": 0.59, "learning_rate": 6.333559161248355e-05, "loss": 2.2667, "step": 93664 }, { "epoch": 0.59, "learning_rate": 6.332930670177897e-05, "loss": 2.2543, "step": 93672 }, { "epoch": 0.59, "learning_rate": 6.332302170830745e-05, "loss": 2.2524, "step": 93680 }, { "epoch": 0.59, "learning_rate": 6.331673663222523e-05, "loss": 2.2562, "step": 93688 }, { "epoch": 0.59, "learning_rate": 6.33104514736886e-05, "loss": 2.2582, "step": 93696 }, { "epoch": 0.59, "learning_rate": 6.330416623285374e-05, "loss": 2.2364, "step": 93704 }, { "epoch": 0.59, "learning_rate": 6.329788090987695e-05, "loss": 2.2747, "step": 93712 }, { "epoch": 0.59, "learning_rate": 6.329159550491446e-05, "loss": 2.2521, "step": 93720 }, { "epoch": 0.59, "learning_rate": 6.328531001812254e-05, "loss": 2.2511, "step": 93728 }, { "epoch": 0.59, "learning_rate": 6.327902444965746e-05, "loss": 2.2419, "step": 93736 }, { "epoch": 0.59, "learning_rate": 6.327273879967545e-05, "loss": 2.2684, "step": 93744 }, { "epoch": 0.59, "learning_rate": 6.326645306833278e-05, "loss": 2.254, "step": 93752 }, { "epoch": 0.59, "learning_rate": 6.326016725578575e-05, "loss": 2.243, "step": 93760 }, { "epoch": 0.59, "learning_rate": 6.325388136219055e-05, "loss": 2.236, "step": 93768 }, { "epoch": 0.59, "learning_rate": 6.324759538770353e-05, "loss": 2.248, "step": 93776 }, { "epoch": 0.59, "learning_rate": 6.324130933248091e-05, "loss": 2.2535, "step": 93784 }, { "epoch": 0.59, "learning_rate": 6.3235023196679e-05, "loss": 2.2475, "step": 93792 }, { "epoch": 0.59, "learning_rate": 6.322873698045401e-05, "loss": 2.2689, "step": 93800 }, { "epoch": 0.59, "learning_rate": 6.322245068396229e-05, "loss": 2.2506, "step": 93808 }, { "epoch": 0.59, "learning_rate": 6.321616430736006e-05, "loss": 2.2612, "step": 93816 }, { "epoch": 0.59, "learning_rate": 6.320987785080364e-05, "loss": 2.2363, "step": 93824 }, { "epoch": 0.59, "learning_rate": 6.320359131444928e-05, "loss": 2.264, "step": 93832 }, { "epoch": 0.59, "learning_rate": 6.31973046984533e-05, "loss": 2.258, "step": 93840 }, { "epoch": 0.59, "learning_rate": 6.319101800297197e-05, "loss": 2.2696, "step": 93848 }, { "epoch": 0.59, "learning_rate": 6.318473122816155e-05, "loss": 2.2517, "step": 93856 }, { "epoch": 0.59, "learning_rate": 6.317844437417837e-05, "loss": 2.2577, "step": 93864 }, { "epoch": 0.59, "learning_rate": 6.31721574411787e-05, "loss": 2.2537, "step": 93872 }, { "epoch": 0.59, "learning_rate": 6.316587042931886e-05, "loss": 2.256, "step": 93880 }, { "epoch": 0.59, "learning_rate": 6.31595833387551e-05, "loss": 2.2648, "step": 93888 }, { "epoch": 0.59, "learning_rate": 6.315329616964377e-05, "loss": 2.2683, "step": 93896 }, { "epoch": 0.59, "learning_rate": 6.314700892214111e-05, "loss": 2.2627, "step": 93904 }, { "epoch": 0.59, "learning_rate": 6.314072159640347e-05, "loss": 2.2493, "step": 93912 }, { "epoch": 0.59, "learning_rate": 6.313443419258714e-05, "loss": 2.2511, "step": 93920 }, { "epoch": 0.59, "learning_rate": 6.312814671084844e-05, "loss": 2.2645, "step": 93928 }, { "epoch": 0.59, "learning_rate": 6.312185915134364e-05, "loss": 2.2522, "step": 93936 }, { "epoch": 0.59, "learning_rate": 6.311557151422908e-05, "loss": 2.2553, "step": 93944 }, { "epoch": 0.59, "learning_rate": 6.310928379966105e-05, "loss": 2.253, "step": 93952 }, { "epoch": 0.59, "learning_rate": 6.31029960077959e-05, "loss": 2.2386, "step": 93960 }, { "epoch": 0.59, "learning_rate": 6.309670813878992e-05, "loss": 2.2608, "step": 93968 }, { "epoch": 0.59, "learning_rate": 6.30904201927994e-05, "loss": 2.2523, "step": 93976 }, { "epoch": 0.59, "learning_rate": 6.30841321699807e-05, "loss": 2.253, "step": 93984 }, { "epoch": 0.59, "learning_rate": 6.307784407049013e-05, "loss": 2.256, "step": 93992 }, { "epoch": 0.59, "learning_rate": 6.307155589448403e-05, "loss": 2.2509, "step": 94000 }, { "epoch": 0.59, "learning_rate": 6.306526764211868e-05, "loss": 2.2384, "step": 94008 }, { "epoch": 0.59, "learning_rate": 6.305897931355042e-05, "loss": 2.2635, "step": 94016 }, { "epoch": 0.59, "learning_rate": 6.305269090893565e-05, "loss": 2.2454, "step": 94024 }, { "epoch": 0.59, "learning_rate": 6.304640242843058e-05, "loss": 2.264, "step": 94032 }, { "epoch": 0.59, "learning_rate": 6.304011387219164e-05, "loss": 2.27, "step": 94040 }, { "epoch": 0.59, "learning_rate": 6.30338252403751e-05, "loss": 2.2672, "step": 94048 }, { "epoch": 0.59, "learning_rate": 6.302753653313735e-05, "loss": 2.2671, "step": 94056 }, { "epoch": 0.59, "learning_rate": 6.30212477506347e-05, "loss": 2.2574, "step": 94064 }, { "epoch": 0.59, "learning_rate": 6.301495889302347e-05, "loss": 2.2688, "step": 94072 }, { "epoch": 0.59, "learning_rate": 6.300866996046004e-05, "loss": 2.2559, "step": 94080 }, { "epoch": 0.59, "learning_rate": 6.300238095310073e-05, "loss": 2.2616, "step": 94088 }, { "epoch": 0.59, "learning_rate": 6.299609187110192e-05, "loss": 2.2536, "step": 94096 }, { "epoch": 0.59, "learning_rate": 6.298980271461989e-05, "loss": 2.2449, "step": 94104 }, { "epoch": 0.59, "learning_rate": 6.298351348381104e-05, "loss": 2.2375, "step": 94112 }, { "epoch": 0.59, "learning_rate": 6.297722417883171e-05, "loss": 2.2453, "step": 94120 }, { "epoch": 0.59, "learning_rate": 6.297093479983827e-05, "loss": 2.2383, "step": 94128 }, { "epoch": 0.59, "learning_rate": 6.296464534698705e-05, "loss": 2.2312, "step": 94136 }, { "epoch": 0.59, "learning_rate": 6.295835582043441e-05, "loss": 2.261, "step": 94144 }, { "epoch": 0.59, "learning_rate": 6.295206622033671e-05, "loss": 2.2603, "step": 94152 }, { "epoch": 0.59, "learning_rate": 6.294577654685032e-05, "loss": 2.2583, "step": 94160 }, { "epoch": 0.59, "learning_rate": 6.293948680013159e-05, "loss": 2.261, "step": 94168 }, { "epoch": 0.59, "learning_rate": 6.293319698033688e-05, "loss": 2.2491, "step": 94176 }, { "epoch": 0.59, "learning_rate": 6.292690708762258e-05, "loss": 2.2589, "step": 94184 }, { "epoch": 0.59, "learning_rate": 6.292061712214504e-05, "loss": 2.2706, "step": 94192 }, { "epoch": 0.59, "learning_rate": 6.291432708406062e-05, "loss": 2.2603, "step": 94200 }, { "epoch": 0.59, "learning_rate": 6.29080369735257e-05, "loss": 2.2655, "step": 94208 }, { "epoch": 0.59, "learning_rate": 6.290174679069666e-05, "loss": 2.258, "step": 94216 }, { "epoch": 0.59, "learning_rate": 6.289545653572987e-05, "loss": 2.2664, "step": 94224 }, { "epoch": 0.59, "learning_rate": 6.288916620878171e-05, "loss": 2.2674, "step": 94232 }, { "epoch": 0.59, "learning_rate": 6.288287581000855e-05, "loss": 2.2552, "step": 94240 }, { "epoch": 0.59, "learning_rate": 6.287658533956677e-05, "loss": 2.2594, "step": 94248 }, { "epoch": 0.59, "learning_rate": 6.287029479761277e-05, "loss": 2.2585, "step": 94256 }, { "epoch": 0.59, "learning_rate": 6.286400418430291e-05, "loss": 2.2599, "step": 94264 }, { "epoch": 0.59, "learning_rate": 6.285771349979359e-05, "loss": 2.2539, "step": 94272 }, { "epoch": 0.59, "learning_rate": 6.285142274424118e-05, "loss": 2.2608, "step": 94280 }, { "epoch": 0.59, "learning_rate": 6.284513191780208e-05, "loss": 2.276, "step": 94288 }, { "epoch": 0.59, "learning_rate": 6.283884102063269e-05, "loss": 2.2591, "step": 94296 }, { "epoch": 0.59, "learning_rate": 6.283255005288938e-05, "loss": 2.2593, "step": 94304 }, { "epoch": 0.59, "learning_rate": 6.282625901472858e-05, "loss": 2.2524, "step": 94312 }, { "epoch": 0.59, "learning_rate": 6.281996790630667e-05, "loss": 2.251, "step": 94320 }, { "epoch": 0.59, "learning_rate": 6.281367672778e-05, "loss": 2.2612, "step": 94328 }, { "epoch": 0.59, "learning_rate": 6.280738547930505e-05, "loss": 2.2544, "step": 94336 }, { "epoch": 0.59, "learning_rate": 6.280109416103815e-05, "loss": 2.2661, "step": 94344 }, { "epoch": 0.59, "learning_rate": 6.279480277313576e-05, "loss": 2.2536, "step": 94352 }, { "epoch": 0.59, "learning_rate": 6.278851131575425e-05, "loss": 2.2579, "step": 94360 }, { "epoch": 0.59, "learning_rate": 6.278221978905003e-05, "loss": 2.2485, "step": 94368 }, { "epoch": 0.59, "learning_rate": 6.277592819317952e-05, "loss": 2.2549, "step": 94376 }, { "epoch": 0.59, "learning_rate": 6.276963652829914e-05, "loss": 2.2625, "step": 94384 }, { "epoch": 0.59, "learning_rate": 6.276334479456526e-05, "loss": 2.2309, "step": 94392 }, { "epoch": 0.59, "learning_rate": 6.275705299213433e-05, "loss": 2.2486, "step": 94400 }, { "epoch": 0.59, "learning_rate": 6.275076112116277e-05, "loss": 2.2616, "step": 94408 }, { "epoch": 0.59, "learning_rate": 6.274446918180694e-05, "loss": 2.2363, "step": 94416 }, { "epoch": 0.59, "learning_rate": 6.273817717422333e-05, "loss": 2.2449, "step": 94424 }, { "epoch": 0.59, "learning_rate": 6.273188509856831e-05, "loss": 2.2449, "step": 94432 }, { "epoch": 0.59, "learning_rate": 6.272559295499834e-05, "loss": 2.2576, "step": 94440 }, { "epoch": 0.59, "learning_rate": 6.27193007436698e-05, "loss": 2.251, "step": 94448 }, { "epoch": 0.59, "learning_rate": 6.271300846473916e-05, "loss": 2.2468, "step": 94456 }, { "epoch": 0.59, "learning_rate": 6.27067161183628e-05, "loss": 2.2487, "step": 94464 }, { "epoch": 0.59, "learning_rate": 6.27004237046972e-05, "loss": 2.2437, "step": 94472 }, { "epoch": 0.59, "learning_rate": 6.269413122389875e-05, "loss": 2.2554, "step": 94480 }, { "epoch": 0.59, "learning_rate": 6.268783867612389e-05, "loss": 2.2517, "step": 94488 }, { "epoch": 0.59, "learning_rate": 6.268154606152908e-05, "loss": 2.2466, "step": 94496 }, { "epoch": 0.59, "learning_rate": 6.267525338027071e-05, "loss": 2.2625, "step": 94504 }, { "epoch": 0.59, "learning_rate": 6.266896063250524e-05, "loss": 2.2394, "step": 94512 }, { "epoch": 0.59, "learning_rate": 6.266266781838912e-05, "loss": 2.2443, "step": 94520 }, { "epoch": 0.59, "learning_rate": 6.265637493807878e-05, "loss": 2.2616, "step": 94528 }, { "epoch": 0.59, "learning_rate": 6.265008199173068e-05, "loss": 2.2368, "step": 94536 }, { "epoch": 0.59, "learning_rate": 6.26437889795012e-05, "loss": 2.2418, "step": 94544 }, { "epoch": 0.59, "learning_rate": 6.263749590154687e-05, "loss": 2.2532, "step": 94552 }, { "epoch": 0.59, "learning_rate": 6.263120275802408e-05, "loss": 2.249, "step": 94560 }, { "epoch": 0.59, "learning_rate": 6.26249095490893e-05, "loss": 2.2461, "step": 94568 }, { "epoch": 0.59, "learning_rate": 6.261861627489897e-05, "loss": 2.2368, "step": 94576 }, { "epoch": 0.59, "learning_rate": 6.261232293560953e-05, "loss": 2.2414, "step": 94584 }, { "epoch": 0.59, "learning_rate": 6.260602953137747e-05, "loss": 2.249, "step": 94592 }, { "epoch": 0.59, "learning_rate": 6.259973606235923e-05, "loss": 2.2408, "step": 94600 }, { "epoch": 0.59, "learning_rate": 6.259344252871123e-05, "loss": 2.247, "step": 94608 }, { "epoch": 0.59, "learning_rate": 6.258714893058999e-05, "loss": 2.2515, "step": 94616 }, { "epoch": 0.59, "learning_rate": 6.25808552681519e-05, "loss": 2.2538, "step": 94624 }, { "epoch": 0.59, "learning_rate": 6.25745615415535e-05, "loss": 2.2557, "step": 94632 }, { "epoch": 0.59, "learning_rate": 6.256826775095117e-05, "loss": 2.2493, "step": 94640 }, { "epoch": 0.59, "learning_rate": 6.256197389650145e-05, "loss": 2.2646, "step": 94648 }, { "epoch": 0.59, "learning_rate": 6.255567997836075e-05, "loss": 2.2464, "step": 94656 }, { "epoch": 0.59, "learning_rate": 6.254938599668557e-05, "loss": 2.2553, "step": 94664 }, { "epoch": 0.59, "learning_rate": 6.254309195163237e-05, "loss": 2.2657, "step": 94672 }, { "epoch": 0.59, "learning_rate": 6.253679784335762e-05, "loss": 2.2669, "step": 94680 }, { "epoch": 0.59, "learning_rate": 6.253050367201778e-05, "loss": 2.2379, "step": 94688 }, { "epoch": 0.59, "learning_rate": 6.252420943776933e-05, "loss": 2.2481, "step": 94696 }, { "epoch": 0.59, "learning_rate": 6.251791514076877e-05, "loss": 2.2508, "step": 94704 }, { "epoch": 0.59, "learning_rate": 6.251162078117255e-05, "loss": 2.253, "step": 94712 }, { "epoch": 0.59, "learning_rate": 6.250532635913716e-05, "loss": 2.2483, "step": 94720 }, { "epoch": 0.59, "learning_rate": 6.249903187481905e-05, "loss": 2.2543, "step": 94728 }, { "epoch": 0.59, "learning_rate": 6.249273732837474e-05, "loss": 2.2578, "step": 94736 }, { "epoch": 0.59, "learning_rate": 6.248644271996072e-05, "loss": 2.2522, "step": 94744 }, { "epoch": 0.59, "learning_rate": 6.248014804973343e-05, "loss": 2.2456, "step": 94752 }, { "epoch": 0.59, "learning_rate": 6.247385331784939e-05, "loss": 2.2521, "step": 94760 }, { "epoch": 0.59, "learning_rate": 6.246755852446509e-05, "loss": 2.2579, "step": 94768 }, { "epoch": 0.59, "learning_rate": 6.246126366973699e-05, "loss": 2.2459, "step": 94776 }, { "epoch": 0.59, "learning_rate": 6.245496875382162e-05, "loss": 2.2635, "step": 94784 }, { "epoch": 0.59, "learning_rate": 6.244867377687543e-05, "loss": 2.2589, "step": 94792 }, { "epoch": 0.59, "learning_rate": 6.244237873905494e-05, "loss": 2.2753, "step": 94800 }, { "epoch": 0.59, "learning_rate": 6.243608364051666e-05, "loss": 2.2642, "step": 94808 }, { "epoch": 0.59, "learning_rate": 6.242978848141705e-05, "loss": 2.2431, "step": 94816 }, { "epoch": 0.59, "learning_rate": 6.242349326191262e-05, "loss": 2.2491, "step": 94824 }, { "epoch": 0.59, "learning_rate": 6.241719798215988e-05, "loss": 2.2455, "step": 94832 }, { "epoch": 0.59, "learning_rate": 6.241090264231534e-05, "loss": 2.248, "step": 94840 }, { "epoch": 0.59, "learning_rate": 6.240460724253549e-05, "loss": 2.2448, "step": 94848 }, { "epoch": 0.59, "learning_rate": 6.239831178297682e-05, "loss": 2.2557, "step": 94856 }, { "epoch": 0.59, "learning_rate": 6.239201626379585e-05, "loss": 2.2554, "step": 94864 }, { "epoch": 0.59, "learning_rate": 6.23857206851491e-05, "loss": 2.2676, "step": 94872 }, { "epoch": 0.59, "learning_rate": 6.237942504719305e-05, "loss": 2.2433, "step": 94880 }, { "epoch": 0.59, "learning_rate": 6.237312935008424e-05, "loss": 2.2463, "step": 94888 }, { "epoch": 0.59, "learning_rate": 6.236683359397915e-05, "loss": 2.2657, "step": 94896 }, { "epoch": 0.59, "learning_rate": 6.236053777903435e-05, "loss": 2.2495, "step": 94904 }, { "epoch": 0.59, "learning_rate": 6.235424190540628e-05, "loss": 2.2567, "step": 94912 }, { "epoch": 0.59, "learning_rate": 6.234794597325149e-05, "loss": 2.2559, "step": 94920 }, { "epoch": 0.59, "learning_rate": 6.234164998272651e-05, "loss": 2.2524, "step": 94928 }, { "epoch": 0.59, "learning_rate": 6.233535393398786e-05, "loss": 2.2613, "step": 94936 }, { "epoch": 0.59, "learning_rate": 6.232905782719203e-05, "loss": 2.2503, "step": 94944 }, { "epoch": 0.59, "learning_rate": 6.232276166249557e-05, "loss": 2.2569, "step": 94952 }, { "epoch": 0.59, "learning_rate": 6.2316465440055e-05, "loss": 2.247, "step": 94960 }, { "epoch": 0.59, "learning_rate": 6.231016916002684e-05, "loss": 2.2503, "step": 94968 }, { "epoch": 0.59, "learning_rate": 6.230387282256762e-05, "loss": 2.2599, "step": 94976 }, { "epoch": 0.59, "learning_rate": 6.229757642783384e-05, "loss": 2.2443, "step": 94984 }, { "epoch": 0.59, "learning_rate": 6.229127997598206e-05, "loss": 2.2801, "step": 94992 }, { "epoch": 0.59, "learning_rate": 6.228498346716883e-05, "loss": 2.2639, "step": 95000 }, { "epoch": 0.59, "learning_rate": 6.227868690155062e-05, "loss": 2.2505, "step": 95008 }, { "epoch": 0.59, "learning_rate": 6.2272390279284e-05, "loss": 2.2382, "step": 95016 }, { "epoch": 0.59, "learning_rate": 6.226609360052553e-05, "loss": 2.2581, "step": 95024 }, { "epoch": 0.59, "learning_rate": 6.225979686543169e-05, "loss": 2.2678, "step": 95032 }, { "epoch": 0.59, "learning_rate": 6.225350007415906e-05, "loss": 2.2572, "step": 95040 }, { "epoch": 0.59, "learning_rate": 6.224720322686415e-05, "loss": 2.2562, "step": 95048 }, { "epoch": 0.59, "learning_rate": 6.224090632370355e-05, "loss": 2.254, "step": 95056 }, { "epoch": 0.59, "learning_rate": 6.223460936483374e-05, "loss": 2.2454, "step": 95064 }, { "epoch": 0.59, "learning_rate": 6.222831235041128e-05, "loss": 2.2434, "step": 95072 }, { "epoch": 0.59, "learning_rate": 6.222201528059276e-05, "loss": 2.255, "step": 95080 }, { "epoch": 0.59, "learning_rate": 6.221571815553466e-05, "loss": 2.255, "step": 95088 }, { "epoch": 0.59, "learning_rate": 6.220942097539358e-05, "loss": 2.2551, "step": 95096 }, { "epoch": 0.59, "learning_rate": 6.220312374032604e-05, "loss": 2.2627, "step": 95104 }, { "epoch": 0.59, "learning_rate": 6.219682645048858e-05, "loss": 2.2486, "step": 95112 }, { "epoch": 0.59, "learning_rate": 6.21905291060378e-05, "loss": 2.2446, "step": 95120 }, { "epoch": 0.59, "learning_rate": 6.21842317071302e-05, "loss": 2.251, "step": 95128 }, { "epoch": 0.59, "learning_rate": 6.217793425392235e-05, "loss": 2.2531, "step": 95136 }, { "epoch": 0.59, "learning_rate": 6.217163674657083e-05, "loss": 2.2471, "step": 95144 }, { "epoch": 0.59, "learning_rate": 6.216533918523216e-05, "loss": 2.2601, "step": 95152 }, { "epoch": 0.59, "learning_rate": 6.215904157006294e-05, "loss": 2.2512, "step": 95160 }, { "epoch": 0.59, "learning_rate": 6.215274390121966e-05, "loss": 2.2633, "step": 95168 }, { "epoch": 0.59, "learning_rate": 6.214644617885897e-05, "loss": 2.2552, "step": 95176 }, { "epoch": 0.59, "learning_rate": 6.214014840313734e-05, "loss": 2.2678, "step": 95184 }, { "epoch": 0.59, "learning_rate": 6.213385057421142e-05, "loss": 2.2405, "step": 95192 }, { "epoch": 0.59, "learning_rate": 6.212755269223772e-05, "loss": 2.2528, "step": 95200 }, { "epoch": 0.6, "learning_rate": 6.212125475737281e-05, "loss": 2.2475, "step": 95208 }, { "epoch": 0.6, "learning_rate": 6.211495676977331e-05, "loss": 2.2537, "step": 95216 }, { "epoch": 0.6, "learning_rate": 6.21086587295957e-05, "loss": 2.2585, "step": 95224 }, { "epoch": 0.6, "learning_rate": 6.210236063699662e-05, "loss": 2.2527, "step": 95232 }, { "epoch": 0.6, "learning_rate": 6.209606249213263e-05, "loss": 2.2428, "step": 95240 }, { "epoch": 0.6, "learning_rate": 6.208976429516026e-05, "loss": 2.2541, "step": 95248 }, { "epoch": 0.6, "learning_rate": 6.208346604623613e-05, "loss": 2.2636, "step": 95256 }, { "epoch": 0.6, "learning_rate": 6.20771677455168e-05, "loss": 2.2519, "step": 95264 }, { "epoch": 0.6, "learning_rate": 6.207086939315884e-05, "loss": 2.2569, "step": 95272 }, { "epoch": 0.6, "learning_rate": 6.206457098931886e-05, "loss": 2.2457, "step": 95280 }, { "epoch": 0.6, "learning_rate": 6.205827253415339e-05, "loss": 2.258, "step": 95288 }, { "epoch": 0.6, "learning_rate": 6.205197402781903e-05, "loss": 2.2484, "step": 95296 }, { "epoch": 0.6, "learning_rate": 6.20456754704724e-05, "loss": 2.2695, "step": 95304 }, { "epoch": 0.6, "learning_rate": 6.203937686227002e-05, "loss": 2.2469, "step": 95312 }, { "epoch": 0.6, "learning_rate": 6.20330782033685e-05, "loss": 2.2358, "step": 95320 }, { "epoch": 0.6, "learning_rate": 6.202677949392444e-05, "loss": 2.2774, "step": 95328 }, { "epoch": 0.6, "learning_rate": 6.202048073409441e-05, "loss": 2.2535, "step": 95336 }, { "epoch": 0.6, "learning_rate": 6.2014181924035e-05, "loss": 2.2611, "step": 95344 }, { "epoch": 0.6, "learning_rate": 6.20078830639028e-05, "loss": 2.2598, "step": 95352 }, { "epoch": 0.6, "learning_rate": 6.20015841538544e-05, "loss": 2.2441, "step": 95360 }, { "epoch": 0.6, "learning_rate": 6.19952851940464e-05, "loss": 2.2411, "step": 95368 }, { "epoch": 0.6, "learning_rate": 6.19889861846354e-05, "loss": 2.2484, "step": 95376 }, { "epoch": 0.6, "learning_rate": 6.198268712577795e-05, "loss": 2.2623, "step": 95384 }, { "epoch": 0.6, "learning_rate": 6.19763880176307e-05, "loss": 2.2453, "step": 95392 }, { "epoch": 0.6, "learning_rate": 6.197008886035021e-05, "loss": 2.2518, "step": 95400 }, { "epoch": 0.6, "learning_rate": 6.19637896540931e-05, "loss": 2.2305, "step": 95408 }, { "epoch": 0.6, "learning_rate": 6.195749039901595e-05, "loss": 2.2571, "step": 95416 }, { "epoch": 0.6, "learning_rate": 6.195119109527536e-05, "loss": 2.2524, "step": 95424 }, { "epoch": 0.6, "learning_rate": 6.194489174302796e-05, "loss": 2.2673, "step": 95432 }, { "epoch": 0.6, "learning_rate": 6.193859234243032e-05, "loss": 2.2638, "step": 95440 }, { "epoch": 0.6, "learning_rate": 6.193229289363906e-05, "loss": 2.2476, "step": 95448 }, { "epoch": 0.6, "learning_rate": 6.192599339681078e-05, "loss": 2.2643, "step": 95456 }, { "epoch": 0.6, "learning_rate": 6.19196938521021e-05, "loss": 2.2565, "step": 95464 }, { "epoch": 0.6, "learning_rate": 6.19133942596696e-05, "loss": 2.2513, "step": 95472 }, { "epoch": 0.6, "learning_rate": 6.19070946196699e-05, "loss": 2.2508, "step": 95480 }, { "epoch": 0.6, "learning_rate": 6.190079493225963e-05, "loss": 2.2492, "step": 95488 }, { "epoch": 0.6, "learning_rate": 6.189449519759539e-05, "loss": 2.2641, "step": 95496 }, { "epoch": 0.6, "learning_rate": 6.188819541583377e-05, "loss": 2.2528, "step": 95504 }, { "epoch": 0.6, "learning_rate": 6.18818955871314e-05, "loss": 2.2436, "step": 95512 }, { "epoch": 0.6, "learning_rate": 6.18755957116449e-05, "loss": 2.2525, "step": 95520 }, { "epoch": 0.6, "learning_rate": 6.186929578953088e-05, "loss": 2.2428, "step": 95528 }, { "epoch": 0.6, "learning_rate": 6.186299582094595e-05, "loss": 2.2463, "step": 95536 }, { "epoch": 0.6, "learning_rate": 6.185669580604674e-05, "loss": 2.256, "step": 95544 }, { "epoch": 0.6, "learning_rate": 6.185039574498988e-05, "loss": 2.2579, "step": 95552 }, { "epoch": 0.6, "learning_rate": 6.184409563793195e-05, "loss": 2.2382, "step": 95560 }, { "epoch": 0.6, "learning_rate": 6.18377954850296e-05, "loss": 2.2477, "step": 95568 }, { "epoch": 0.6, "learning_rate": 6.183149528643945e-05, "loss": 2.2569, "step": 95576 }, { "epoch": 0.6, "learning_rate": 6.182519504231814e-05, "loss": 2.2488, "step": 95584 }, { "epoch": 0.6, "learning_rate": 6.181889475282226e-05, "loss": 2.2597, "step": 95592 }, { "epoch": 0.6, "learning_rate": 6.181259441810845e-05, "loss": 2.2472, "step": 95600 }, { "epoch": 0.6, "learning_rate": 6.180629403833335e-05, "loss": 2.2448, "step": 95608 }, { "epoch": 0.6, "learning_rate": 6.179999361365356e-05, "loss": 2.2628, "step": 95616 }, { "epoch": 0.6, "learning_rate": 6.179369314422576e-05, "loss": 2.2461, "step": 95624 }, { "epoch": 0.6, "learning_rate": 6.178739263020651e-05, "loss": 2.2391, "step": 95632 }, { "epoch": 0.6, "learning_rate": 6.17810920717525e-05, "loss": 2.2244, "step": 95640 }, { "epoch": 0.6, "learning_rate": 6.177479146902034e-05, "loss": 2.2486, "step": 95648 }, { "epoch": 0.6, "learning_rate": 6.176849082216665e-05, "loss": 2.2437, "step": 95656 }, { "epoch": 0.6, "learning_rate": 6.17621901313481e-05, "loss": 2.2513, "step": 95664 }, { "epoch": 0.6, "learning_rate": 6.17558893967213e-05, "loss": 2.2352, "step": 95672 }, { "epoch": 0.6, "learning_rate": 6.174958861844287e-05, "loss": 2.2451, "step": 95680 }, { "epoch": 0.6, "learning_rate": 6.17432877966695e-05, "loss": 2.2373, "step": 95688 }, { "epoch": 0.6, "learning_rate": 6.173698693155778e-05, "loss": 2.2614, "step": 95696 }, { "epoch": 0.6, "learning_rate": 6.173068602326437e-05, "loss": 2.2566, "step": 95704 }, { "epoch": 0.6, "learning_rate": 6.172438507194592e-05, "loss": 2.2616, "step": 95712 }, { "epoch": 0.6, "learning_rate": 6.171808407775907e-05, "loss": 2.2566, "step": 95720 }, { "epoch": 0.6, "learning_rate": 6.171178304086044e-05, "loss": 2.2448, "step": 95728 }, { "epoch": 0.6, "learning_rate": 6.17054819614067e-05, "loss": 2.2409, "step": 95736 }, { "epoch": 0.6, "learning_rate": 6.16991808395545e-05, "loss": 2.256, "step": 95744 }, { "epoch": 0.6, "learning_rate": 6.169287967546046e-05, "loss": 2.2431, "step": 95752 }, { "epoch": 0.6, "learning_rate": 6.168657846928126e-05, "loss": 2.2715, "step": 95760 }, { "epoch": 0.6, "learning_rate": 6.168027722117351e-05, "loss": 2.247, "step": 95768 }, { "epoch": 0.6, "learning_rate": 6.167397593129389e-05, "loss": 2.2377, "step": 95776 }, { "epoch": 0.6, "learning_rate": 6.166767459979901e-05, "loss": 2.2518, "step": 95784 }, { "epoch": 0.6, "learning_rate": 6.166137322684559e-05, "loss": 2.2409, "step": 95792 }, { "epoch": 0.6, "learning_rate": 6.165507181259022e-05, "loss": 2.2496, "step": 95800 }, { "epoch": 0.6, "learning_rate": 6.164877035718961e-05, "loss": 2.2735, "step": 95808 }, { "epoch": 0.6, "learning_rate": 6.164246886080037e-05, "loss": 2.2422, "step": 95816 }, { "epoch": 0.6, "learning_rate": 6.163616732357915e-05, "loss": 2.2422, "step": 95824 }, { "epoch": 0.6, "learning_rate": 6.162986574568264e-05, "loss": 2.2621, "step": 95832 }, { "epoch": 0.6, "learning_rate": 6.162356412726749e-05, "loss": 2.235, "step": 95840 }, { "epoch": 0.6, "learning_rate": 6.161726246849036e-05, "loss": 2.2541, "step": 95848 }, { "epoch": 0.6, "learning_rate": 6.161096076950787e-05, "loss": 2.2515, "step": 95856 }, { "epoch": 0.6, "learning_rate": 6.160465903047676e-05, "loss": 2.2385, "step": 95864 }, { "epoch": 0.6, "learning_rate": 6.15983572515536e-05, "loss": 2.2585, "step": 95872 }, { "epoch": 0.6, "learning_rate": 6.159205543289513e-05, "loss": 2.2606, "step": 95880 }, { "epoch": 0.6, "learning_rate": 6.158575357465798e-05, "loss": 2.2626, "step": 95888 }, { "epoch": 0.6, "learning_rate": 6.157945167699881e-05, "loss": 2.2493, "step": 95896 }, { "epoch": 0.6, "learning_rate": 6.15731497400743e-05, "loss": 2.2558, "step": 95904 }, { "epoch": 0.6, "learning_rate": 6.156684776404111e-05, "loss": 2.2447, "step": 95912 }, { "epoch": 0.6, "learning_rate": 6.156054574905592e-05, "loss": 2.242, "step": 95920 }, { "epoch": 0.6, "learning_rate": 6.155424369527537e-05, "loss": 2.2566, "step": 95928 }, { "epoch": 0.6, "learning_rate": 6.154794160285616e-05, "loss": 2.2422, "step": 95936 }, { "epoch": 0.6, "learning_rate": 6.154163947195493e-05, "loss": 2.2616, "step": 95944 }, { "epoch": 0.6, "learning_rate": 6.153533730272838e-05, "loss": 2.2636, "step": 95952 }, { "epoch": 0.6, "learning_rate": 6.152903509533319e-05, "loss": 2.2647, "step": 95960 }, { "epoch": 0.6, "learning_rate": 6.1522732849926e-05, "loss": 2.2611, "step": 95968 }, { "epoch": 0.6, "learning_rate": 6.15164305666635e-05, "loss": 2.2413, "step": 95976 }, { "epoch": 0.6, "learning_rate": 6.151012824570237e-05, "loss": 2.248, "step": 95984 }, { "epoch": 0.6, "learning_rate": 6.150382588719927e-05, "loss": 2.2396, "step": 95992 }, { "epoch": 0.6, "learning_rate": 6.14975234913109e-05, "loss": 2.2431, "step": 96000 }, { "epoch": 0.6, "learning_rate": 6.149122105819391e-05, "loss": 2.2583, "step": 96008 }, { "epoch": 0.6, "learning_rate": 6.148491858800503e-05, "loss": 2.2516, "step": 96016 }, { "epoch": 0.6, "learning_rate": 6.147861608090089e-05, "loss": 2.2475, "step": 96024 }, { "epoch": 0.6, "learning_rate": 6.14723135370382e-05, "loss": 2.2427, "step": 96032 }, { "epoch": 0.6, "learning_rate": 6.14660109565736e-05, "loss": 2.2436, "step": 96040 }, { "epoch": 0.6, "learning_rate": 6.145970833966383e-05, "loss": 2.2492, "step": 96048 }, { "epoch": 0.6, "learning_rate": 6.145340568646556e-05, "loss": 2.2533, "step": 96056 }, { "epoch": 0.6, "learning_rate": 6.144710299713543e-05, "loss": 2.2496, "step": 96064 }, { "epoch": 0.6, "learning_rate": 6.144080027183016e-05, "loss": 2.2482, "step": 96072 }, { "epoch": 0.6, "learning_rate": 6.143449751070644e-05, "loss": 2.2451, "step": 96080 }, { "epoch": 0.6, "learning_rate": 6.142819471392097e-05, "loss": 2.2368, "step": 96088 }, { "epoch": 0.6, "learning_rate": 6.142189188163039e-05, "loss": 2.2629, "step": 96096 }, { "epoch": 0.6, "learning_rate": 6.141558901399142e-05, "loss": 2.247, "step": 96104 }, { "epoch": 0.6, "learning_rate": 6.140928611116077e-05, "loss": 2.2532, "step": 96112 }, { "epoch": 0.6, "learning_rate": 6.14029831732951e-05, "loss": 2.2431, "step": 96120 }, { "epoch": 0.6, "learning_rate": 6.139668020055111e-05, "loss": 2.2368, "step": 96128 }, { "epoch": 0.6, "learning_rate": 6.139037719308549e-05, "loss": 2.2521, "step": 96136 }, { "epoch": 0.6, "learning_rate": 6.138407415105493e-05, "loss": 2.2518, "step": 96144 }, { "epoch": 0.6, "learning_rate": 6.137777107461615e-05, "loss": 2.2572, "step": 96152 }, { "epoch": 0.6, "learning_rate": 6.137146796392582e-05, "loss": 2.2451, "step": 96160 }, { "epoch": 0.6, "learning_rate": 6.136516481914064e-05, "loss": 2.2578, "step": 96168 }, { "epoch": 0.6, "learning_rate": 6.13588616404173e-05, "loss": 2.2482, "step": 96176 }, { "epoch": 0.6, "learning_rate": 6.135255842791252e-05, "loss": 2.2459, "step": 96184 }, { "epoch": 0.6, "learning_rate": 6.134625518178299e-05, "loss": 2.2572, "step": 96192 }, { "epoch": 0.6, "learning_rate": 6.133995190218539e-05, "loss": 2.2644, "step": 96200 }, { "epoch": 0.6, "learning_rate": 6.133364858927643e-05, "loss": 2.2312, "step": 96208 }, { "epoch": 0.6, "learning_rate": 6.132734524321285e-05, "loss": 2.2513, "step": 96216 }, { "epoch": 0.6, "learning_rate": 6.132104186415128e-05, "loss": 2.2646, "step": 96224 }, { "epoch": 0.6, "learning_rate": 6.131473845224849e-05, "loss": 2.2604, "step": 96232 }, { "epoch": 0.6, "learning_rate": 6.130843500766115e-05, "loss": 2.2597, "step": 96240 }, { "epoch": 0.6, "learning_rate": 6.130213153054595e-05, "loss": 2.2454, "step": 96248 }, { "epoch": 0.6, "learning_rate": 6.129582802105964e-05, "loss": 2.244, "step": 96256 }, { "epoch": 0.6, "learning_rate": 6.128952447935887e-05, "loss": 2.2694, "step": 96264 }, { "epoch": 0.6, "learning_rate": 6.128322090560041e-05, "loss": 2.2534, "step": 96272 }, { "epoch": 0.6, "learning_rate": 6.127691729994092e-05, "loss": 2.2306, "step": 96280 }, { "epoch": 0.6, "learning_rate": 6.12706136625371e-05, "loss": 2.2502, "step": 96288 }, { "epoch": 0.6, "learning_rate": 6.126430999354571e-05, "loss": 2.2607, "step": 96296 }, { "epoch": 0.6, "learning_rate": 6.125800629312341e-05, "loss": 2.2445, "step": 96304 }, { "epoch": 0.6, "learning_rate": 6.125170256142696e-05, "loss": 2.2526, "step": 96312 }, { "epoch": 0.6, "learning_rate": 6.124539879861302e-05, "loss": 2.2629, "step": 96320 }, { "epoch": 0.6, "learning_rate": 6.123909500483835e-05, "loss": 2.2503, "step": 96328 }, { "epoch": 0.6, "learning_rate": 6.123279118025961e-05, "loss": 2.2558, "step": 96336 }, { "epoch": 0.6, "learning_rate": 6.122648732503357e-05, "loss": 2.2432, "step": 96344 }, { "epoch": 0.6, "learning_rate": 6.12201834393169e-05, "loss": 2.2548, "step": 96352 }, { "epoch": 0.6, "learning_rate": 6.121387952326634e-05, "loss": 2.2621, "step": 96360 }, { "epoch": 0.6, "learning_rate": 6.12075755770386e-05, "loss": 2.2371, "step": 96368 }, { "epoch": 0.6, "learning_rate": 6.120127160079039e-05, "loss": 2.2497, "step": 96376 }, { "epoch": 0.6, "learning_rate": 6.119496759467842e-05, "loss": 2.2528, "step": 96384 }, { "epoch": 0.6, "learning_rate": 6.118866355885945e-05, "loss": 2.2445, "step": 96392 }, { "epoch": 0.6, "learning_rate": 6.118235949349016e-05, "loss": 2.2377, "step": 96400 }, { "epoch": 0.6, "learning_rate": 6.117605539872728e-05, "loss": 2.2568, "step": 96408 }, { "epoch": 0.6, "learning_rate": 6.116975127472752e-05, "loss": 2.2417, "step": 96416 }, { "epoch": 0.6, "learning_rate": 6.116344712164763e-05, "loss": 2.2368, "step": 96424 }, { "epoch": 0.6, "learning_rate": 6.11571429396443e-05, "loss": 2.2529, "step": 96432 }, { "epoch": 0.6, "learning_rate": 6.115083872887427e-05, "loss": 2.2537, "step": 96440 }, { "epoch": 0.6, "learning_rate": 6.114453448949426e-05, "loss": 2.2341, "step": 96448 }, { "epoch": 0.6, "learning_rate": 6.1138230221661e-05, "loss": 2.243, "step": 96456 }, { "epoch": 0.6, "learning_rate": 6.11319259255312e-05, "loss": 2.2313, "step": 96464 }, { "epoch": 0.6, "learning_rate": 6.11256216012616e-05, "loss": 2.2401, "step": 96472 }, { "epoch": 0.6, "learning_rate": 6.111931724900892e-05, "loss": 2.257, "step": 96480 }, { "epoch": 0.6, "learning_rate": 6.11130128689299e-05, "loss": 2.2651, "step": 96488 }, { "epoch": 0.6, "learning_rate": 6.110670846118123e-05, "loss": 2.2537, "step": 96496 }, { "epoch": 0.6, "learning_rate": 6.110040402591968e-05, "loss": 2.2345, "step": 96504 }, { "epoch": 0.6, "learning_rate": 6.109409956330196e-05, "loss": 2.2403, "step": 96512 }, { "epoch": 0.6, "learning_rate": 6.108779507348481e-05, "loss": 2.2383, "step": 96520 }, { "epoch": 0.6, "learning_rate": 6.108149055662495e-05, "loss": 2.2539, "step": 96528 }, { "epoch": 0.6, "learning_rate": 6.10751860128791e-05, "loss": 2.2512, "step": 96536 }, { "epoch": 0.6, "learning_rate": 6.1068881442404e-05, "loss": 2.2566, "step": 96544 }, { "epoch": 0.6, "learning_rate": 6.106257684535641e-05, "loss": 2.2491, "step": 96552 }, { "epoch": 0.6, "learning_rate": 6.105627222189302e-05, "loss": 2.2574, "step": 96560 }, { "epoch": 0.6, "learning_rate": 6.104996757217061e-05, "loss": 2.2485, "step": 96568 }, { "epoch": 0.6, "learning_rate": 6.104366289634587e-05, "loss": 2.2505, "step": 96576 }, { "epoch": 0.6, "learning_rate": 6.103735819457554e-05, "loss": 2.2461, "step": 96584 }, { "epoch": 0.6, "learning_rate": 6.103105346701638e-05, "loss": 2.2731, "step": 96592 }, { "epoch": 0.6, "learning_rate": 6.102474871382513e-05, "loss": 2.2264, "step": 96600 }, { "epoch": 0.6, "learning_rate": 6.1018443935158495e-05, "loss": 2.2582, "step": 96608 }, { "epoch": 0.6, "learning_rate": 6.101213913117324e-05, "loss": 2.2616, "step": 96616 }, { "epoch": 0.6, "learning_rate": 6.100583430202609e-05, "loss": 2.2707, "step": 96624 }, { "epoch": 0.6, "learning_rate": 6.099952944787377e-05, "loss": 2.2569, "step": 96632 }, { "epoch": 0.6, "learning_rate": 6.099322456887306e-05, "loss": 2.248, "step": 96640 }, { "epoch": 0.6, "learning_rate": 6.098691966518069e-05, "loss": 2.2309, "step": 96648 }, { "epoch": 0.6, "learning_rate": 6.098061473695335e-05, "loss": 2.2625, "step": 96656 }, { "epoch": 0.6, "learning_rate": 6.097430978434783e-05, "loss": 2.2444, "step": 96664 }, { "epoch": 0.6, "learning_rate": 6.096800480752085e-05, "loss": 2.2509, "step": 96672 }, { "epoch": 0.6, "learning_rate": 6.096169980662918e-05, "loss": 2.2553, "step": 96680 }, { "epoch": 0.6, "learning_rate": 6.095539478182954e-05, "loss": 2.2488, "step": 96688 }, { "epoch": 0.6, "learning_rate": 6.0949089733278664e-05, "loss": 2.2501, "step": 96696 }, { "epoch": 0.6, "learning_rate": 6.094278466113334e-05, "loss": 2.2503, "step": 96704 }, { "epoch": 0.6, "learning_rate": 6.093647956555026e-05, "loss": 2.2515, "step": 96712 }, { "epoch": 0.6, "learning_rate": 6.0930174446686196e-05, "loss": 2.2492, "step": 96720 }, { "epoch": 0.6, "learning_rate": 6.0923869304697887e-05, "loss": 2.2513, "step": 96728 }, { "epoch": 0.6, "learning_rate": 6.09175641397421e-05, "loss": 2.2525, "step": 96736 }, { "epoch": 0.6, "learning_rate": 6.091125895197556e-05, "loss": 2.2525, "step": 96744 }, { "epoch": 0.6, "learning_rate": 6.0904953741555e-05, "loss": 2.252, "step": 96752 }, { "epoch": 0.6, "learning_rate": 6.0898648508637204e-05, "loss": 2.2485, "step": 96760 }, { "epoch": 0.6, "learning_rate": 6.089234325337891e-05, "loss": 2.2701, "step": 96768 }, { "epoch": 0.6, "learning_rate": 6.088603797593686e-05, "loss": 2.2628, "step": 96776 }, { "epoch": 0.6, "learning_rate": 6.0879732676467807e-05, "loss": 2.256, "step": 96784 }, { "epoch": 0.6, "learning_rate": 6.087342735512849e-05, "loss": 2.252, "step": 96792 }, { "epoch": 0.6, "learning_rate": 6.0867122012075694e-05, "loss": 2.2435, "step": 96800 }, { "epoch": 0.61, "learning_rate": 6.0860816647466126e-05, "loss": 2.2422, "step": 96808 }, { "epoch": 0.61, "learning_rate": 6.085451126145656e-05, "loss": 2.252, "step": 96816 }, { "epoch": 0.61, "learning_rate": 6.0848205854203764e-05, "loss": 2.256, "step": 96824 }, { "epoch": 0.61, "learning_rate": 6.084190042586446e-05, "loss": 2.2557, "step": 96832 }, { "epoch": 0.61, "learning_rate": 6.083559497659543e-05, "loss": 2.2707, "step": 96840 }, { "epoch": 0.61, "learning_rate": 6.08292895065534e-05, "loss": 2.2515, "step": 96848 }, { "epoch": 0.61, "learning_rate": 6.082298401589515e-05, "loss": 2.2432, "step": 96856 }, { "epoch": 0.61, "learning_rate": 6.081667850477742e-05, "loss": 2.2524, "step": 96864 }, { "epoch": 0.61, "learning_rate": 6.081037297335699e-05, "loss": 2.2554, "step": 96872 }, { "epoch": 0.61, "learning_rate": 6.0804067421790565e-05, "loss": 2.2738, "step": 96880 }, { "epoch": 0.61, "learning_rate": 6.0797761850234944e-05, "loss": 2.2664, "step": 96888 }, { "epoch": 0.61, "learning_rate": 6.079145625884689e-05, "loss": 2.2729, "step": 96896 }, { "epoch": 0.61, "learning_rate": 6.078515064778314e-05, "loss": 2.2573, "step": 96904 }, { "epoch": 0.61, "learning_rate": 6.077884501720044e-05, "loss": 2.2445, "step": 96912 }, { "epoch": 0.61, "learning_rate": 6.077253936725558e-05, "loss": 2.2527, "step": 96920 }, { "epoch": 0.61, "learning_rate": 6.07662336981053e-05, "loss": 2.2691, "step": 96928 }, { "epoch": 0.61, "learning_rate": 6.075992800990635e-05, "loss": 2.2554, "step": 96936 }, { "epoch": 0.61, "learning_rate": 6.0753622302815526e-05, "loss": 2.2637, "step": 96944 }, { "epoch": 0.61, "learning_rate": 6.074731657698956e-05, "loss": 2.275, "step": 96952 }, { "epoch": 0.61, "learning_rate": 6.074101083258523e-05, "loss": 2.2538, "step": 96960 }, { "epoch": 0.61, "learning_rate": 6.073470506975927e-05, "loss": 2.2624, "step": 96968 }, { "epoch": 0.61, "learning_rate": 6.072839928866847e-05, "loss": 2.247, "step": 96976 }, { "epoch": 0.61, "learning_rate": 6.0722093489469576e-05, "loss": 2.2548, "step": 96984 }, { "epoch": 0.61, "learning_rate": 6.071578767231937e-05, "loss": 2.2682, "step": 96992 }, { "epoch": 0.61, "learning_rate": 6.0709481837374597e-05, "loss": 2.2433, "step": 97000 }, { "epoch": 0.61, "learning_rate": 6.0703175984792004e-05, "loss": 2.2538, "step": 97008 }, { "epoch": 0.61, "learning_rate": 6.06968701147284e-05, "loss": 2.2483, "step": 97016 }, { "epoch": 0.61, "learning_rate": 6.069056422734052e-05, "loss": 2.2505, "step": 97024 }, { "epoch": 0.61, "learning_rate": 6.0684258322785136e-05, "loss": 2.2375, "step": 97032 }, { "epoch": 0.61, "learning_rate": 6.0677952401219015e-05, "loss": 2.2625, "step": 97040 }, { "epoch": 0.61, "learning_rate": 6.0671646462798924e-05, "loss": 2.2466, "step": 97048 }, { "epoch": 0.61, "learning_rate": 6.066534050768163e-05, "loss": 2.2521, "step": 97056 }, { "epoch": 0.61, "learning_rate": 6.0659034536023885e-05, "loss": 2.249, "step": 97064 }, { "epoch": 0.61, "learning_rate": 6.0652728547982476e-05, "loss": 2.2487, "step": 97072 }, { "epoch": 0.61, "learning_rate": 6.064642254371415e-05, "loss": 2.2513, "step": 97080 }, { "epoch": 0.61, "learning_rate": 6.06401165233757e-05, "loss": 2.2543, "step": 97088 }, { "epoch": 0.61, "learning_rate": 6.063381048712387e-05, "loss": 2.2501, "step": 97096 }, { "epoch": 0.61, "learning_rate": 6.0627504435115444e-05, "loss": 2.2691, "step": 97104 }, { "epoch": 0.61, "learning_rate": 6.0621198367507195e-05, "loss": 2.2609, "step": 97112 }, { "epoch": 0.61, "learning_rate": 6.061489228445588e-05, "loss": 2.2618, "step": 97120 }, { "epoch": 0.61, "learning_rate": 6.0608586186118274e-05, "loss": 2.2437, "step": 97128 }, { "epoch": 0.61, "learning_rate": 6.060228007265114e-05, "loss": 2.2631, "step": 97136 }, { "epoch": 0.61, "learning_rate": 6.059597394421128e-05, "loss": 2.271, "step": 97144 }, { "epoch": 0.61, "learning_rate": 6.058966780095541e-05, "loss": 2.2575, "step": 97152 }, { "epoch": 0.61, "learning_rate": 6.058336164304035e-05, "loss": 2.2656, "step": 97160 }, { "epoch": 0.61, "learning_rate": 6.0577055470622846e-05, "loss": 2.2555, "step": 97168 }, { "epoch": 0.61, "learning_rate": 6.0570749283859694e-05, "loss": 2.269, "step": 97176 }, { "epoch": 0.61, "learning_rate": 6.056444308290763e-05, "loss": 2.2683, "step": 97184 }, { "epoch": 0.61, "learning_rate": 6.055813686792347e-05, "loss": 2.2672, "step": 97192 }, { "epoch": 0.61, "learning_rate": 6.055183063906394e-05, "loss": 2.2786, "step": 97200 }, { "epoch": 0.61, "learning_rate": 6.054552439648587e-05, "loss": 2.2625, "step": 97208 }, { "epoch": 0.61, "learning_rate": 6.053921814034597e-05, "loss": 2.2545, "step": 97216 }, { "epoch": 0.61, "learning_rate": 6.0532911870801045e-05, "loss": 2.242, "step": 97224 }, { "epoch": 0.61, "learning_rate": 6.052660558800789e-05, "loss": 2.2526, "step": 97232 }, { "epoch": 0.61, "learning_rate": 6.052029929212326e-05, "loss": 2.2372, "step": 97240 }, { "epoch": 0.61, "learning_rate": 6.0513992983303915e-05, "loss": 2.2587, "step": 97248 }, { "epoch": 0.61, "learning_rate": 6.050768666170666e-05, "loss": 2.251, "step": 97256 }, { "epoch": 0.61, "learning_rate": 6.050138032748827e-05, "loss": 2.2634, "step": 97264 }, { "epoch": 0.61, "learning_rate": 6.049507398080549e-05, "loss": 2.2438, "step": 97272 }, { "epoch": 0.61, "learning_rate": 6.048876762181511e-05, "loss": 2.2368, "step": 97280 }, { "epoch": 0.61, "learning_rate": 6.048246125067394e-05, "loss": 2.2539, "step": 97288 }, { "epoch": 0.61, "learning_rate": 6.04761548675387e-05, "loss": 2.2398, "step": 97296 }, { "epoch": 0.61, "learning_rate": 6.046984847256623e-05, "loss": 2.2523, "step": 97304 }, { "epoch": 0.61, "learning_rate": 6.046354206591323e-05, "loss": 2.2634, "step": 97312 }, { "epoch": 0.61, "learning_rate": 6.0457235647736554e-05, "loss": 2.2503, "step": 97320 }, { "epoch": 0.61, "learning_rate": 6.045092921819293e-05, "loss": 2.2478, "step": 97328 }, { "epoch": 0.61, "learning_rate": 6.0444622777439176e-05, "loss": 2.273, "step": 97336 }, { "epoch": 0.61, "learning_rate": 6.0438316325632036e-05, "loss": 2.2392, "step": 97344 }, { "epoch": 0.61, "learning_rate": 6.0432009862928305e-05, "loss": 2.2581, "step": 97352 }, { "epoch": 0.61, "learning_rate": 6.042570338948476e-05, "loss": 2.2563, "step": 97360 }, { "epoch": 0.61, "learning_rate": 6.041939690545819e-05, "loss": 2.257, "step": 97368 }, { "epoch": 0.61, "learning_rate": 6.0413090411005335e-05, "loss": 2.2466, "step": 97376 }, { "epoch": 0.61, "learning_rate": 6.040678390628305e-05, "loss": 2.2537, "step": 97384 }, { "epoch": 0.61, "learning_rate": 6.040047739144805e-05, "loss": 2.2577, "step": 97392 }, { "epoch": 0.61, "learning_rate": 6.039417086665713e-05, "loss": 2.253, "step": 97400 }, { "epoch": 0.61, "learning_rate": 6.038786433206709e-05, "loss": 2.2555, "step": 97408 }, { "epoch": 0.61, "learning_rate": 6.0381557787834676e-05, "loss": 2.2632, "step": 97416 }, { "epoch": 0.61, "learning_rate": 6.037525123411671e-05, "loss": 2.2636, "step": 97424 }, { "epoch": 0.61, "learning_rate": 6.036894467106997e-05, "loss": 2.254, "step": 97432 }, { "epoch": 0.61, "learning_rate": 6.036263809885121e-05, "loss": 2.2454, "step": 97440 }, { "epoch": 0.61, "learning_rate": 6.035633151761723e-05, "loss": 2.2644, "step": 97448 }, { "epoch": 0.61, "learning_rate": 6.03500249275248e-05, "loss": 2.2528, "step": 97456 }, { "epoch": 0.61, "learning_rate": 6.0343718328730714e-05, "loss": 2.244, "step": 97464 }, { "epoch": 0.61, "learning_rate": 6.033741172139176e-05, "loss": 2.2509, "step": 97472 }, { "epoch": 0.61, "learning_rate": 6.033110510566471e-05, "loss": 2.2471, "step": 97480 }, { "epoch": 0.61, "learning_rate": 6.032479848170636e-05, "loss": 2.2532, "step": 97488 }, { "epoch": 0.61, "learning_rate": 6.031849184967345e-05, "loss": 2.2531, "step": 97496 }, { "epoch": 0.61, "learning_rate": 6.0312185209722824e-05, "loss": 2.2541, "step": 97504 }, { "epoch": 0.61, "learning_rate": 6.030587856201122e-05, "loss": 2.2568, "step": 97512 }, { "epoch": 0.61, "learning_rate": 6.029957190669546e-05, "loss": 2.26, "step": 97520 }, { "epoch": 0.61, "learning_rate": 6.029326524393231e-05, "loss": 2.2458, "step": 97528 }, { "epoch": 0.61, "learning_rate": 6.0286958573878536e-05, "loss": 2.2399, "step": 97536 }, { "epoch": 0.61, "learning_rate": 6.0280651896690965e-05, "loss": 2.2606, "step": 97544 }, { "epoch": 0.61, "learning_rate": 6.027434521252633e-05, "loss": 2.2397, "step": 97552 }, { "epoch": 0.61, "learning_rate": 6.026803852154144e-05, "loss": 2.2415, "step": 97560 }, { "epoch": 0.61, "learning_rate": 6.0261731823893096e-05, "loss": 2.2807, "step": 97568 }, { "epoch": 0.61, "learning_rate": 6.0255425119738076e-05, "loss": 2.2418, "step": 97576 }, { "epoch": 0.61, "learning_rate": 6.0249118409233155e-05, "loss": 2.2415, "step": 97584 }, { "epoch": 0.61, "learning_rate": 6.024281169253511e-05, "loss": 2.2515, "step": 97592 }, { "epoch": 0.61, "learning_rate": 6.023650496980075e-05, "loss": 2.2491, "step": 97600 }, { "epoch": 0.61, "learning_rate": 6.023019824118685e-05, "loss": 2.2349, "step": 97608 }, { "epoch": 0.61, "learning_rate": 6.02238915068502e-05, "loss": 2.255, "step": 97616 }, { "epoch": 0.61, "learning_rate": 6.021758476694757e-05, "loss": 2.2473, "step": 97624 }, { "epoch": 0.61, "learning_rate": 6.021127802163575e-05, "loss": 2.2366, "step": 97632 }, { "epoch": 0.61, "learning_rate": 6.020497127107156e-05, "loss": 2.2561, "step": 97640 }, { "epoch": 0.61, "learning_rate": 6.019866451541174e-05, "loss": 2.2389, "step": 97648 }, { "epoch": 0.61, "learning_rate": 6.019235775481311e-05, "loss": 2.2471, "step": 97656 }, { "epoch": 0.61, "learning_rate": 6.018605098943244e-05, "loss": 2.2531, "step": 97664 }, { "epoch": 0.61, "learning_rate": 6.0179744219426524e-05, "loss": 2.251, "step": 97672 }, { "epoch": 0.61, "learning_rate": 6.0173437444952143e-05, "loss": 2.2509, "step": 97680 }, { "epoch": 0.61, "learning_rate": 6.016713066616608e-05, "loss": 2.2461, "step": 97688 }, { "epoch": 0.61, "learning_rate": 6.016082388322516e-05, "loss": 2.2524, "step": 97696 }, { "epoch": 0.61, "learning_rate": 6.0154517096286126e-05, "loss": 2.2568, "step": 97704 }, { "epoch": 0.61, "learning_rate": 6.014821030550577e-05, "loss": 2.255, "step": 97712 }, { "epoch": 0.61, "learning_rate": 6.0141903511040885e-05, "loss": 2.2681, "step": 97720 }, { "epoch": 0.61, "learning_rate": 6.013559671304827e-05, "loss": 2.2244, "step": 97728 }, { "epoch": 0.61, "learning_rate": 6.012928991168472e-05, "loss": 2.2365, "step": 97736 }, { "epoch": 0.61, "learning_rate": 6.012298310710698e-05, "loss": 2.2518, "step": 97744 }, { "epoch": 0.61, "learning_rate": 6.011667629947189e-05, "loss": 2.2413, "step": 97752 }, { "epoch": 0.61, "learning_rate": 6.0110369488936204e-05, "loss": 2.2535, "step": 97760 }, { "epoch": 0.61, "learning_rate": 6.010406267565672e-05, "loss": 2.2385, "step": 97768 }, { "epoch": 0.61, "learning_rate": 6.009775585979023e-05, "loss": 2.2451, "step": 97776 }, { "epoch": 0.61, "learning_rate": 6.009144904149351e-05, "loss": 2.243, "step": 97784 }, { "epoch": 0.61, "learning_rate": 6.0085142220923364e-05, "loss": 2.2484, "step": 97792 }, { "epoch": 0.61, "learning_rate": 6.007883539823658e-05, "loss": 2.2513, "step": 97800 }, { "epoch": 0.61, "learning_rate": 6.007252857358992e-05, "loss": 2.2398, "step": 97808 }, { "epoch": 0.61, "learning_rate": 6.0066221747140205e-05, "loss": 2.2373, "step": 97816 }, { "epoch": 0.61, "learning_rate": 6.0059914919044194e-05, "loss": 2.2421, "step": 97824 }, { "epoch": 0.61, "learning_rate": 6.005360808945871e-05, "loss": 2.2428, "step": 97832 }, { "epoch": 0.61, "learning_rate": 6.004730125854052e-05, "loss": 2.2543, "step": 97840 }, { "epoch": 0.61, "learning_rate": 6.004099442644641e-05, "loss": 2.2461, "step": 97848 }, { "epoch": 0.61, "learning_rate": 6.0034687593333184e-05, "loss": 2.2432, "step": 97856 }, { "epoch": 0.61, "learning_rate": 6.002838075935762e-05, "loss": 2.2627, "step": 97864 }, { "epoch": 0.61, "learning_rate": 6.002207392467649e-05, "loss": 2.2289, "step": 97872 }, { "epoch": 0.61, "learning_rate": 6.00157670894466e-05, "loss": 2.2556, "step": 97880 }, { "epoch": 0.61, "learning_rate": 6.0009460253824765e-05, "loss": 2.2326, "step": 97888 }, { "epoch": 0.61, "learning_rate": 6.000315341796774e-05, "loss": 2.2563, "step": 97896 }, { "epoch": 0.61, "learning_rate": 5.9996846582032287e-05, "loss": 2.2428, "step": 97904 }, { "epoch": 0.61, "learning_rate": 5.999053974617526e-05, "loss": 2.2519, "step": 97912 }, { "epoch": 0.61, "learning_rate": 5.998423291055342e-05, "loss": 2.2465, "step": 97920 }, { "epoch": 0.61, "learning_rate": 5.9977926075323535e-05, "loss": 2.2525, "step": 97928 }, { "epoch": 0.61, "learning_rate": 5.9971619240642405e-05, "loss": 2.2644, "step": 97936 }, { "epoch": 0.61, "learning_rate": 5.9965312406666826e-05, "loss": 2.2371, "step": 97944 }, { "epoch": 0.61, "learning_rate": 5.995900557355361e-05, "loss": 2.2484, "step": 97952 }, { "epoch": 0.61, "learning_rate": 5.99526987414595e-05, "loss": 2.2569, "step": 97960 }, { "epoch": 0.61, "learning_rate": 5.99463919105413e-05, "loss": 2.2319, "step": 97968 }, { "epoch": 0.61, "learning_rate": 5.994008508095581e-05, "loss": 2.2245, "step": 97976 }, { "epoch": 0.61, "learning_rate": 5.993377825285982e-05, "loss": 2.234, "step": 97984 }, { "epoch": 0.61, "learning_rate": 5.9927471426410086e-05, "loss": 2.2441, "step": 97992 }, { "epoch": 0.61, "learning_rate": 5.9921164601763444e-05, "loss": 2.2691, "step": 98000 }, { "epoch": 0.61, "learning_rate": 5.991485777907666e-05, "loss": 2.2536, "step": 98008 }, { "epoch": 0.61, "learning_rate": 5.9908550958506516e-05, "loss": 2.251, "step": 98016 }, { "epoch": 0.61, "learning_rate": 5.9902244140209795e-05, "loss": 2.2451, "step": 98024 }, { "epoch": 0.61, "learning_rate": 5.98959373243433e-05, "loss": 2.253, "step": 98032 }, { "epoch": 0.61, "learning_rate": 5.988963051106381e-05, "loss": 2.2552, "step": 98040 }, { "epoch": 0.61, "learning_rate": 5.9883323700528136e-05, "loss": 2.2417, "step": 98048 }, { "epoch": 0.61, "learning_rate": 5.9877016892893025e-05, "loss": 2.2297, "step": 98056 }, { "epoch": 0.61, "learning_rate": 5.9870710088315304e-05, "loss": 2.2443, "step": 98064 }, { "epoch": 0.61, "learning_rate": 5.9864403286951754e-05, "loss": 2.2484, "step": 98072 }, { "epoch": 0.61, "learning_rate": 5.9858096488959125e-05, "loss": 2.251, "step": 98080 }, { "epoch": 0.61, "learning_rate": 5.985178969449425e-05, "loss": 2.2488, "step": 98088 }, { "epoch": 0.61, "learning_rate": 5.9845482903713904e-05, "loss": 2.247, "step": 98096 }, { "epoch": 0.61, "learning_rate": 5.983917611677485e-05, "loss": 2.2457, "step": 98104 }, { "epoch": 0.61, "learning_rate": 5.9832869333833916e-05, "loss": 2.2396, "step": 98112 }, { "epoch": 0.61, "learning_rate": 5.982656255504786e-05, "loss": 2.2755, "step": 98120 }, { "epoch": 0.61, "learning_rate": 5.9820255780573486e-05, "loss": 2.2367, "step": 98128 }, { "epoch": 0.61, "learning_rate": 5.9813949010567563e-05, "loss": 2.2524, "step": 98136 }, { "epoch": 0.61, "learning_rate": 5.9807642245186915e-05, "loss": 2.232, "step": 98144 }, { "epoch": 0.61, "learning_rate": 5.980133548458827e-05, "loss": 2.2339, "step": 98152 }, { "epoch": 0.61, "learning_rate": 5.979502872892846e-05, "loss": 2.2537, "step": 98160 }, { "epoch": 0.61, "learning_rate": 5.978872197836426e-05, "loss": 2.2577, "step": 98168 }, { "epoch": 0.61, "learning_rate": 5.9782415233052455e-05, "loss": 2.2585, "step": 98176 }, { "epoch": 0.61, "learning_rate": 5.9776108493149826e-05, "loss": 2.2512, "step": 98184 }, { "epoch": 0.61, "learning_rate": 5.976980175881317e-05, "loss": 2.2498, "step": 98192 }, { "epoch": 0.61, "learning_rate": 5.976349503019927e-05, "loss": 2.2536, "step": 98200 }, { "epoch": 0.61, "learning_rate": 5.975718830746491e-05, "loss": 2.2331, "step": 98208 }, { "epoch": 0.61, "learning_rate": 5.975088159076686e-05, "loss": 2.255, "step": 98216 }, { "epoch": 0.61, "learning_rate": 5.974457488026194e-05, "loss": 2.2495, "step": 98224 }, { "epoch": 0.61, "learning_rate": 5.973826817610693e-05, "loss": 2.2541, "step": 98232 }, { "epoch": 0.61, "learning_rate": 5.9731961478458564e-05, "loss": 2.2545, "step": 98240 }, { "epoch": 0.61, "learning_rate": 5.9725654787473694e-05, "loss": 2.251, "step": 98248 }, { "epoch": 0.61, "learning_rate": 5.971934810330906e-05, "loss": 2.2597, "step": 98256 }, { "epoch": 0.61, "learning_rate": 5.971304142612149e-05, "loss": 2.2403, "step": 98264 }, { "epoch": 0.61, "learning_rate": 5.9706734756067716e-05, "loss": 2.2471, "step": 98272 }, { "epoch": 0.61, "learning_rate": 5.970042809330455e-05, "loss": 2.2477, "step": 98280 }, { "epoch": 0.61, "learning_rate": 5.969412143798878e-05, "loss": 2.249, "step": 98288 }, { "epoch": 0.61, "learning_rate": 5.9687814790277186e-05, "loss": 2.2451, "step": 98296 }, { "epoch": 0.61, "learning_rate": 5.968150815032656e-05, "loss": 2.2575, "step": 98304 }, { "epoch": 0.61, "learning_rate": 5.9675201518293664e-05, "loss": 2.2506, "step": 98312 }, { "epoch": 0.61, "learning_rate": 5.966889489433532e-05, "loss": 2.2488, "step": 98320 }, { "epoch": 0.61, "learning_rate": 5.9662588278608267e-05, "loss": 2.2583, "step": 98328 }, { "epoch": 0.61, "learning_rate": 5.965628167126929e-05, "loss": 2.258, "step": 98336 }, { "epoch": 0.61, "learning_rate": 5.964997507247521e-05, "loss": 2.2336, "step": 98344 }, { "epoch": 0.61, "learning_rate": 5.964366848238279e-05, "loss": 2.2424, "step": 98352 }, { "epoch": 0.61, "learning_rate": 5.963736190114881e-05, "loss": 2.2501, "step": 98360 }, { "epoch": 0.61, "learning_rate": 5.9631055328930055e-05, "loss": 2.2349, "step": 98368 }, { "epoch": 0.61, "learning_rate": 5.9624748765883284e-05, "loss": 2.267, "step": 98376 }, { "epoch": 0.61, "learning_rate": 5.961844221216533e-05, "loss": 2.2554, "step": 98384 }, { "epoch": 0.61, "learning_rate": 5.9612135667932934e-05, "loss": 2.2431, "step": 98392 }, { "epoch": 0.61, "learning_rate": 5.9605829133342885e-05, "loss": 2.2387, "step": 98400 }, { "epoch": 0.62, "learning_rate": 5.959952260855197e-05, "loss": 2.2351, "step": 98408 }, { "epoch": 0.62, "learning_rate": 5.959321609371697e-05, "loss": 2.257, "step": 98416 }, { "epoch": 0.62, "learning_rate": 5.958690958899467e-05, "loss": 2.2561, "step": 98424 }, { "epoch": 0.62, "learning_rate": 5.958060309454183e-05, "loss": 2.2541, "step": 98432 }, { "epoch": 0.62, "learning_rate": 5.957429661051526e-05, "loss": 2.2311, "step": 98440 }, { "epoch": 0.62, "learning_rate": 5.9567990137071726e-05, "loss": 2.2406, "step": 98448 }, { "epoch": 0.62, "learning_rate": 5.956168367436799e-05, "loss": 2.2467, "step": 98456 }, { "epoch": 0.62, "learning_rate": 5.955537722256084e-05, "loss": 2.2513, "step": 98464 }, { "epoch": 0.62, "learning_rate": 5.9549070781807074e-05, "loss": 2.2608, "step": 98472 }, { "epoch": 0.62, "learning_rate": 5.954276435226347e-05, "loss": 2.253, "step": 98480 }, { "epoch": 0.62, "learning_rate": 5.9536457934086776e-05, "loss": 2.2391, "step": 98488 }, { "epoch": 0.62, "learning_rate": 5.95301515274338e-05, "loss": 2.266, "step": 98496 }, { "epoch": 0.62, "learning_rate": 5.952384513246132e-05, "loss": 2.2559, "step": 98504 }, { "epoch": 0.62, "learning_rate": 5.951753874932608e-05, "loss": 2.2297, "step": 98512 }, { "epoch": 0.62, "learning_rate": 5.95112323781849e-05, "loss": 2.2516, "step": 98520 }, { "epoch": 0.62, "learning_rate": 5.950492601919452e-05, "loss": 2.226, "step": 98528 }, { "epoch": 0.62, "learning_rate": 5.9498619672511754e-05, "loss": 2.2381, "step": 98536 }, { "epoch": 0.62, "learning_rate": 5.9492313338293346e-05, "loss": 2.2411, "step": 98544 }, { "epoch": 0.62, "learning_rate": 5.948600701669609e-05, "loss": 2.2562, "step": 98552 }, { "epoch": 0.62, "learning_rate": 5.947970070787676e-05, "loss": 2.252, "step": 98560 }, { "epoch": 0.62, "learning_rate": 5.9473394411992125e-05, "loss": 2.2449, "step": 98568 }, { "epoch": 0.62, "learning_rate": 5.9467088129198964e-05, "loss": 2.2408, "step": 98576 }, { "epoch": 0.62, "learning_rate": 5.946078185965405e-05, "loss": 2.2619, "step": 98584 }, { "epoch": 0.62, "learning_rate": 5.9454475603514156e-05, "loss": 2.2648, "step": 98592 }, { "epoch": 0.62, "learning_rate": 5.944816936093608e-05, "loss": 2.2396, "step": 98600 }, { "epoch": 0.62, "learning_rate": 5.9441863132076556e-05, "loss": 2.2473, "step": 98608 }, { "epoch": 0.62, "learning_rate": 5.9435556917092374e-05, "loss": 2.2539, "step": 98616 }, { "epoch": 0.62, "learning_rate": 5.9429250716140336e-05, "loss": 2.2364, "step": 98624 }, { "epoch": 0.62, "learning_rate": 5.942294452937716e-05, "loss": 2.2577, "step": 98632 }, { "epoch": 0.62, "learning_rate": 5.9416638356959674e-05, "loss": 2.246, "step": 98640 }, { "epoch": 0.62, "learning_rate": 5.9410332199044594e-05, "loss": 2.2417, "step": 98648 }, { "epoch": 0.62, "learning_rate": 5.940402605578874e-05, "loss": 2.254, "step": 98656 }, { "epoch": 0.62, "learning_rate": 5.939771992734886e-05, "loss": 2.2605, "step": 98664 }, { "epoch": 0.62, "learning_rate": 5.9391413813881735e-05, "loss": 2.2684, "step": 98672 }, { "epoch": 0.62, "learning_rate": 5.938510771554413e-05, "loss": 2.2455, "step": 98680 }, { "epoch": 0.62, "learning_rate": 5.937880163249281e-05, "loss": 2.2527, "step": 98688 }, { "epoch": 0.62, "learning_rate": 5.9372495564884566e-05, "loss": 2.2458, "step": 98696 }, { "epoch": 0.62, "learning_rate": 5.9366189512876136e-05, "loss": 2.2531, "step": 98704 }, { "epoch": 0.62, "learning_rate": 5.935988347662431e-05, "loss": 2.2436, "step": 98712 }, { "epoch": 0.62, "learning_rate": 5.935357745628587e-05, "loss": 2.2617, "step": 98720 }, { "epoch": 0.62, "learning_rate": 5.934727145201755e-05, "loss": 2.2271, "step": 98728 }, { "epoch": 0.62, "learning_rate": 5.934096546397614e-05, "loss": 2.245, "step": 98736 }, { "epoch": 0.62, "learning_rate": 5.933465949231838e-05, "loss": 2.2478, "step": 98744 }, { "epoch": 0.62, "learning_rate": 5.93283535372011e-05, "loss": 2.2613, "step": 98752 }, { "epoch": 0.62, "learning_rate": 5.9322047598780995e-05, "loss": 2.2501, "step": 98760 }, { "epoch": 0.62, "learning_rate": 5.931574167721487e-05, "loss": 2.248, "step": 98768 }, { "epoch": 0.62, "learning_rate": 5.9309435772659484e-05, "loss": 2.2515, "step": 98776 }, { "epoch": 0.62, "learning_rate": 5.93031298852716e-05, "loss": 2.2334, "step": 98784 }, { "epoch": 0.62, "learning_rate": 5.9296824015208006e-05, "loss": 2.2609, "step": 98792 }, { "epoch": 0.62, "learning_rate": 5.9290518162625434e-05, "loss": 2.2509, "step": 98800 }, { "epoch": 0.62, "learning_rate": 5.928421232768064e-05, "loss": 2.246, "step": 98808 }, { "epoch": 0.62, "learning_rate": 5.927790651053045e-05, "loss": 2.2576, "step": 98816 }, { "epoch": 0.62, "learning_rate": 5.9271600711331544e-05, "loss": 2.2652, "step": 98824 }, { "epoch": 0.62, "learning_rate": 5.9265294930240734e-05, "loss": 2.2642, "step": 98832 }, { "epoch": 0.62, "learning_rate": 5.9258989167414794e-05, "loss": 2.2553, "step": 98840 }, { "epoch": 0.62, "learning_rate": 5.9252683423010446e-05, "loss": 2.2676, "step": 98848 }, { "epoch": 0.62, "learning_rate": 5.9246377697184484e-05, "loss": 2.2649, "step": 98856 }, { "epoch": 0.62, "learning_rate": 5.924007199009365e-05, "loss": 2.2474, "step": 98864 }, { "epoch": 0.62, "learning_rate": 5.923376630189472e-05, "loss": 2.2618, "step": 98872 }, { "epoch": 0.62, "learning_rate": 5.922746063274444e-05, "loss": 2.2541, "step": 98880 }, { "epoch": 0.62, "learning_rate": 5.9221154982799585e-05, "loss": 2.2588, "step": 98888 }, { "epoch": 0.62, "learning_rate": 5.921484935221688e-05, "loss": 2.2585, "step": 98896 }, { "epoch": 0.62, "learning_rate": 5.920854374115312e-05, "loss": 2.2504, "step": 98904 }, { "epoch": 0.62, "learning_rate": 5.9202238149765065e-05, "loss": 2.2558, "step": 98912 }, { "epoch": 0.62, "learning_rate": 5.919593257820946e-05, "loss": 2.256, "step": 98920 }, { "epoch": 0.62, "learning_rate": 5.9189627026643036e-05, "loss": 2.2485, "step": 98928 }, { "epoch": 0.62, "learning_rate": 5.918332149522259e-05, "loss": 2.2394, "step": 98936 }, { "epoch": 0.62, "learning_rate": 5.917701598410487e-05, "loss": 2.2623, "step": 98944 }, { "epoch": 0.62, "learning_rate": 5.9170710493446626e-05, "loss": 2.2546, "step": 98952 }, { "epoch": 0.62, "learning_rate": 5.916440502340459e-05, "loss": 2.2324, "step": 98960 }, { "epoch": 0.62, "learning_rate": 5.915809957413556e-05, "loss": 2.2509, "step": 98968 }, { "epoch": 0.62, "learning_rate": 5.915179414579626e-05, "loss": 2.2563, "step": 98976 }, { "epoch": 0.62, "learning_rate": 5.9145488738543455e-05, "loss": 2.2496, "step": 98984 }, { "epoch": 0.62, "learning_rate": 5.91391833525339e-05, "loss": 2.2585, "step": 98992 }, { "epoch": 0.62, "learning_rate": 5.913287798792433e-05, "loss": 2.2571, "step": 99000 }, { "epoch": 0.62, "learning_rate": 5.912657264487151e-05, "loss": 2.2371, "step": 99008 }, { "epoch": 0.62, "learning_rate": 5.912026732353222e-05, "loss": 2.2358, "step": 99016 }, { "epoch": 0.62, "learning_rate": 5.9113962024063155e-05, "loss": 2.2678, "step": 99024 }, { "epoch": 0.62, "learning_rate": 5.910765674662111e-05, "loss": 2.252, "step": 99032 }, { "epoch": 0.62, "learning_rate": 5.91013514913628e-05, "loss": 2.2364, "step": 99040 }, { "epoch": 0.62, "learning_rate": 5.909504625844501e-05, "loss": 2.2341, "step": 99048 }, { "epoch": 0.62, "learning_rate": 5.9088741048024465e-05, "loss": 2.2394, "step": 99056 }, { "epoch": 0.62, "learning_rate": 5.908243586025792e-05, "loss": 2.2501, "step": 99064 }, { "epoch": 0.62, "learning_rate": 5.907613069530214e-05, "loss": 2.2475, "step": 99072 }, { "epoch": 0.62, "learning_rate": 5.906982555331382e-05, "loss": 2.2588, "step": 99080 }, { "epoch": 0.62, "learning_rate": 5.906352043444976e-05, "loss": 2.2536, "step": 99088 }, { "epoch": 0.62, "learning_rate": 5.905721533886668e-05, "loss": 2.2339, "step": 99096 }, { "epoch": 0.62, "learning_rate": 5.905091026672134e-05, "loss": 2.2633, "step": 99104 }, { "epoch": 0.62, "learning_rate": 5.904460521817048e-05, "loss": 2.254, "step": 99112 }, { "epoch": 0.62, "learning_rate": 5.903830019337083e-05, "loss": 2.2441, "step": 99120 }, { "epoch": 0.62, "learning_rate": 5.9031995192479163e-05, "loss": 2.2474, "step": 99128 }, { "epoch": 0.62, "learning_rate": 5.902569021565218e-05, "loss": 2.2538, "step": 99136 }, { "epoch": 0.62, "learning_rate": 5.901938526304667e-05, "loss": 2.2573, "step": 99144 }, { "epoch": 0.62, "learning_rate": 5.9013080334819335e-05, "loss": 2.2574, "step": 99152 }, { "epoch": 0.62, "learning_rate": 5.900677543112695e-05, "loss": 2.2469, "step": 99160 }, { "epoch": 0.62, "learning_rate": 5.900047055212623e-05, "loss": 2.249, "step": 99168 }, { "epoch": 0.62, "learning_rate": 5.8994165697973915e-05, "loss": 2.2568, "step": 99176 }, { "epoch": 0.62, "learning_rate": 5.8987860868826775e-05, "loss": 2.2572, "step": 99184 }, { "epoch": 0.62, "learning_rate": 5.89815560648415e-05, "loss": 2.259, "step": 99192 }, { "epoch": 0.62, "learning_rate": 5.8975251286174896e-05, "loss": 2.2689, "step": 99200 }, { "epoch": 0.62, "learning_rate": 5.896894653298361e-05, "loss": 2.265, "step": 99208 }, { "epoch": 0.62, "learning_rate": 5.8962641805424455e-05, "loss": 2.2523, "step": 99216 }, { "epoch": 0.62, "learning_rate": 5.895633710365416e-05, "loss": 2.2539, "step": 99224 }, { "epoch": 0.62, "learning_rate": 5.8950032427829414e-05, "loss": 2.2564, "step": 99232 }, { "epoch": 0.62, "learning_rate": 5.894372777810699e-05, "loss": 2.2481, "step": 99240 }, { "epoch": 0.62, "learning_rate": 5.893742315464361e-05, "loss": 2.2532, "step": 99248 }, { "epoch": 0.62, "learning_rate": 5.893111855759601e-05, "loss": 2.2622, "step": 99256 }, { "epoch": 0.62, "learning_rate": 5.892481398712093e-05, "loss": 2.241, "step": 99264 }, { "epoch": 0.62, "learning_rate": 5.891850944337507e-05, "loss": 2.2607, "step": 99272 }, { "epoch": 0.62, "learning_rate": 5.891220492651521e-05, "loss": 2.2469, "step": 99280 }, { "epoch": 0.62, "learning_rate": 5.8905900436698056e-05, "loss": 2.2393, "step": 99288 }, { "epoch": 0.62, "learning_rate": 5.8899595974080334e-05, "loss": 2.2334, "step": 99296 }, { "epoch": 0.62, "learning_rate": 5.8893291538818775e-05, "loss": 2.2543, "step": 99304 }, { "epoch": 0.62, "learning_rate": 5.888698713107013e-05, "loss": 2.2625, "step": 99312 }, { "epoch": 0.62, "learning_rate": 5.888068275099109e-05, "loss": 2.2317, "step": 99320 }, { "epoch": 0.62, "learning_rate": 5.8874378398738415e-05, "loss": 2.2532, "step": 99328 }, { "epoch": 0.62, "learning_rate": 5.88680740744688e-05, "loss": 2.2497, "step": 99336 }, { "epoch": 0.62, "learning_rate": 5.886176977833902e-05, "loss": 2.244, "step": 99344 }, { "epoch": 0.62, "learning_rate": 5.8855465510505744e-05, "loss": 2.2539, "step": 99352 }, { "epoch": 0.62, "learning_rate": 5.884916127112574e-05, "loss": 2.244, "step": 99360 }, { "epoch": 0.62, "learning_rate": 5.8842857060355706e-05, "loss": 2.2516, "step": 99368 }, { "epoch": 0.62, "learning_rate": 5.883655287835239e-05, "loss": 2.2557, "step": 99376 }, { "epoch": 0.62, "learning_rate": 5.88302487252725e-05, "loss": 2.2653, "step": 99384 }, { "epoch": 0.62, "learning_rate": 5.882394460127274e-05, "loss": 2.2561, "step": 99392 }, { "epoch": 0.62, "learning_rate": 5.8817640506509867e-05, "loss": 2.2668, "step": 99400 }, { "epoch": 0.62, "learning_rate": 5.881133644114056e-05, "loss": 2.2412, "step": 99408 }, { "epoch": 0.62, "learning_rate": 5.880503240532158e-05, "loss": 2.2475, "step": 99416 }, { "epoch": 0.62, "learning_rate": 5.879872839920964e-05, "loss": 2.2403, "step": 99424 }, { "epoch": 0.62, "learning_rate": 5.8792424422961425e-05, "loss": 2.2538, "step": 99432 }, { "epoch": 0.62, "learning_rate": 5.878612047673369e-05, "loss": 2.2458, "step": 99440 }, { "epoch": 0.62, "learning_rate": 5.877981656068312e-05, "loss": 2.2435, "step": 99448 }, { "epoch": 0.62, "learning_rate": 5.8773512674966446e-05, "loss": 2.2531, "step": 99456 }, { "epoch": 0.62, "learning_rate": 5.8767208819740404e-05, "loss": 2.2628, "step": 99464 }, { "epoch": 0.62, "learning_rate": 5.876090499516167e-05, "loss": 2.2682, "step": 99472 }, { "epoch": 0.62, "learning_rate": 5.8754601201386994e-05, "loss": 2.2501, "step": 99480 }, { "epoch": 0.62, "learning_rate": 5.874829743857305e-05, "loss": 2.2615, "step": 99488 }, { "epoch": 0.62, "learning_rate": 5.874199370687658e-05, "loss": 2.2452, "step": 99496 }, { "epoch": 0.62, "learning_rate": 5.8735690006454317e-05, "loss": 2.2535, "step": 99504 }, { "epoch": 0.62, "learning_rate": 5.872938633746291e-05, "loss": 2.2606, "step": 99512 }, { "epoch": 0.62, "learning_rate": 5.872308270005911e-05, "loss": 2.2382, "step": 99520 }, { "epoch": 0.62, "learning_rate": 5.871677909439961e-05, "loss": 2.2347, "step": 99528 }, { "epoch": 0.62, "learning_rate": 5.871047552064114e-05, "loss": 2.2435, "step": 99536 }, { "epoch": 0.62, "learning_rate": 5.870417197894038e-05, "loss": 2.2351, "step": 99544 }, { "epoch": 0.62, "learning_rate": 5.869786846945406e-05, "loss": 2.2496, "step": 99552 }, { "epoch": 0.62, "learning_rate": 5.8691564992338875e-05, "loss": 2.255, "step": 99560 }, { "epoch": 0.62, "learning_rate": 5.8685261547751526e-05, "loss": 2.259, "step": 99568 }, { "epoch": 0.62, "learning_rate": 5.8678958135848727e-05, "loss": 2.2429, "step": 99576 }, { "epoch": 0.62, "learning_rate": 5.867265475678716e-05, "loss": 2.258, "step": 99584 }, { "epoch": 0.62, "learning_rate": 5.866635141072356e-05, "loss": 2.2532, "step": 99592 }, { "epoch": 0.62, "learning_rate": 5.866004809781462e-05, "loss": 2.2702, "step": 99600 }, { "epoch": 0.62, "learning_rate": 5.865374481821704e-05, "loss": 2.2585, "step": 99608 }, { "epoch": 0.62, "learning_rate": 5.864744157208748e-05, "loss": 2.2415, "step": 99616 }, { "epoch": 0.62, "learning_rate": 5.8641138359582705e-05, "loss": 2.2604, "step": 99624 }, { "epoch": 0.62, "learning_rate": 5.863483518085937e-05, "loss": 2.2486, "step": 99632 }, { "epoch": 0.62, "learning_rate": 5.862853203607419e-05, "loss": 2.2491, "step": 99640 }, { "epoch": 0.62, "learning_rate": 5.862222892538386e-05, "loss": 2.2688, "step": 99648 }, { "epoch": 0.62, "learning_rate": 5.861592584894508e-05, "loss": 2.242, "step": 99656 }, { "epoch": 0.62, "learning_rate": 5.860962280691452e-05, "loss": 2.2437, "step": 99664 }, { "epoch": 0.62, "learning_rate": 5.860331979944891e-05, "loss": 2.2482, "step": 99672 }, { "epoch": 0.62, "learning_rate": 5.859701682670491e-05, "loss": 2.257, "step": 99680 }, { "epoch": 0.62, "learning_rate": 5.859071388883923e-05, "loss": 2.2306, "step": 99688 }, { "epoch": 0.62, "learning_rate": 5.8584410986008586e-05, "loss": 2.2534, "step": 99696 }, { "epoch": 0.62, "learning_rate": 5.857810811836961e-05, "loss": 2.2437, "step": 99704 }, { "epoch": 0.62, "learning_rate": 5.857180528607905e-05, "loss": 2.2479, "step": 99712 }, { "epoch": 0.62, "learning_rate": 5.8565502489293555e-05, "loss": 2.2601, "step": 99720 }, { "epoch": 0.62, "learning_rate": 5.8559199728169855e-05, "loss": 2.2498, "step": 99728 }, { "epoch": 0.62, "learning_rate": 5.8552897002864596e-05, "loss": 2.2426, "step": 99736 }, { "epoch": 0.62, "learning_rate": 5.8546594313534466e-05, "loss": 2.2543, "step": 99744 }, { "epoch": 0.62, "learning_rate": 5.854029166033619e-05, "loss": 2.2513, "step": 99752 }, { "epoch": 0.62, "learning_rate": 5.85339890434264e-05, "loss": 2.24, "step": 99760 }, { "epoch": 0.62, "learning_rate": 5.8527686462961816e-05, "loss": 2.2455, "step": 99768 }, { "epoch": 0.62, "learning_rate": 5.852138391909911e-05, "loss": 2.2595, "step": 99776 }, { "epoch": 0.62, "learning_rate": 5.8515081411994975e-05, "loss": 2.2402, "step": 99784 }, { "epoch": 0.62, "learning_rate": 5.8508778941806086e-05, "loss": 2.2452, "step": 99792 }, { "epoch": 0.62, "learning_rate": 5.850247650868911e-05, "loss": 2.2499, "step": 99800 }, { "epoch": 0.62, "learning_rate": 5.849617411280074e-05, "loss": 2.2446, "step": 99808 }, { "epoch": 0.62, "learning_rate": 5.848987175429766e-05, "loss": 2.2566, "step": 99816 }, { "epoch": 0.62, "learning_rate": 5.8483569433336525e-05, "loss": 2.2347, "step": 99824 }, { "epoch": 0.62, "learning_rate": 5.8477267150074024e-05, "loss": 2.2644, "step": 99832 }, { "epoch": 0.62, "learning_rate": 5.847096490466682e-05, "loss": 2.2247, "step": 99840 }, { "epoch": 0.62, "learning_rate": 5.846466269727162e-05, "loss": 2.2522, "step": 99848 }, { "epoch": 0.62, "learning_rate": 5.8458360528045076e-05, "loss": 2.2334, "step": 99856 }, { "epoch": 0.62, "learning_rate": 5.845205839714385e-05, "loss": 2.2492, "step": 99864 }, { "epoch": 0.62, "learning_rate": 5.8445756304724645e-05, "loss": 2.2604, "step": 99872 }, { "epoch": 0.62, "learning_rate": 5.8439454250944105e-05, "loss": 2.2527, "step": 99880 }, { "epoch": 0.62, "learning_rate": 5.8433152235958887e-05, "loss": 2.2403, "step": 99888 }, { "epoch": 0.62, "learning_rate": 5.842685025992569e-05, "loss": 2.2535, "step": 99896 }, { "epoch": 0.62, "learning_rate": 5.842054832300119e-05, "loss": 2.2345, "step": 99904 }, { "epoch": 0.62, "learning_rate": 5.841424642534203e-05, "loss": 2.2377, "step": 99912 }, { "epoch": 0.62, "learning_rate": 5.8407944567104876e-05, "loss": 2.2578, "step": 99920 }, { "epoch": 0.62, "learning_rate": 5.84016427484464e-05, "loss": 2.2531, "step": 99928 }, { "epoch": 0.62, "learning_rate": 5.839534096952326e-05, "loss": 2.2459, "step": 99936 }, { "epoch": 0.62, "learning_rate": 5.838903923049214e-05, "loss": 2.2359, "step": 99944 }, { "epoch": 0.62, "learning_rate": 5.8382737531509665e-05, "loss": 2.2538, "step": 99952 }, { "epoch": 0.62, "learning_rate": 5.837643587273252e-05, "loss": 2.2514, "step": 99960 }, { "epoch": 0.62, "learning_rate": 5.837013425431738e-05, "loss": 2.2313, "step": 99968 }, { "epoch": 0.62, "learning_rate": 5.8363832676420873e-05, "loss": 2.2552, "step": 99976 }, { "epoch": 0.62, "learning_rate": 5.835753113919966e-05, "loss": 2.2534, "step": 99984 }, { "epoch": 0.62, "learning_rate": 5.8351229642810414e-05, "loss": 2.2492, "step": 99992 }, { "epoch": 0.62, "learning_rate": 5.8344928187409774e-05, "loss": 2.2576, "step": 100000 }, { "epoch": 0.63, "learning_rate": 5.8338626773154424e-05, "loss": 2.2427, "step": 100008 }, { "epoch": 0.63, "learning_rate": 5.8332325400200996e-05, "loss": 2.2394, "step": 100016 }, { "epoch": 0.63, "learning_rate": 5.832602406870613e-05, "loss": 2.2547, "step": 100024 }, { "epoch": 0.63, "learning_rate": 5.831972277882651e-05, "loss": 2.2597, "step": 100032 }, { "epoch": 0.63, "learning_rate": 5.831342153071877e-05, "loss": 2.2641, "step": 100040 }, { "epoch": 0.63, "learning_rate": 5.830712032453955e-05, "loss": 2.2506, "step": 100048 }, { "epoch": 0.63, "learning_rate": 5.830081916044551e-05, "loss": 2.2459, "step": 100056 }, { "epoch": 0.63, "learning_rate": 5.8294518038593306e-05, "loss": 2.2496, "step": 100064 }, { "epoch": 0.63, "learning_rate": 5.8288216959139566e-05, "loss": 2.2529, "step": 100072 }, { "epoch": 0.63, "learning_rate": 5.828191592224094e-05, "loss": 2.2325, "step": 100080 }, { "epoch": 0.63, "learning_rate": 5.827561492805409e-05, "loss": 2.2611, "step": 100088 }, { "epoch": 0.63, "learning_rate": 5.826931397673563e-05, "loss": 2.2425, "step": 100096 }, { "epoch": 0.63, "learning_rate": 5.826301306844224e-05, "loss": 2.2426, "step": 100104 }, { "epoch": 0.63, "learning_rate": 5.825671220333051e-05, "loss": 2.2445, "step": 100112 }, { "epoch": 0.63, "learning_rate": 5.8250411381557135e-05, "loss": 2.255, "step": 100120 }, { "epoch": 0.63, "learning_rate": 5.824411060327873e-05, "loss": 2.2495, "step": 100128 }, { "epoch": 0.63, "learning_rate": 5.823780986865193e-05, "loss": 2.2522, "step": 100136 }, { "epoch": 0.63, "learning_rate": 5.8231509177833366e-05, "loss": 2.2483, "step": 100144 }, { "epoch": 0.63, "learning_rate": 5.822520853097968e-05, "loss": 2.2459, "step": 100152 }, { "epoch": 0.63, "learning_rate": 5.8218907928247515e-05, "loss": 2.2407, "step": 100160 }, { "epoch": 0.63, "learning_rate": 5.82126073697935e-05, "loss": 2.2656, "step": 100168 }, { "epoch": 0.63, "learning_rate": 5.820630685577426e-05, "loss": 2.2502, "step": 100176 }, { "epoch": 0.63, "learning_rate": 5.820000638634644e-05, "loss": 2.2352, "step": 100184 }, { "epoch": 0.63, "learning_rate": 5.8193705961666665e-05, "loss": 2.237, "step": 100192 }, { "epoch": 0.63, "learning_rate": 5.8187405581891555e-05, "loss": 2.2374, "step": 100200 }, { "epoch": 0.63, "learning_rate": 5.8181105247177744e-05, "loss": 2.2593, "step": 100208 }, { "epoch": 0.63, "learning_rate": 5.8174804957681886e-05, "loss": 2.2459, "step": 100216 }, { "epoch": 0.63, "learning_rate": 5.816850471356056e-05, "loss": 2.2542, "step": 100224 }, { "epoch": 0.63, "learning_rate": 5.81622045149704e-05, "loss": 2.2482, "step": 100232 }, { "epoch": 0.63, "learning_rate": 5.8155904362068056e-05, "loss": 2.2293, "step": 100240 }, { "epoch": 0.63, "learning_rate": 5.814960425501014e-05, "loss": 2.2539, "step": 100248 }, { "epoch": 0.63, "learning_rate": 5.8143304193953266e-05, "loss": 2.2592, "step": 100256 }, { "epoch": 0.63, "learning_rate": 5.813700417905406e-05, "loss": 2.2534, "step": 100264 }, { "epoch": 0.63, "learning_rate": 5.8130704210469134e-05, "loss": 2.2482, "step": 100272 }, { "epoch": 0.63, "learning_rate": 5.8124404288355114e-05, "loss": 2.2332, "step": 100280 }, { "epoch": 0.63, "learning_rate": 5.8118104412868625e-05, "loss": 2.2379, "step": 100288 }, { "epoch": 0.63, "learning_rate": 5.811180458416625e-05, "loss": 2.2426, "step": 100296 }, { "epoch": 0.63, "learning_rate": 5.8105504802404644e-05, "loss": 2.2441, "step": 100304 }, { "epoch": 0.63, "learning_rate": 5.8099205067740384e-05, "loss": 2.247, "step": 100312 }, { "epoch": 0.63, "learning_rate": 5.809290538033012e-05, "loss": 2.2196, "step": 100320 }, { "epoch": 0.63, "learning_rate": 5.808660574033041e-05, "loss": 2.2427, "step": 100328 }, { "epoch": 0.63, "learning_rate": 5.8080306147897926e-05, "loss": 2.2516, "step": 100336 }, { "epoch": 0.63, "learning_rate": 5.807400660318925e-05, "loss": 2.2438, "step": 100344 }, { "epoch": 0.63, "learning_rate": 5.806770710636096e-05, "loss": 2.2406, "step": 100352 }, { "epoch": 0.63, "learning_rate": 5.806140765756969e-05, "loss": 2.2291, "step": 100360 }, { "epoch": 0.63, "learning_rate": 5.805510825697206e-05, "loss": 2.247, "step": 100368 }, { "epoch": 0.63, "learning_rate": 5.804880890472466e-05, "loss": 2.246, "step": 100376 }, { "epoch": 0.63, "learning_rate": 5.8042509600984076e-05, "loss": 2.2411, "step": 100384 }, { "epoch": 0.63, "learning_rate": 5.8036210345906916e-05, "loss": 2.2521, "step": 100392 }, { "epoch": 0.63, "learning_rate": 5.802991113964981e-05, "loss": 2.2322, "step": 100400 }, { "epoch": 0.63, "learning_rate": 5.802361198236932e-05, "loss": 2.2633, "step": 100408 }, { "epoch": 0.63, "learning_rate": 5.8017312874222065e-05, "loss": 2.243, "step": 100416 }, { "epoch": 0.63, "learning_rate": 5.801101381536462e-05, "loss": 2.2389, "step": 100424 }, { "epoch": 0.63, "learning_rate": 5.8004714805953607e-05, "loss": 2.2332, "step": 100432 }, { "epoch": 0.63, "learning_rate": 5.799841584614561e-05, "loss": 2.2352, "step": 100440 }, { "epoch": 0.63, "learning_rate": 5.799211693609721e-05, "loss": 2.2373, "step": 100448 }, { "epoch": 0.63, "learning_rate": 5.798581807596502e-05, "loss": 2.2545, "step": 100456 }, { "epoch": 0.63, "learning_rate": 5.79795192659056e-05, "loss": 2.2448, "step": 100464 }, { "epoch": 0.63, "learning_rate": 5.797322050607558e-05, "loss": 2.2376, "step": 100472 }, { "epoch": 0.63, "learning_rate": 5.79669217966315e-05, "loss": 2.261, "step": 100480 }, { "epoch": 0.63, "learning_rate": 5.796062313772999e-05, "loss": 2.2508, "step": 100488 }, { "epoch": 0.63, "learning_rate": 5.795432452952763e-05, "loss": 2.2464, "step": 100496 }, { "epoch": 0.63, "learning_rate": 5.7948025972180964e-05, "loss": 2.256, "step": 100504 }, { "epoch": 0.63, "learning_rate": 5.794172746584661e-05, "loss": 2.2574, "step": 100512 }, { "epoch": 0.63, "learning_rate": 5.793542901068116e-05, "loss": 2.2332, "step": 100520 }, { "epoch": 0.63, "learning_rate": 5.792913060684115e-05, "loss": 2.247, "step": 100528 }, { "epoch": 0.63, "learning_rate": 5.7922832254483203e-05, "loss": 2.2315, "step": 100536 }, { "epoch": 0.63, "learning_rate": 5.791653395376387e-05, "loss": 2.2415, "step": 100544 }, { "epoch": 0.63, "learning_rate": 5.7910235704839753e-05, "loss": 2.2552, "step": 100552 }, { "epoch": 0.63, "learning_rate": 5.7903937507867404e-05, "loss": 2.2477, "step": 100560 }, { "epoch": 0.63, "learning_rate": 5.7897639363003396e-05, "loss": 2.2503, "step": 100568 }, { "epoch": 0.63, "learning_rate": 5.789134127040432e-05, "loss": 2.2433, "step": 100576 }, { "epoch": 0.63, "learning_rate": 5.788504323022672e-05, "loss": 2.2495, "step": 100584 }, { "epoch": 0.63, "learning_rate": 5.7878745242627196e-05, "loss": 2.2519, "step": 100592 }, { "epoch": 0.63, "learning_rate": 5.787244730776229e-05, "loss": 2.2669, "step": 100600 }, { "epoch": 0.63, "learning_rate": 5.7866149425788594e-05, "loss": 2.2552, "step": 100608 }, { "epoch": 0.63, "learning_rate": 5.785985159686267e-05, "loss": 2.2544, "step": 100616 }, { "epoch": 0.63, "learning_rate": 5.785355382114106e-05, "loss": 2.2594, "step": 100624 }, { "epoch": 0.63, "learning_rate": 5.7847256098780356e-05, "loss": 2.256, "step": 100632 }, { "epoch": 0.63, "learning_rate": 5.784095842993709e-05, "loss": 2.2442, "step": 100640 }, { "epoch": 0.63, "learning_rate": 5.783466081476785e-05, "loss": 2.2586, "step": 100648 }, { "epoch": 0.63, "learning_rate": 5.78283632534292e-05, "loss": 2.2471, "step": 100656 }, { "epoch": 0.63, "learning_rate": 5.782206574607766e-05, "loss": 2.2561, "step": 100664 }, { "epoch": 0.63, "learning_rate": 5.781576829286981e-05, "loss": 2.2574, "step": 100672 }, { "epoch": 0.63, "learning_rate": 5.780947089396221e-05, "loss": 2.2558, "step": 100680 }, { "epoch": 0.63, "learning_rate": 5.780317354951143e-05, "loss": 2.2497, "step": 100688 }, { "epoch": 0.63, "learning_rate": 5.779687625967398e-05, "loss": 2.2634, "step": 100696 }, { "epoch": 0.63, "learning_rate": 5.779057902460643e-05, "loss": 2.2411, "step": 100704 }, { "epoch": 0.63, "learning_rate": 5.7784281844465336e-05, "loss": 2.2474, "step": 100712 }, { "epoch": 0.63, "learning_rate": 5.777798471940725e-05, "loss": 2.2497, "step": 100720 }, { "epoch": 0.63, "learning_rate": 5.777168764958871e-05, "loss": 2.2472, "step": 100728 }, { "epoch": 0.63, "learning_rate": 5.776539063516626e-05, "loss": 2.2421, "step": 100736 }, { "epoch": 0.63, "learning_rate": 5.775909367629647e-05, "loss": 2.2649, "step": 100744 }, { "epoch": 0.63, "learning_rate": 5.775279677313585e-05, "loss": 2.2484, "step": 100752 }, { "epoch": 0.63, "learning_rate": 5.774649992584096e-05, "loss": 2.2546, "step": 100760 }, { "epoch": 0.63, "learning_rate": 5.7740203134568316e-05, "loss": 2.2587, "step": 100768 }, { "epoch": 0.63, "learning_rate": 5.773390639947449e-05, "loss": 2.2629, "step": 100776 }, { "epoch": 0.63, "learning_rate": 5.772760972071601e-05, "loss": 2.2596, "step": 100784 }, { "epoch": 0.63, "learning_rate": 5.7721313098449394e-05, "loss": 2.236, "step": 100792 }, { "epoch": 0.63, "learning_rate": 5.77150165328312e-05, "loss": 2.2584, "step": 100800 }, { "epoch": 0.63, "learning_rate": 5.770872002401795e-05, "loss": 2.2409, "step": 100808 }, { "epoch": 0.63, "learning_rate": 5.7702423572166176e-05, "loss": 2.2473, "step": 100816 }, { "epoch": 0.63, "learning_rate": 5.76961271774324e-05, "loss": 2.2461, "step": 100824 }, { "epoch": 0.63, "learning_rate": 5.768983083997318e-05, "loss": 2.2302, "step": 100832 }, { "epoch": 0.63, "learning_rate": 5.768353455994502e-05, "loss": 2.2448, "step": 100840 }, { "epoch": 0.63, "learning_rate": 5.7677238337504447e-05, "loss": 2.2475, "step": 100848 }, { "epoch": 0.63, "learning_rate": 5.7670942172807974e-05, "loss": 2.2527, "step": 100856 }, { "epoch": 0.63, "learning_rate": 5.766464606601216e-05, "loss": 2.2589, "step": 100864 }, { "epoch": 0.63, "learning_rate": 5.765835001727351e-05, "loss": 2.257, "step": 100872 }, { "epoch": 0.63, "learning_rate": 5.7652054026748525e-05, "loss": 2.2368, "step": 100880 }, { "epoch": 0.63, "learning_rate": 5.764575809459374e-05, "loss": 2.2415, "step": 100888 }, { "epoch": 0.63, "learning_rate": 5.763946222096568e-05, "loss": 2.2606, "step": 100896 }, { "epoch": 0.63, "learning_rate": 5.7633166406020855e-05, "loss": 2.2371, "step": 100904 }, { "epoch": 0.63, "learning_rate": 5.762687064991579e-05, "loss": 2.2348, "step": 100912 }, { "epoch": 0.63, "learning_rate": 5.762057495280696e-05, "loss": 2.2429, "step": 100920 }, { "epoch": 0.63, "learning_rate": 5.7614279314850926e-05, "loss": 2.2507, "step": 100928 }, { "epoch": 0.63, "learning_rate": 5.760798373620416e-05, "loss": 2.252, "step": 100936 }, { "epoch": 0.63, "learning_rate": 5.7601688217023206e-05, "loss": 2.2387, "step": 100944 }, { "epoch": 0.63, "learning_rate": 5.759539275746453e-05, "loss": 2.2674, "step": 100952 }, { "epoch": 0.63, "learning_rate": 5.758909735768467e-05, "loss": 2.2573, "step": 100960 }, { "epoch": 0.63, "learning_rate": 5.758280201784013e-05, "loss": 2.2467, "step": 100968 }, { "epoch": 0.63, "learning_rate": 5.757650673808739e-05, "loss": 2.2477, "step": 100976 }, { "epoch": 0.63, "learning_rate": 5.7570211518582976e-05, "loss": 2.2292, "step": 100984 }, { "epoch": 0.63, "learning_rate": 5.756391635948335e-05, "loss": 2.2571, "step": 100992 }, { "epoch": 0.63, "learning_rate": 5.755762126094506e-05, "loss": 2.2519, "step": 101000 }, { "epoch": 0.63, "learning_rate": 5.755132622312458e-05, "loss": 2.261, "step": 101008 }, { "epoch": 0.63, "learning_rate": 5.754503124617841e-05, "loss": 2.2455, "step": 101016 }, { "epoch": 0.63, "learning_rate": 5.753873633026302e-05, "loss": 2.2485, "step": 101024 }, { "epoch": 0.63, "learning_rate": 5.7532441475534926e-05, "loss": 2.2382, "step": 101032 }, { "epoch": 0.63, "learning_rate": 5.7526146682150615e-05, "loss": 2.2505, "step": 101040 }, { "epoch": 0.63, "learning_rate": 5.751985195026659e-05, "loss": 2.2373, "step": 101048 }, { "epoch": 0.63, "learning_rate": 5.75135572800393e-05, "loss": 2.2437, "step": 101056 }, { "epoch": 0.63, "learning_rate": 5.750726267162527e-05, "loss": 2.2409, "step": 101064 }, { "epoch": 0.63, "learning_rate": 5.7500968125180956e-05, "loss": 2.243, "step": 101072 }, { "epoch": 0.63, "learning_rate": 5.7494673640862875e-05, "loss": 2.2443, "step": 101080 }, { "epoch": 0.63, "learning_rate": 5.748837921882747e-05, "loss": 2.2404, "step": 101088 }, { "epoch": 0.63, "learning_rate": 5.748208485923126e-05, "loss": 2.2578, "step": 101096 }, { "epoch": 0.63, "learning_rate": 5.747579056223068e-05, "loss": 2.2509, "step": 101104 }, { "epoch": 0.63, "learning_rate": 5.746949632798224e-05, "loss": 2.232, "step": 101112 }, { "epoch": 0.63, "learning_rate": 5.746320215664241e-05, "loss": 2.2555, "step": 101120 }, { "epoch": 0.63, "learning_rate": 5.745690804836765e-05, "loss": 2.2453, "step": 101128 }, { "epoch": 0.63, "learning_rate": 5.745061400331444e-05, "loss": 2.2499, "step": 101136 }, { "epoch": 0.63, "learning_rate": 5.744432002163926e-05, "loss": 2.2607, "step": 101144 }, { "epoch": 0.63, "learning_rate": 5.7438026103498575e-05, "loss": 2.2429, "step": 101152 }, { "epoch": 0.63, "learning_rate": 5.7431732249048844e-05, "loss": 2.2424, "step": 101160 }, { "epoch": 0.63, "learning_rate": 5.7425438458446525e-05, "loss": 2.2397, "step": 101168 }, { "epoch": 0.63, "learning_rate": 5.741914473184811e-05, "loss": 2.2615, "step": 101176 }, { "epoch": 0.63, "learning_rate": 5.741285106941003e-05, "loss": 2.2458, "step": 101184 }, { "epoch": 0.63, "learning_rate": 5.740655747128878e-05, "loss": 2.2366, "step": 101192 }, { "epoch": 0.63, "learning_rate": 5.74002639376408e-05, "loss": 2.2488, "step": 101200 }, { "epoch": 0.63, "learning_rate": 5.739397046862254e-05, "loss": 2.2535, "step": 101208 }, { "epoch": 0.63, "learning_rate": 5.738767706439048e-05, "loss": 2.2496, "step": 101216 }, { "epoch": 0.63, "learning_rate": 5.738138372510104e-05, "loss": 2.236, "step": 101224 }, { "epoch": 0.63, "learning_rate": 5.737509045091072e-05, "loss": 2.2642, "step": 101232 }, { "epoch": 0.63, "learning_rate": 5.736879724197594e-05, "loss": 2.2553, "step": 101240 }, { "epoch": 0.63, "learning_rate": 5.736250409845314e-05, "loss": 2.2423, "step": 101248 }, { "epoch": 0.63, "learning_rate": 5.7356211020498795e-05, "loss": 2.2625, "step": 101256 }, { "epoch": 0.63, "learning_rate": 5.7349918008269346e-05, "loss": 2.2475, "step": 101264 }, { "epoch": 0.63, "learning_rate": 5.7343625061921225e-05, "loss": 2.2457, "step": 101272 }, { "epoch": 0.63, "learning_rate": 5.733733218161088e-05, "loss": 2.2557, "step": 101280 }, { "epoch": 0.63, "learning_rate": 5.733103936749477e-05, "loss": 2.2517, "step": 101288 }, { "epoch": 0.63, "learning_rate": 5.732474661972931e-05, "loss": 2.2674, "step": 101296 }, { "epoch": 0.63, "learning_rate": 5.731845393847095e-05, "loss": 2.2554, "step": 101304 }, { "epoch": 0.63, "learning_rate": 5.731216132387612e-05, "loss": 2.2614, "step": 101312 }, { "epoch": 0.63, "learning_rate": 5.7305868776101265e-05, "loss": 2.2521, "step": 101320 }, { "epoch": 0.63, "learning_rate": 5.729957629530283e-05, "loss": 2.2619, "step": 101328 }, { "epoch": 0.63, "learning_rate": 5.7293283881637214e-05, "loss": 2.2626, "step": 101336 }, { "epoch": 0.63, "learning_rate": 5.728699153526087e-05, "loss": 2.2684, "step": 101344 }, { "epoch": 0.63, "learning_rate": 5.7280699256330214e-05, "loss": 2.2379, "step": 101352 }, { "epoch": 0.63, "learning_rate": 5.727440704500169e-05, "loss": 2.2419, "step": 101360 }, { "epoch": 0.63, "learning_rate": 5.72681149014317e-05, "loss": 2.2521, "step": 101368 }, { "epoch": 0.63, "learning_rate": 5.72618228257767e-05, "loss": 2.2369, "step": 101376 }, { "epoch": 0.63, "learning_rate": 5.725553081819306e-05, "loss": 2.241, "step": 101384 }, { "epoch": 0.63, "learning_rate": 5.7249238878837264e-05, "loss": 2.242, "step": 101392 }, { "epoch": 0.63, "learning_rate": 5.7242947007865686e-05, "loss": 2.2515, "step": 101400 }, { "epoch": 0.63, "learning_rate": 5.7236655205434754e-05, "loss": 2.245, "step": 101408 }, { "epoch": 0.63, "learning_rate": 5.723036347170088e-05, "loss": 2.2454, "step": 101416 }, { "epoch": 0.63, "learning_rate": 5.722407180682048e-05, "loss": 2.2488, "step": 101424 }, { "epoch": 0.63, "learning_rate": 5.7217780210949976e-05, "loss": 2.2462, "step": 101432 }, { "epoch": 0.63, "learning_rate": 5.7211488684245764e-05, "loss": 2.2413, "step": 101440 }, { "epoch": 0.63, "learning_rate": 5.720519722686426e-05, "loss": 2.2605, "step": 101448 }, { "epoch": 0.63, "learning_rate": 5.719890583896186e-05, "loss": 2.256, "step": 101456 }, { "epoch": 0.63, "learning_rate": 5.7192614520694975e-05, "loss": 2.2581, "step": 101464 }, { "epoch": 0.63, "learning_rate": 5.718632327222002e-05, "loss": 2.2449, "step": 101472 }, { "epoch": 0.63, "learning_rate": 5.7180032093693356e-05, "loss": 2.2629, "step": 101480 }, { "epoch": 0.63, "learning_rate": 5.717374098527144e-05, "loss": 2.2635, "step": 101488 }, { "epoch": 0.63, "learning_rate": 5.716744994711063e-05, "loss": 2.2575, "step": 101496 }, { "epoch": 0.63, "learning_rate": 5.7161158979367326e-05, "loss": 2.2783, "step": 101504 }, { "epoch": 0.63, "learning_rate": 5.715486808219793e-05, "loss": 2.2436, "step": 101512 }, { "epoch": 0.63, "learning_rate": 5.714857725575884e-05, "loss": 2.2379, "step": 101520 }, { "epoch": 0.63, "learning_rate": 5.7142286500206435e-05, "loss": 2.245, "step": 101528 }, { "epoch": 0.63, "learning_rate": 5.713599581569711e-05, "loss": 2.2431, "step": 101536 }, { "epoch": 0.63, "learning_rate": 5.7129705202387244e-05, "loss": 2.2387, "step": 101544 }, { "epoch": 0.63, "learning_rate": 5.712341466043323e-05, "loss": 2.2298, "step": 101552 }, { "epoch": 0.63, "learning_rate": 5.7117124189991457e-05, "loss": 2.253, "step": 101560 }, { "epoch": 0.63, "learning_rate": 5.7110833791218286e-05, "loss": 2.2295, "step": 101568 }, { "epoch": 0.63, "learning_rate": 5.7104543464270135e-05, "loss": 2.2564, "step": 101576 }, { "epoch": 0.63, "learning_rate": 5.7098253209303346e-05, "loss": 2.2471, "step": 101584 }, { "epoch": 0.63, "learning_rate": 5.7091963026474306e-05, "loss": 2.2551, "step": 101592 }, { "epoch": 0.64, "learning_rate": 5.708567291593938e-05, "loss": 2.2501, "step": 101600 }, { "epoch": 0.64, "learning_rate": 5.707938287785497e-05, "loss": 2.2491, "step": 101608 }, { "epoch": 0.64, "learning_rate": 5.7073092912377425e-05, "loss": 2.2571, "step": 101616 }, { "epoch": 0.64, "learning_rate": 5.706680301966312e-05, "loss": 2.2574, "step": 101624 }, { "epoch": 0.64, "learning_rate": 5.7060513199868424e-05, "loss": 2.2515, "step": 101632 }, { "epoch": 0.64, "learning_rate": 5.705422345314968e-05, "loss": 2.2347, "step": 101640 }, { "epoch": 0.64, "learning_rate": 5.7047933779663284e-05, "loss": 2.2563, "step": 101648 }, { "epoch": 0.64, "learning_rate": 5.704164417956561e-05, "loss": 2.2451, "step": 101656 }, { "epoch": 0.64, "learning_rate": 5.703535465301295e-05, "loss": 2.2397, "step": 101664 }, { "epoch": 0.64, "learning_rate": 5.7029065200161736e-05, "loss": 2.242, "step": 101672 }, { "epoch": 0.64, "learning_rate": 5.702277582116829e-05, "loss": 2.2369, "step": 101680 }, { "epoch": 0.64, "learning_rate": 5.701648651618896e-05, "loss": 2.2385, "step": 101688 }, { "epoch": 0.64, "learning_rate": 5.701019728538011e-05, "loss": 2.2412, "step": 101696 }, { "epoch": 0.64, "learning_rate": 5.70039081288981e-05, "loss": 2.2739, "step": 101704 }, { "epoch": 0.64, "learning_rate": 5.699761904689929e-05, "loss": 2.2501, "step": 101712 }, { "epoch": 0.64, "learning_rate": 5.699133003953998e-05, "loss": 2.2512, "step": 101720 }, { "epoch": 0.64, "learning_rate": 5.698504110697653e-05, "loss": 2.2332, "step": 101728 }, { "epoch": 0.64, "learning_rate": 5.6978752249365334e-05, "loss": 2.2365, "step": 101736 }, { "epoch": 0.64, "learning_rate": 5.697246346686267e-05, "loss": 2.2568, "step": 101744 }, { "epoch": 0.64, "learning_rate": 5.69661747596249e-05, "loss": 2.2425, "step": 101752 }, { "epoch": 0.64, "learning_rate": 5.695988612780838e-05, "loss": 2.2425, "step": 101760 }, { "epoch": 0.64, "learning_rate": 5.6953597571569425e-05, "loss": 2.2495, "step": 101768 }, { "epoch": 0.64, "learning_rate": 5.6947309091064384e-05, "loss": 2.2597, "step": 101776 }, { "epoch": 0.64, "learning_rate": 5.694102068644958e-05, "loss": 2.255, "step": 101784 }, { "epoch": 0.64, "learning_rate": 5.693473235788134e-05, "loss": 2.2644, "step": 101792 }, { "epoch": 0.64, "learning_rate": 5.692844410551599e-05, "loss": 2.2572, "step": 101800 }, { "epoch": 0.64, "learning_rate": 5.6922155929509866e-05, "loss": 2.2441, "step": 101808 }, { "epoch": 0.64, "learning_rate": 5.6915867830019306e-05, "loss": 2.2329, "step": 101816 }, { "epoch": 0.64, "learning_rate": 5.690957980720062e-05, "loss": 2.2449, "step": 101824 }, { "epoch": 0.64, "learning_rate": 5.690329186121011e-05, "loss": 2.2474, "step": 101832 }, { "epoch": 0.64, "learning_rate": 5.6897003992204124e-05, "loss": 2.2609, "step": 101840 }, { "epoch": 0.64, "learning_rate": 5.689071620033894e-05, "loss": 2.2608, "step": 101848 }, { "epoch": 0.64, "learning_rate": 5.688442848577093e-05, "loss": 2.2569, "step": 101856 }, { "epoch": 0.64, "learning_rate": 5.687814084865637e-05, "loss": 2.2465, "step": 101864 }, { "epoch": 0.64, "learning_rate": 5.687185328915159e-05, "loss": 2.2318, "step": 101872 }, { "epoch": 0.64, "learning_rate": 5.686556580741287e-05, "loss": 2.2536, "step": 101880 }, { "epoch": 0.64, "learning_rate": 5.685927840359653e-05, "loss": 2.2433, "step": 101888 }, { "epoch": 0.64, "learning_rate": 5.685299107785891e-05, "loss": 2.2436, "step": 101896 }, { "epoch": 0.64, "learning_rate": 5.6846703830356265e-05, "loss": 2.2615, "step": 101904 }, { "epoch": 0.64, "learning_rate": 5.684041666124491e-05, "loss": 2.2344, "step": 101912 }, { "epoch": 0.64, "learning_rate": 5.683412957068115e-05, "loss": 2.2397, "step": 101920 }, { "epoch": 0.64, "learning_rate": 5.6827842558821306e-05, "loss": 2.2403, "step": 101928 }, { "epoch": 0.64, "learning_rate": 5.682155562582164e-05, "loss": 2.248, "step": 101936 }, { "epoch": 0.64, "learning_rate": 5.681526877183846e-05, "loss": 2.2503, "step": 101944 }, { "epoch": 0.64, "learning_rate": 5.680898199702807e-05, "loss": 2.2421, "step": 101952 }, { "epoch": 0.64, "learning_rate": 5.6802695301546715e-05, "loss": 2.2394, "step": 101960 }, { "epoch": 0.64, "learning_rate": 5.6796408685550716e-05, "loss": 2.2474, "step": 101968 }, { "epoch": 0.64, "learning_rate": 5.679012214919639e-05, "loss": 2.2436, "step": 101976 }, { "epoch": 0.64, "learning_rate": 5.678383569263996e-05, "loss": 2.2335, "step": 101984 }, { "epoch": 0.64, "learning_rate": 5.6777549316037734e-05, "loss": 2.2316, "step": 101992 }, { "epoch": 0.64, "learning_rate": 5.6771263019546005e-05, "loss": 2.2516, "step": 102000 }, { "epoch": 0.64, "learning_rate": 5.676497680332104e-05, "loss": 2.239, "step": 102008 }, { "epoch": 0.64, "learning_rate": 5.67586906675191e-05, "loss": 2.25, "step": 102016 }, { "epoch": 0.64, "learning_rate": 5.675240461229648e-05, "loss": 2.2327, "step": 102024 }, { "epoch": 0.64, "learning_rate": 5.674611863780945e-05, "loss": 2.2278, "step": 102032 }, { "epoch": 0.64, "learning_rate": 5.6739832744214284e-05, "loss": 2.2361, "step": 102040 }, { "epoch": 0.64, "learning_rate": 5.6733546931667226e-05, "loss": 2.2459, "step": 102048 }, { "epoch": 0.64, "learning_rate": 5.672726120032457e-05, "loss": 2.2475, "step": 102056 }, { "epoch": 0.64, "learning_rate": 5.672097555034256e-05, "loss": 2.2343, "step": 102064 }, { "epoch": 0.64, "learning_rate": 5.6714689981877466e-05, "loss": 2.2418, "step": 102072 }, { "epoch": 0.64, "learning_rate": 5.6708404495085545e-05, "loss": 2.2607, "step": 102080 }, { "epoch": 0.64, "learning_rate": 5.6702119090123085e-05, "loss": 2.2514, "step": 102088 }, { "epoch": 0.64, "learning_rate": 5.6695833767146265e-05, "loss": 2.2219, "step": 102096 }, { "epoch": 0.64, "learning_rate": 5.668954852631142e-05, "loss": 2.2521, "step": 102104 }, { "epoch": 0.64, "learning_rate": 5.6683263367774786e-05, "loss": 2.261, "step": 102112 }, { "epoch": 0.64, "learning_rate": 5.667697829169256e-05, "loss": 2.2464, "step": 102120 }, { "epoch": 0.64, "learning_rate": 5.6670693298221056e-05, "loss": 2.248, "step": 102128 }, { "epoch": 0.64, "learning_rate": 5.6664408387516456e-05, "loss": 2.2366, "step": 102136 }, { "epoch": 0.64, "learning_rate": 5.6658123559735074e-05, "loss": 2.2437, "step": 102144 }, { "epoch": 0.64, "learning_rate": 5.6651838815033095e-05, "loss": 2.2462, "step": 102152 }, { "epoch": 0.64, "learning_rate": 5.664555415356678e-05, "loss": 2.2376, "step": 102160 }, { "epoch": 0.64, "learning_rate": 5.663926957549237e-05, "loss": 2.2267, "step": 102168 }, { "epoch": 0.64, "learning_rate": 5.663298508096611e-05, "loss": 2.2402, "step": 102176 }, { "epoch": 0.64, "learning_rate": 5.6626700670144195e-05, "loss": 2.2338, "step": 102184 }, { "epoch": 0.64, "learning_rate": 5.6620416343182894e-05, "loss": 2.225, "step": 102192 }, { "epoch": 0.64, "learning_rate": 5.6614132100238406e-05, "loss": 2.2464, "step": 102200 }, { "epoch": 0.64, "learning_rate": 5.660784794146698e-05, "loss": 2.2538, "step": 102208 }, { "epoch": 0.64, "learning_rate": 5.660156386702483e-05, "loss": 2.2542, "step": 102216 }, { "epoch": 0.64, "learning_rate": 5.6595279877068206e-05, "loss": 2.227, "step": 102224 }, { "epoch": 0.64, "learning_rate": 5.6588995971753286e-05, "loss": 2.2481, "step": 102232 }, { "epoch": 0.64, "learning_rate": 5.6582712151236305e-05, "loss": 2.2516, "step": 102240 }, { "epoch": 0.64, "learning_rate": 5.6576428415673497e-05, "loss": 2.2416, "step": 102248 }, { "epoch": 0.64, "learning_rate": 5.657014476522107e-05, "loss": 2.2475, "step": 102256 }, { "epoch": 0.64, "learning_rate": 5.656386120003521e-05, "loss": 2.2478, "step": 102264 }, { "epoch": 0.64, "learning_rate": 5.655757772027215e-05, "loss": 2.2409, "step": 102272 }, { "epoch": 0.64, "learning_rate": 5.65512943260881e-05, "loss": 2.2466, "step": 102280 }, { "epoch": 0.64, "learning_rate": 5.654501101763925e-05, "loss": 2.2376, "step": 102288 }, { "epoch": 0.64, "learning_rate": 5.653872779508182e-05, "loss": 2.2645, "step": 102296 }, { "epoch": 0.64, "learning_rate": 5.653244465857203e-05, "loss": 2.2539, "step": 102304 }, { "epoch": 0.64, "learning_rate": 5.652616160826603e-05, "loss": 2.2407, "step": 102312 }, { "epoch": 0.64, "learning_rate": 5.651987864432003e-05, "loss": 2.2563, "step": 102320 }, { "epoch": 0.64, "learning_rate": 5.651359576689026e-05, "loss": 2.2427, "step": 102328 }, { "epoch": 0.64, "learning_rate": 5.650731297613288e-05, "loss": 2.238, "step": 102336 }, { "epoch": 0.64, "learning_rate": 5.650103027220409e-05, "loss": 2.2236, "step": 102344 }, { "epoch": 0.64, "learning_rate": 5.6494747655260075e-05, "loss": 2.2415, "step": 102352 }, { "epoch": 0.64, "learning_rate": 5.648846512545705e-05, "loss": 2.2318, "step": 102360 }, { "epoch": 0.64, "learning_rate": 5.6482182682951156e-05, "loss": 2.2638, "step": 102368 }, { "epoch": 0.64, "learning_rate": 5.64759003278986e-05, "loss": 2.2381, "step": 102376 }, { "epoch": 0.64, "learning_rate": 5.646961806045556e-05, "loss": 2.2521, "step": 102384 }, { "epoch": 0.64, "learning_rate": 5.64633358807782e-05, "loss": 2.2584, "step": 102392 }, { "epoch": 0.64, "learning_rate": 5.645705378902271e-05, "loss": 2.2619, "step": 102400 }, { "epoch": 0.64, "learning_rate": 5.645077178534526e-05, "loss": 2.2366, "step": 102408 }, { "epoch": 0.64, "learning_rate": 5.644448986990204e-05, "loss": 2.2632, "step": 102416 }, { "epoch": 0.64, "learning_rate": 5.643820804284918e-05, "loss": 2.2573, "step": 102424 }, { "epoch": 0.64, "learning_rate": 5.643192630434288e-05, "loss": 2.2435, "step": 102432 }, { "epoch": 0.64, "learning_rate": 5.6425644654539287e-05, "loss": 2.2439, "step": 102440 }, { "epoch": 0.64, "learning_rate": 5.641936309359457e-05, "loss": 2.2321, "step": 102448 }, { "epoch": 0.64, "learning_rate": 5.6413081621664875e-05, "loss": 2.2529, "step": 102456 }, { "epoch": 0.64, "learning_rate": 5.64068002389064e-05, "loss": 2.2373, "step": 102464 }, { "epoch": 0.64, "learning_rate": 5.6400518945475265e-05, "loss": 2.228, "step": 102472 }, { "epoch": 0.64, "learning_rate": 5.639423774152761e-05, "loss": 2.2372, "step": 102480 }, { "epoch": 0.64, "learning_rate": 5.6387956627219626e-05, "loss": 2.2241, "step": 102488 }, { "epoch": 0.64, "learning_rate": 5.638167560270746e-05, "loss": 2.244, "step": 102496 }, { "epoch": 0.64, "learning_rate": 5.637539466814723e-05, "loss": 2.2527, "step": 102504 }, { "epoch": 0.64, "learning_rate": 5.636911382369509e-05, "loss": 2.2589, "step": 102512 }, { "epoch": 0.64, "learning_rate": 5.6362833069507204e-05, "loss": 2.2501, "step": 102520 }, { "epoch": 0.64, "learning_rate": 5.6356552405739695e-05, "loss": 2.2374, "step": 102528 }, { "epoch": 0.64, "learning_rate": 5.6350271832548686e-05, "loss": 2.2563, "step": 102536 }, { "epoch": 0.64, "learning_rate": 5.634399135009034e-05, "loss": 2.2563, "step": 102544 }, { "epoch": 0.64, "learning_rate": 5.6337710958520774e-05, "loss": 2.2509, "step": 102552 }, { "epoch": 0.64, "learning_rate": 5.633143065799613e-05, "loss": 2.2661, "step": 102560 }, { "epoch": 0.64, "learning_rate": 5.63251504486725e-05, "loss": 2.2434, "step": 102568 }, { "epoch": 0.64, "learning_rate": 5.631887033070609e-05, "loss": 2.2546, "step": 102576 }, { "epoch": 0.64, "learning_rate": 5.6312590304252953e-05, "loss": 2.2584, "step": 102584 }, { "epoch": 0.64, "learning_rate": 5.630631036946924e-05, "loss": 2.251, "step": 102592 }, { "epoch": 0.64, "learning_rate": 5.6300030526511074e-05, "loss": 2.2598, "step": 102600 }, { "epoch": 0.64, "learning_rate": 5.629375077553454e-05, "loss": 2.2377, "step": 102608 }, { "epoch": 0.64, "learning_rate": 5.628747111669579e-05, "loss": 2.2512, "step": 102616 }, { "epoch": 0.64, "learning_rate": 5.628119155015092e-05, "loss": 2.2465, "step": 102624 }, { "epoch": 0.64, "learning_rate": 5.627491207605606e-05, "loss": 2.2575, "step": 102632 }, { "epoch": 0.64, "learning_rate": 5.62686326945673e-05, "loss": 2.2662, "step": 102640 }, { "epoch": 0.64, "learning_rate": 5.626235340584074e-05, "loss": 2.237, "step": 102648 }, { "epoch": 0.64, "learning_rate": 5.625607421003249e-05, "loss": 2.2463, "step": 102656 }, { "epoch": 0.64, "learning_rate": 5.624979510729866e-05, "loss": 2.2485, "step": 102664 }, { "epoch": 0.64, "learning_rate": 5.6243516097795356e-05, "loss": 2.2638, "step": 102672 }, { "epoch": 0.64, "learning_rate": 5.623723718167867e-05, "loss": 2.25, "step": 102680 }, { "epoch": 0.64, "learning_rate": 5.6230958359104655e-05, "loss": 2.2635, "step": 102688 }, { "epoch": 0.64, "learning_rate": 5.622467963022946e-05, "loss": 2.2444, "step": 102696 }, { "epoch": 0.64, "learning_rate": 5.6218400995209154e-05, "loss": 2.2614, "step": 102704 }, { "epoch": 0.64, "learning_rate": 5.621212245419983e-05, "loss": 2.2397, "step": 102712 }, { "epoch": 0.64, "learning_rate": 5.6205844007357555e-05, "loss": 2.2548, "step": 102720 }, { "epoch": 0.64, "learning_rate": 5.6199565654838414e-05, "loss": 2.2508, "step": 102728 }, { "epoch": 0.64, "learning_rate": 5.619328739679852e-05, "loss": 2.2626, "step": 102736 }, { "epoch": 0.64, "learning_rate": 5.6187009233393925e-05, "loss": 2.2328, "step": 102744 }, { "epoch": 0.64, "learning_rate": 5.6180731164780685e-05, "loss": 2.2369, "step": 102752 }, { "epoch": 0.64, "learning_rate": 5.617445319111492e-05, "loss": 2.2406, "step": 102760 }, { "epoch": 0.64, "learning_rate": 5.616817531255267e-05, "loss": 2.2422, "step": 102768 }, { "epoch": 0.64, "learning_rate": 5.616189752925002e-05, "loss": 2.2549, "step": 102776 }, { "epoch": 0.64, "learning_rate": 5.6155619841363004e-05, "loss": 2.2475, "step": 102784 }, { "epoch": 0.64, "learning_rate": 5.614934224904774e-05, "loss": 2.2389, "step": 102792 }, { "epoch": 0.64, "learning_rate": 5.614306475246025e-05, "loss": 2.2456, "step": 102800 }, { "epoch": 0.64, "learning_rate": 5.613678735175659e-05, "loss": 2.2538, "step": 102808 }, { "epoch": 0.64, "learning_rate": 5.6130510047092845e-05, "loss": 2.2574, "step": 102816 }, { "epoch": 0.64, "learning_rate": 5.612423283862505e-05, "loss": 2.2511, "step": 102824 }, { "epoch": 0.64, "learning_rate": 5.611795572650925e-05, "loss": 2.2542, "step": 102832 }, { "epoch": 0.64, "learning_rate": 5.611167871090152e-05, "loss": 2.2424, "step": 102840 }, { "epoch": 0.64, "learning_rate": 5.610540179195789e-05, "loss": 2.2637, "step": 102848 }, { "epoch": 0.64, "learning_rate": 5.609912496983441e-05, "loss": 2.238, "step": 102856 }, { "epoch": 0.64, "learning_rate": 5.6092848244687114e-05, "loss": 2.2508, "step": 102864 }, { "epoch": 0.64, "learning_rate": 5.608657161667206e-05, "loss": 2.2576, "step": 102872 }, { "epoch": 0.64, "learning_rate": 5.608029508594527e-05, "loss": 2.2466, "step": 102880 }, { "epoch": 0.64, "learning_rate": 5.6074018652662774e-05, "loss": 2.2255, "step": 102888 }, { "epoch": 0.64, "learning_rate": 5.606774231698064e-05, "loss": 2.2618, "step": 102896 }, { "epoch": 0.64, "learning_rate": 5.6061466079054844e-05, "loss": 2.2587, "step": 102904 }, { "epoch": 0.64, "learning_rate": 5.6055189939041455e-05, "loss": 2.2378, "step": 102912 }, { "epoch": 0.64, "learning_rate": 5.604891389709648e-05, "loss": 2.2319, "step": 102920 }, { "epoch": 0.64, "learning_rate": 5.6042637953375974e-05, "loss": 2.2452, "step": 102928 }, { "epoch": 0.64, "learning_rate": 5.603636210803591e-05, "loss": 2.2473, "step": 102936 }, { "epoch": 0.64, "learning_rate": 5.6030086361232324e-05, "loss": 2.2536, "step": 102944 }, { "epoch": 0.64, "learning_rate": 5.602381071312126e-05, "loss": 2.2586, "step": 102952 }, { "epoch": 0.64, "learning_rate": 5.601753516385869e-05, "loss": 2.2531, "step": 102960 }, { "epoch": 0.64, "learning_rate": 5.601125971360064e-05, "loss": 2.241, "step": 102968 }, { "epoch": 0.64, "learning_rate": 5.600498436250312e-05, "loss": 2.2581, "step": 102976 }, { "epoch": 0.64, "learning_rate": 5.5998709110722156e-05, "loss": 2.2515, "step": 102984 }, { "epoch": 0.64, "learning_rate": 5.5992433958413714e-05, "loss": 2.2649, "step": 102992 }, { "epoch": 0.64, "learning_rate": 5.598615890573382e-05, "loss": 2.2493, "step": 103000 }, { "epoch": 0.64, "learning_rate": 5.5979883952838485e-05, "loss": 2.2705, "step": 103008 }, { "epoch": 0.64, "learning_rate": 5.597360909988365e-05, "loss": 2.2576, "step": 103016 }, { "epoch": 0.64, "learning_rate": 5.596733434702537e-05, "loss": 2.2382, "step": 103024 }, { "epoch": 0.64, "learning_rate": 5.59610596944196e-05, "loss": 2.2417, "step": 103032 }, { "epoch": 0.64, "learning_rate": 5.595478514222234e-05, "loss": 2.2722, "step": 103040 }, { "epoch": 0.64, "learning_rate": 5.5948510690589576e-05, "loss": 2.2553, "step": 103048 }, { "epoch": 0.64, "learning_rate": 5.594223633967729e-05, "loss": 2.2603, "step": 103056 }, { "epoch": 0.64, "learning_rate": 5.593596208964147e-05, "loss": 2.2565, "step": 103064 }, { "epoch": 0.64, "learning_rate": 5.592968794063809e-05, "loss": 2.2469, "step": 103072 }, { "epoch": 0.64, "learning_rate": 5.5923413892823104e-05, "loss": 2.2375, "step": 103080 }, { "epoch": 0.64, "learning_rate": 5.591713994635253e-05, "loss": 2.2818, "step": 103088 }, { "epoch": 0.64, "learning_rate": 5.5910866101382296e-05, "loss": 2.2491, "step": 103096 }, { "epoch": 0.64, "learning_rate": 5.59045923580684e-05, "loss": 2.2446, "step": 103104 }, { "epoch": 0.64, "learning_rate": 5.589831871656679e-05, "loss": 2.256, "step": 103112 }, { "epoch": 0.64, "learning_rate": 5.589204517703346e-05, "loss": 2.2602, "step": 103120 }, { "epoch": 0.64, "learning_rate": 5.5885771739624325e-05, "loss": 2.2528, "step": 103128 }, { "epoch": 0.64, "learning_rate": 5.587949840449535e-05, "loss": 2.2266, "step": 103136 }, { "epoch": 0.64, "learning_rate": 5.5873225171802555e-05, "loss": 2.2518, "step": 103144 }, { "epoch": 0.64, "learning_rate": 5.5866952041701825e-05, "loss": 2.2538, "step": 103152 }, { "epoch": 0.64, "learning_rate": 5.5860679014349105e-05, "loss": 2.2532, "step": 103160 }, { "epoch": 0.64, "learning_rate": 5.58544060899004e-05, "loss": 2.2464, "step": 103168 }, { "epoch": 0.64, "learning_rate": 5.5848133268511614e-05, "loss": 2.2417, "step": 103176 }, { "epoch": 0.64, "learning_rate": 5.584186055033871e-05, "loss": 2.243, "step": 103184 }, { "epoch": 0.64, "learning_rate": 5.583558793553759e-05, "loss": 2.2314, "step": 103192 }, { "epoch": 0.65, "learning_rate": 5.582931542426426e-05, "loss": 2.2523, "step": 103200 }, { "epoch": 0.65, "learning_rate": 5.582304301667459e-05, "loss": 2.2481, "step": 103208 }, { "epoch": 0.65, "learning_rate": 5.581677071292455e-05, "loss": 2.2445, "step": 103216 }, { "epoch": 0.65, "learning_rate": 5.5810498513170064e-05, "loss": 2.2518, "step": 103224 }, { "epoch": 0.65, "learning_rate": 5.580422641756704e-05, "loss": 2.2391, "step": 103232 }, { "epoch": 0.65, "learning_rate": 5.579795442627143e-05, "loss": 2.2555, "step": 103240 }, { "epoch": 0.65, "learning_rate": 5.579168253943914e-05, "loss": 2.2682, "step": 103248 }, { "epoch": 0.65, "learning_rate": 5.57854107572261e-05, "loss": 2.2466, "step": 103256 }, { "epoch": 0.65, "learning_rate": 5.57791390797882e-05, "loss": 2.2415, "step": 103264 }, { "epoch": 0.65, "learning_rate": 5.577286750728139e-05, "loss": 2.2532, "step": 103272 }, { "epoch": 0.65, "learning_rate": 5.5766596039861585e-05, "loss": 2.258, "step": 103280 }, { "epoch": 0.65, "learning_rate": 5.576032467768465e-05, "loss": 2.2551, "step": 103288 }, { "epoch": 0.65, "learning_rate": 5.5754053420906535e-05, "loss": 2.2373, "step": 103296 }, { "epoch": 0.65, "learning_rate": 5.5747782269683126e-05, "loss": 2.2476, "step": 103304 }, { "epoch": 0.65, "learning_rate": 5.574151122417033e-05, "loss": 2.2469, "step": 103312 }, { "epoch": 0.65, "learning_rate": 5.573524028452403e-05, "loss": 2.2461, "step": 103320 }, { "epoch": 0.65, "learning_rate": 5.572896945090014e-05, "loss": 2.2349, "step": 103328 }, { "epoch": 0.65, "learning_rate": 5.572269872345457e-05, "loss": 2.2603, "step": 103336 }, { "epoch": 0.65, "learning_rate": 5.571642810234315e-05, "loss": 2.2616, "step": 103344 }, { "epoch": 0.65, "learning_rate": 5.571015758772184e-05, "loss": 2.2404, "step": 103352 }, { "epoch": 0.65, "learning_rate": 5.570388717974648e-05, "loss": 2.2586, "step": 103360 }, { "epoch": 0.65, "learning_rate": 5.5697616878572975e-05, "loss": 2.2463, "step": 103368 }, { "epoch": 0.65, "learning_rate": 5.569134668435718e-05, "loss": 2.2399, "step": 103376 }, { "epoch": 0.65, "learning_rate": 5.5685076597255014e-05, "loss": 2.2407, "step": 103384 }, { "epoch": 0.65, "learning_rate": 5.567880661742232e-05, "loss": 2.2541, "step": 103392 }, { "epoch": 0.65, "learning_rate": 5.567253674501497e-05, "loss": 2.25, "step": 103400 }, { "epoch": 0.65, "learning_rate": 5.5666266980188844e-05, "loss": 2.251, "step": 103408 }, { "epoch": 0.65, "learning_rate": 5.5659997323099814e-05, "loss": 2.2477, "step": 103416 }, { "epoch": 0.65, "learning_rate": 5.565372777390373e-05, "loss": 2.2251, "step": 103424 }, { "epoch": 0.65, "learning_rate": 5.5647458332756464e-05, "loss": 2.2566, "step": 103432 }, { "epoch": 0.65, "learning_rate": 5.564118899981388e-05, "loss": 2.2469, "step": 103440 }, { "epoch": 0.65, "learning_rate": 5.563491977523181e-05, "loss": 2.2367, "step": 103448 }, { "epoch": 0.65, "learning_rate": 5.562865065916614e-05, "loss": 2.2572, "step": 103456 }, { "epoch": 0.65, "learning_rate": 5.5622381651772696e-05, "loss": 2.2509, "step": 103464 }, { "epoch": 0.65, "learning_rate": 5.561611275320733e-05, "loss": 2.2415, "step": 103472 }, { "epoch": 0.65, "learning_rate": 5.5609843963625896e-05, "loss": 2.2641, "step": 103480 }, { "epoch": 0.65, "learning_rate": 5.560357528318424e-05, "loss": 2.2488, "step": 103488 }, { "epoch": 0.65, "learning_rate": 5.5597306712038196e-05, "loss": 2.2365, "step": 103496 }, { "epoch": 0.65, "learning_rate": 5.55910382503436e-05, "loss": 2.2313, "step": 103504 }, { "epoch": 0.65, "learning_rate": 5.558476989825628e-05, "loss": 2.2469, "step": 103512 }, { "epoch": 0.65, "learning_rate": 5.55785016559321e-05, "loss": 2.2418, "step": 103520 }, { "epoch": 0.65, "learning_rate": 5.5572233523526826e-05, "loss": 2.251, "step": 103528 }, { "epoch": 0.65, "learning_rate": 5.556596550119635e-05, "loss": 2.2519, "step": 103536 }, { "epoch": 0.65, "learning_rate": 5.555969758909646e-05, "loss": 2.2465, "step": 103544 }, { "epoch": 0.65, "learning_rate": 5.5553429787383005e-05, "loss": 2.2472, "step": 103552 }, { "epoch": 0.65, "learning_rate": 5.554716209621176e-05, "loss": 2.2654, "step": 103560 }, { "epoch": 0.65, "learning_rate": 5.554089451573856e-05, "loss": 2.2372, "step": 103568 }, { "epoch": 0.65, "learning_rate": 5.553462704611927e-05, "loss": 2.2538, "step": 103576 }, { "epoch": 0.65, "learning_rate": 5.55283596875096e-05, "loss": 2.254, "step": 103584 }, { "epoch": 0.65, "learning_rate": 5.552209244006543e-05, "loss": 2.2566, "step": 103592 }, { "epoch": 0.65, "learning_rate": 5.551582530394255e-05, "loss": 2.2547, "step": 103600 }, { "epoch": 0.65, "learning_rate": 5.550955827929675e-05, "loss": 2.2407, "step": 103608 }, { "epoch": 0.65, "learning_rate": 5.550329136628383e-05, "loss": 2.248, "step": 103616 }, { "epoch": 0.65, "learning_rate": 5.549702456505959e-05, "loss": 2.2591, "step": 103624 }, { "epoch": 0.65, "learning_rate": 5.549075787577984e-05, "loss": 2.2528, "step": 103632 }, { "epoch": 0.65, "learning_rate": 5.548449129860034e-05, "loss": 2.2419, "step": 103640 }, { "epoch": 0.65, "learning_rate": 5.54782248336769e-05, "loss": 2.2545, "step": 103648 }, { "epoch": 0.65, "learning_rate": 5.54719584811653e-05, "loss": 2.2364, "step": 103656 }, { "epoch": 0.65, "learning_rate": 5.5465692241221314e-05, "loss": 2.2477, "step": 103664 }, { "epoch": 0.65, "learning_rate": 5.5459426114000725e-05, "loss": 2.2575, "step": 103672 }, { "epoch": 0.65, "learning_rate": 5.5453160099659305e-05, "loss": 2.246, "step": 103680 }, { "epoch": 0.65, "learning_rate": 5.544689419835287e-05, "loss": 2.2514, "step": 103688 }, { "epoch": 0.65, "learning_rate": 5.5440628410237114e-05, "loss": 2.2352, "step": 103696 }, { "epoch": 0.65, "learning_rate": 5.543436273546787e-05, "loss": 2.2669, "step": 103704 }, { "epoch": 0.65, "learning_rate": 5.542809717420089e-05, "loss": 2.256, "step": 103712 }, { "epoch": 0.65, "learning_rate": 5.542183172659191e-05, "loss": 2.258, "step": 103720 }, { "epoch": 0.65, "learning_rate": 5.54155663927967e-05, "loss": 2.249, "step": 103728 }, { "epoch": 0.65, "learning_rate": 5.5409301172971054e-05, "loss": 2.2605, "step": 103736 }, { "epoch": 0.65, "learning_rate": 5.540303606727066e-05, "loss": 2.2399, "step": 103744 }, { "epoch": 0.65, "learning_rate": 5.539677107585133e-05, "loss": 2.25, "step": 103752 }, { "epoch": 0.65, "learning_rate": 5.5390506198868775e-05, "loss": 2.2376, "step": 103760 }, { "epoch": 0.65, "learning_rate": 5.538424143647878e-05, "loss": 2.2566, "step": 103768 }, { "epoch": 0.65, "learning_rate": 5.5377976788837025e-05, "loss": 2.2488, "step": 103776 }, { "epoch": 0.65, "learning_rate": 5.53717122560993e-05, "loss": 2.2668, "step": 103784 }, { "epoch": 0.65, "learning_rate": 5.5365447838421325e-05, "loss": 2.2556, "step": 103792 }, { "epoch": 0.65, "learning_rate": 5.5359183535958834e-05, "loss": 2.2515, "step": 103800 }, { "epoch": 0.65, "learning_rate": 5.535291934886757e-05, "loss": 2.2629, "step": 103808 }, { "epoch": 0.65, "learning_rate": 5.534665527730324e-05, "loss": 2.2464, "step": 103816 }, { "epoch": 0.65, "learning_rate": 5.5340391321421605e-05, "loss": 2.2407, "step": 103824 }, { "epoch": 0.65, "learning_rate": 5.533412748137834e-05, "loss": 2.2585, "step": 103832 }, { "epoch": 0.65, "learning_rate": 5.53278637573292e-05, "loss": 2.2475, "step": 103840 }, { "epoch": 0.65, "learning_rate": 5.5321600149429896e-05, "loss": 2.2348, "step": 103848 }, { "epoch": 0.65, "learning_rate": 5.5315336657836125e-05, "loss": 2.2359, "step": 103856 }, { "epoch": 0.65, "learning_rate": 5.530907328270362e-05, "loss": 2.2516, "step": 103864 }, { "epoch": 0.65, "learning_rate": 5.530281002418808e-05, "loss": 2.2438, "step": 103872 }, { "epoch": 0.65, "learning_rate": 5.5296546882445214e-05, "loss": 2.2433, "step": 103880 }, { "epoch": 0.65, "learning_rate": 5.52902838576307e-05, "loss": 2.248, "step": 103888 }, { "epoch": 0.65, "learning_rate": 5.528402094990026e-05, "loss": 2.2609, "step": 103896 }, { "epoch": 0.65, "learning_rate": 5.527775815940961e-05, "loss": 2.2357, "step": 103904 }, { "epoch": 0.65, "learning_rate": 5.5271495486314406e-05, "loss": 2.2576, "step": 103912 }, { "epoch": 0.65, "learning_rate": 5.526523293077035e-05, "loss": 2.2473, "step": 103920 }, { "epoch": 0.65, "learning_rate": 5.525897049293316e-05, "loss": 2.2498, "step": 103928 }, { "epoch": 0.65, "learning_rate": 5.5252708172958465e-05, "loss": 2.246, "step": 103936 }, { "epoch": 0.65, "learning_rate": 5.524644597100199e-05, "loss": 2.2348, "step": 103944 }, { "epoch": 0.65, "learning_rate": 5.524018388721942e-05, "loss": 2.2601, "step": 103952 }, { "epoch": 0.65, "learning_rate": 5.5233921921766384e-05, "loss": 2.2678, "step": 103960 }, { "epoch": 0.65, "learning_rate": 5.522766007479859e-05, "loss": 2.2414, "step": 103968 }, { "epoch": 0.65, "learning_rate": 5.5221398346471706e-05, "loss": 2.2467, "step": 103976 }, { "epoch": 0.65, "learning_rate": 5.521513673694141e-05, "loss": 2.2393, "step": 103984 }, { "epoch": 0.65, "learning_rate": 5.520887524636333e-05, "loss": 2.2432, "step": 103992 }, { "epoch": 0.65, "learning_rate": 5.520261387489316e-05, "loss": 2.2404, "step": 104000 }, { "epoch": 0.65, "learning_rate": 5.5196352622686555e-05, "loss": 2.247, "step": 104008 }, { "epoch": 0.65, "learning_rate": 5.519009148989915e-05, "loss": 2.2417, "step": 104016 }, { "epoch": 0.65, "learning_rate": 5.51838304766866e-05, "loss": 2.2384, "step": 104024 }, { "epoch": 0.65, "learning_rate": 5.5177569583204566e-05, "loss": 2.2349, "step": 104032 }, { "epoch": 0.65, "learning_rate": 5.517130880960872e-05, "loss": 2.2426, "step": 104040 }, { "epoch": 0.65, "learning_rate": 5.5165048156054656e-05, "loss": 2.2473, "step": 104048 }, { "epoch": 0.65, "learning_rate": 5.515878762269805e-05, "loss": 2.2466, "step": 104056 }, { "epoch": 0.65, "learning_rate": 5.5152527209694524e-05, "loss": 2.234, "step": 104064 }, { "epoch": 0.65, "learning_rate": 5.5146266917199704e-05, "loss": 2.2166, "step": 104072 }, { "epoch": 0.65, "learning_rate": 5.5140006745369255e-05, "loss": 2.236, "step": 104080 }, { "epoch": 0.65, "learning_rate": 5.5133746694358765e-05, "loss": 2.2457, "step": 104088 }, { "epoch": 0.65, "learning_rate": 5.5127486764323885e-05, "loss": 2.2367, "step": 104096 }, { "epoch": 0.65, "learning_rate": 5.5121226955420226e-05, "loss": 2.246, "step": 104104 }, { "epoch": 0.65, "learning_rate": 5.5114967267803405e-05, "loss": 2.227, "step": 104112 }, { "epoch": 0.65, "learning_rate": 5.510870770162906e-05, "loss": 2.2365, "step": 104120 }, { "epoch": 0.65, "learning_rate": 5.5102448257052796e-05, "loss": 2.234, "step": 104128 }, { "epoch": 0.65, "learning_rate": 5.509618893423021e-05, "loss": 2.2288, "step": 104136 }, { "epoch": 0.65, "learning_rate": 5.5089929733316906e-05, "loss": 2.2461, "step": 104144 }, { "epoch": 0.65, "learning_rate": 5.508367065446851e-05, "loss": 2.2438, "step": 104152 }, { "epoch": 0.65, "learning_rate": 5.507741169784062e-05, "loss": 2.2208, "step": 104160 }, { "epoch": 0.65, "learning_rate": 5.5071152863588814e-05, "loss": 2.2322, "step": 104168 }, { "epoch": 0.65, "learning_rate": 5.50648941518687e-05, "loss": 2.2321, "step": 104176 }, { "epoch": 0.65, "learning_rate": 5.505863556283588e-05, "loss": 2.2469, "step": 104184 }, { "epoch": 0.65, "learning_rate": 5.505237709664592e-05, "loss": 2.2512, "step": 104192 }, { "epoch": 0.65, "learning_rate": 5.504611875345446e-05, "loss": 2.246, "step": 104200 }, { "epoch": 0.65, "learning_rate": 5.503986053341701e-05, "loss": 2.2477, "step": 104208 }, { "epoch": 0.65, "learning_rate": 5.503360243668918e-05, "loss": 2.2397, "step": 104216 }, { "epoch": 0.65, "learning_rate": 5.502734446342657e-05, "loss": 2.2507, "step": 104224 }, { "epoch": 0.65, "learning_rate": 5.5021086613784735e-05, "loss": 2.2496, "step": 104232 }, { "epoch": 0.65, "learning_rate": 5.5014828887919225e-05, "loss": 2.2523, "step": 104240 }, { "epoch": 0.65, "learning_rate": 5.500857128598562e-05, "loss": 2.2437, "step": 104248 }, { "epoch": 0.65, "learning_rate": 5.500231380813954e-05, "loss": 2.2521, "step": 104256 }, { "epoch": 0.65, "learning_rate": 5.499605645453646e-05, "loss": 2.2364, "step": 104264 }, { "epoch": 0.65, "learning_rate": 5.4989799225331984e-05, "loss": 2.2305, "step": 104272 }, { "epoch": 0.65, "learning_rate": 5.498354212068168e-05, "loss": 2.2442, "step": 104280 }, { "epoch": 0.65, "learning_rate": 5.4977285140741055e-05, "loss": 2.2387, "step": 104288 }, { "epoch": 0.65, "learning_rate": 5.497102828566569e-05, "loss": 2.239, "step": 104296 }, { "epoch": 0.65, "learning_rate": 5.4964771555611147e-05, "loss": 2.2566, "step": 104304 }, { "epoch": 0.65, "learning_rate": 5.4958514950732945e-05, "loss": 2.2321, "step": 104312 }, { "epoch": 0.65, "learning_rate": 5.495225847118661e-05, "loss": 2.2455, "step": 104320 }, { "epoch": 0.65, "learning_rate": 5.494600211712769e-05, "loss": 2.2514, "step": 104328 }, { "epoch": 0.65, "learning_rate": 5.493974588871175e-05, "loss": 2.2365, "step": 104336 }, { "epoch": 0.65, "learning_rate": 5.4933489786094275e-05, "loss": 2.2602, "step": 104344 }, { "epoch": 0.65, "learning_rate": 5.492723380943081e-05, "loss": 2.2469, "step": 104352 }, { "epoch": 0.65, "learning_rate": 5.492097795887692e-05, "loss": 2.2431, "step": 104360 }, { "epoch": 0.65, "learning_rate": 5.491472223458804e-05, "loss": 2.2432, "step": 104368 }, { "epoch": 0.65, "learning_rate": 5.490846663671976e-05, "loss": 2.2449, "step": 104376 }, { "epoch": 0.65, "learning_rate": 5.4902211165427555e-05, "loss": 2.2294, "step": 104384 }, { "epoch": 0.65, "learning_rate": 5.4895955820866976e-05, "loss": 2.2472, "step": 104392 }, { "epoch": 0.65, "learning_rate": 5.4889700603193484e-05, "loss": 2.25, "step": 104400 }, { "epoch": 0.65, "learning_rate": 5.4883445512562615e-05, "loss": 2.2443, "step": 104408 }, { "epoch": 0.65, "learning_rate": 5.4877190549129884e-05, "loss": 2.257, "step": 104416 }, { "epoch": 0.65, "learning_rate": 5.487093571305075e-05, "loss": 2.2515, "step": 104424 }, { "epoch": 0.65, "learning_rate": 5.486468100448072e-05, "loss": 2.2374, "step": 104432 }, { "epoch": 0.65, "learning_rate": 5.485842642357534e-05, "loss": 2.2369, "step": 104440 }, { "epoch": 0.65, "learning_rate": 5.4852171970490016e-05, "loss": 2.2392, "step": 104448 }, { "epoch": 0.65, "learning_rate": 5.48459176453803e-05, "loss": 2.2617, "step": 104456 }, { "epoch": 0.65, "learning_rate": 5.483966344840161e-05, "loss": 2.2392, "step": 104464 }, { "epoch": 0.65, "learning_rate": 5.483340937970951e-05, "loss": 2.2438, "step": 104472 }, { "epoch": 0.65, "learning_rate": 5.482715543945941e-05, "loss": 2.2423, "step": 104480 }, { "epoch": 0.65, "learning_rate": 5.48209016278068e-05, "loss": 2.2398, "step": 104488 }, { "epoch": 0.65, "learning_rate": 5.481464794490718e-05, "loss": 2.2349, "step": 104496 }, { "epoch": 0.65, "learning_rate": 5.480839439091598e-05, "loss": 2.2447, "step": 104504 }, { "epoch": 0.65, "learning_rate": 5.4802140965988666e-05, "loss": 2.2292, "step": 104512 }, { "epoch": 0.65, "learning_rate": 5.479588767028072e-05, "loss": 2.2488, "step": 104520 }, { "epoch": 0.65, "learning_rate": 5.4789634503947606e-05, "loss": 2.2427, "step": 104528 }, { "epoch": 0.65, "learning_rate": 5.4783381467144745e-05, "loss": 2.2516, "step": 104536 }, { "epoch": 0.65, "learning_rate": 5.4777128560027615e-05, "loss": 2.2349, "step": 104544 }, { "epoch": 0.65, "learning_rate": 5.477087578275165e-05, "loss": 2.2558, "step": 104552 }, { "epoch": 0.65, "learning_rate": 5.4764623135472305e-05, "loss": 2.2298, "step": 104560 }, { "epoch": 0.65, "learning_rate": 5.4758370618345e-05, "loss": 2.2464, "step": 104568 }, { "epoch": 0.65, "learning_rate": 5.475211823152522e-05, "loss": 2.2473, "step": 104576 }, { "epoch": 0.65, "learning_rate": 5.474586597516833e-05, "loss": 2.2344, "step": 104584 }, { "epoch": 0.65, "learning_rate": 5.473961384942983e-05, "loss": 2.2344, "step": 104592 }, { "epoch": 0.65, "learning_rate": 5.473336185446511e-05, "loss": 2.2445, "step": 104600 }, { "epoch": 0.65, "learning_rate": 5.4727109990429626e-05, "loss": 2.2404, "step": 104608 }, { "epoch": 0.65, "learning_rate": 5.472085825747875e-05, "loss": 2.2593, "step": 104616 }, { "epoch": 0.65, "learning_rate": 5.471460665576793e-05, "loss": 2.2631, "step": 104624 }, { "epoch": 0.65, "learning_rate": 5.470835518545261e-05, "loss": 2.2304, "step": 104632 }, { "epoch": 0.65, "learning_rate": 5.4702103846688145e-05, "loss": 2.2522, "step": 104640 }, { "epoch": 0.65, "learning_rate": 5.469585263962997e-05, "loss": 2.2466, "step": 104648 }, { "epoch": 0.65, "learning_rate": 5.4689601564433525e-05, "loss": 2.2521, "step": 104656 }, { "epoch": 0.65, "learning_rate": 5.468335062125417e-05, "loss": 2.2497, "step": 104664 }, { "epoch": 0.65, "learning_rate": 5.467709981024731e-05, "loss": 2.2399, "step": 104672 }, { "epoch": 0.65, "learning_rate": 5.467084913156833e-05, "loss": 2.2399, "step": 104680 }, { "epoch": 0.65, "learning_rate": 5.466459858537267e-05, "loss": 2.2573, "step": 104688 }, { "epoch": 0.65, "learning_rate": 5.465834817181566e-05, "loss": 2.2471, "step": 104696 }, { "epoch": 0.65, "learning_rate": 5.4652097891052724e-05, "loss": 2.2665, "step": 104704 }, { "epoch": 0.65, "learning_rate": 5.4645847743239244e-05, "loss": 2.2514, "step": 104712 }, { "epoch": 0.65, "learning_rate": 5.463959772853058e-05, "loss": 2.2545, "step": 104720 }, { "epoch": 0.65, "learning_rate": 5.4633347847082115e-05, "loss": 2.2506, "step": 104728 }, { "epoch": 0.65, "learning_rate": 5.4627098099049226e-05, "loss": 2.2514, "step": 104736 }, { "epoch": 0.65, "learning_rate": 5.462084848458729e-05, "loss": 2.2448, "step": 104744 }, { "epoch": 0.65, "learning_rate": 5.461459900385165e-05, "loss": 2.2327, "step": 104752 }, { "epoch": 0.65, "learning_rate": 5.460834965699768e-05, "loss": 2.2496, "step": 104760 }, { "epoch": 0.65, "learning_rate": 5.460210044418077e-05, "loss": 2.2401, "step": 104768 }, { "epoch": 0.65, "learning_rate": 5.459585136555623e-05, "loss": 2.2444, "step": 104776 }, { "epoch": 0.65, "learning_rate": 5.458960242127943e-05, "loss": 2.2498, "step": 104784 }, { "epoch": 0.65, "learning_rate": 5.458335361150574e-05, "loss": 2.2451, "step": 104792 }, { "epoch": 0.66, "learning_rate": 5.457710493639046e-05, "loss": 2.2471, "step": 104800 }, { "epoch": 0.66, "learning_rate": 5.457085639608897e-05, "loss": 2.2483, "step": 104808 }, { "epoch": 0.66, "learning_rate": 5.45646079907566e-05, "loss": 2.2462, "step": 104816 }, { "epoch": 0.66, "learning_rate": 5.455835972054869e-05, "loss": 2.2301, "step": 104824 }, { "epoch": 0.66, "learning_rate": 5.455211158562055e-05, "loss": 2.2361, "step": 104832 }, { "epoch": 0.66, "learning_rate": 5.454586358612754e-05, "loss": 2.2337, "step": 104840 }, { "epoch": 0.66, "learning_rate": 5.453961572222499e-05, "loss": 2.2604, "step": 104848 }, { "epoch": 0.66, "learning_rate": 5.453336799406818e-05, "loss": 2.239, "step": 104856 }, { "epoch": 0.66, "learning_rate": 5.452712040181247e-05, "loss": 2.25, "step": 104864 }, { "epoch": 0.66, "learning_rate": 5.452087294561315e-05, "loss": 2.2485, "step": 104872 }, { "epoch": 0.66, "learning_rate": 5.451462562562555e-05, "loss": 2.2449, "step": 104880 }, { "epoch": 0.66, "learning_rate": 5.450837844200497e-05, "loss": 2.2545, "step": 104888 }, { "epoch": 0.66, "learning_rate": 5.450213139490672e-05, "loss": 2.2442, "step": 104896 }, { "epoch": 0.66, "learning_rate": 5.4495884484486106e-05, "loss": 2.2469, "step": 104904 }, { "epoch": 0.66, "learning_rate": 5.448963771089841e-05, "loss": 2.2428, "step": 104912 }, { "epoch": 0.66, "learning_rate": 5.448339107429894e-05, "loss": 2.2457, "step": 104920 }, { "epoch": 0.66, "learning_rate": 5.447714457484298e-05, "loss": 2.2471, "step": 104928 }, { "epoch": 0.66, "learning_rate": 5.447089821268585e-05, "loss": 2.2417, "step": 104936 }, { "epoch": 0.66, "learning_rate": 5.446465198798279e-05, "loss": 2.2436, "step": 104944 }, { "epoch": 0.66, "learning_rate": 5.445840590088911e-05, "loss": 2.2513, "step": 104952 }, { "epoch": 0.66, "learning_rate": 5.445215995156008e-05, "loss": 2.2393, "step": 104960 }, { "epoch": 0.66, "learning_rate": 5.4445914140150964e-05, "loss": 2.2443, "step": 104968 }, { "epoch": 0.66, "learning_rate": 5.4439668466817075e-05, "loss": 2.2382, "step": 104976 }, { "epoch": 0.66, "learning_rate": 5.443342293171363e-05, "loss": 2.2456, "step": 104984 }, { "epoch": 0.66, "learning_rate": 5.442717753499592e-05, "loss": 2.247, "step": 104992 }, { "epoch": 0.66, "learning_rate": 5.442093227681919e-05, "loss": 2.2372, "step": 105000 }, { "epoch": 0.66, "learning_rate": 5.4414687157338725e-05, "loss": 2.2485, "step": 105008 }, { "epoch": 0.66, "learning_rate": 5.4408442176709776e-05, "loss": 2.2512, "step": 105016 }, { "epoch": 0.66, "learning_rate": 5.440219733508756e-05, "loss": 2.2399, "step": 105024 }, { "epoch": 0.66, "learning_rate": 5.439595263262735e-05, "loss": 2.2545, "step": 105032 }, { "epoch": 0.66, "learning_rate": 5.4389708069484404e-05, "loss": 2.2643, "step": 105040 }, { "epoch": 0.66, "learning_rate": 5.4383463645813925e-05, "loss": 2.2457, "step": 105048 }, { "epoch": 0.66, "learning_rate": 5.437721936177116e-05, "loss": 2.2547, "step": 105056 }, { "epoch": 0.66, "learning_rate": 5.4370975217511376e-05, "loss": 2.2493, "step": 105064 }, { "epoch": 0.66, "learning_rate": 5.4364731213189766e-05, "loss": 2.263, "step": 105072 }, { "epoch": 0.66, "learning_rate": 5.4358487348961585e-05, "loss": 2.2511, "step": 105080 }, { "epoch": 0.66, "learning_rate": 5.4352243624982015e-05, "loss": 2.2559, "step": 105088 }, { "epoch": 0.66, "learning_rate": 5.434600004140633e-05, "loss": 2.2404, "step": 105096 }, { "epoch": 0.66, "learning_rate": 5.43397565983897e-05, "loss": 2.2427, "step": 105104 }, { "epoch": 0.66, "learning_rate": 5.433351329608736e-05, "loss": 2.2496, "step": 105112 }, { "epoch": 0.66, "learning_rate": 5.432727013465453e-05, "loss": 2.2461, "step": 105120 }, { "epoch": 0.66, "learning_rate": 5.432102711424638e-05, "loss": 2.2379, "step": 105128 }, { "epoch": 0.66, "learning_rate": 5.431478423501815e-05, "loss": 2.2447, "step": 105136 }, { "epoch": 0.66, "learning_rate": 5.430854149712501e-05, "loss": 2.2376, "step": 105144 }, { "epoch": 0.66, "learning_rate": 5.430229890072217e-05, "loss": 2.2501, "step": 105152 }, { "epoch": 0.66, "learning_rate": 5.429605644596483e-05, "loss": 2.2321, "step": 105160 }, { "epoch": 0.66, "learning_rate": 5.428981413300814e-05, "loss": 2.2438, "step": 105168 }, { "epoch": 0.66, "learning_rate": 5.4283571962007326e-05, "loss": 2.2501, "step": 105176 }, { "epoch": 0.66, "learning_rate": 5.427732993311756e-05, "loss": 2.2443, "step": 105184 }, { "epoch": 0.66, "learning_rate": 5.4271088046494015e-05, "loss": 2.2543, "step": 105192 }, { "epoch": 0.66, "learning_rate": 5.426484630229187e-05, "loss": 2.2552, "step": 105200 }, { "epoch": 0.66, "learning_rate": 5.425860470066626e-05, "loss": 2.2466, "step": 105208 }, { "epoch": 0.66, "learning_rate": 5.425236324177241e-05, "loss": 2.2543, "step": 105216 }, { "epoch": 0.66, "learning_rate": 5.424612192576544e-05, "loss": 2.2431, "step": 105224 }, { "epoch": 0.66, "learning_rate": 5.423988075280053e-05, "loss": 2.2619, "step": 105232 }, { "epoch": 0.66, "learning_rate": 5.423363972303283e-05, "loss": 2.2311, "step": 105240 }, { "epoch": 0.66, "learning_rate": 5.4227398836617494e-05, "loss": 2.2697, "step": 105248 }, { "epoch": 0.66, "learning_rate": 5.422115809370967e-05, "loss": 2.2258, "step": 105256 }, { "epoch": 0.66, "learning_rate": 5.4214917494464504e-05, "loss": 2.2576, "step": 105264 }, { "epoch": 0.66, "learning_rate": 5.420867703903714e-05, "loss": 2.2407, "step": 105272 }, { "epoch": 0.66, "learning_rate": 5.4202436727582714e-05, "loss": 2.2596, "step": 105280 }, { "epoch": 0.66, "learning_rate": 5.419619656025636e-05, "loss": 2.2547, "step": 105288 }, { "epoch": 0.66, "learning_rate": 5.4189956537213206e-05, "loss": 2.2566, "step": 105296 }, { "epoch": 0.66, "learning_rate": 5.418371665860837e-05, "loss": 2.2602, "step": 105304 }, { "epoch": 0.66, "learning_rate": 5.417747692459702e-05, "loss": 2.2356, "step": 105312 }, { "epoch": 0.66, "learning_rate": 5.417123733533425e-05, "loss": 2.2486, "step": 105320 }, { "epoch": 0.66, "learning_rate": 5.416499789097515e-05, "loss": 2.2426, "step": 105328 }, { "epoch": 0.66, "learning_rate": 5.4158758591674874e-05, "loss": 2.2417, "step": 105336 }, { "epoch": 0.66, "learning_rate": 5.41525194375885e-05, "loss": 2.2367, "step": 105344 }, { "epoch": 0.66, "learning_rate": 5.414628042887116e-05, "loss": 2.2536, "step": 105352 }, { "epoch": 0.66, "learning_rate": 5.4140041565677935e-05, "loss": 2.2419, "step": 105360 }, { "epoch": 0.66, "learning_rate": 5.413380284816395e-05, "loss": 2.2283, "step": 105368 }, { "epoch": 0.66, "learning_rate": 5.412756427648427e-05, "loss": 2.2505, "step": 105376 }, { "epoch": 0.66, "learning_rate": 5.412132585079401e-05, "loss": 2.2644, "step": 105384 }, { "epoch": 0.66, "learning_rate": 5.411508757124826e-05, "loss": 2.2461, "step": 105392 }, { "epoch": 0.66, "learning_rate": 5.410884943800207e-05, "loss": 2.246, "step": 105400 }, { "epoch": 0.66, "learning_rate": 5.410261145121054e-05, "loss": 2.2343, "step": 105408 }, { "epoch": 0.66, "learning_rate": 5.4096373611028784e-05, "loss": 2.2463, "step": 105416 }, { "epoch": 0.66, "learning_rate": 5.4090135917611806e-05, "loss": 2.2541, "step": 105424 }, { "epoch": 0.66, "learning_rate": 5.408389837111474e-05, "loss": 2.2601, "step": 105432 }, { "epoch": 0.66, "learning_rate": 5.40776609716926e-05, "loss": 2.2384, "step": 105440 }, { "epoch": 0.66, "learning_rate": 5.4071423719500504e-05, "loss": 2.2498, "step": 105448 }, { "epoch": 0.66, "learning_rate": 5.406518661469344e-05, "loss": 2.2519, "step": 105456 }, { "epoch": 0.66, "learning_rate": 5.4058949657426525e-05, "loss": 2.2585, "step": 105464 }, { "epoch": 0.66, "learning_rate": 5.4052712847854804e-05, "loss": 2.2452, "step": 105472 }, { "epoch": 0.66, "learning_rate": 5.404647618613329e-05, "loss": 2.234, "step": 105480 }, { "epoch": 0.66, "learning_rate": 5.404023967241703e-05, "loss": 2.2379, "step": 105488 }, { "epoch": 0.66, "learning_rate": 5.403400330686112e-05, "loss": 2.2528, "step": 105496 }, { "epoch": 0.66, "learning_rate": 5.402776708962052e-05, "loss": 2.2472, "step": 105504 }, { "epoch": 0.66, "learning_rate": 5.402153102085032e-05, "loss": 2.2451, "step": 105512 }, { "epoch": 0.66, "learning_rate": 5.401529510070551e-05, "loss": 2.2503, "step": 105520 }, { "epoch": 0.66, "learning_rate": 5.4009059329341174e-05, "loss": 2.2425, "step": 105528 }, { "epoch": 0.66, "learning_rate": 5.4002823706912265e-05, "loss": 2.25, "step": 105536 }, { "epoch": 0.66, "learning_rate": 5.399658823357383e-05, "loss": 2.2604, "step": 105544 }, { "epoch": 0.66, "learning_rate": 5.3990352909480905e-05, "loss": 2.2649, "step": 105552 }, { "epoch": 0.66, "learning_rate": 5.398411773478846e-05, "loss": 2.2457, "step": 105560 }, { "epoch": 0.66, "learning_rate": 5.3977882709651536e-05, "loss": 2.2493, "step": 105568 }, { "epoch": 0.66, "learning_rate": 5.3971647834225117e-05, "loss": 2.2547, "step": 105576 }, { "epoch": 0.66, "learning_rate": 5.396541310866421e-05, "loss": 2.2405, "step": 105584 }, { "epoch": 0.66, "learning_rate": 5.3959178533123814e-05, "loss": 2.235, "step": 105592 }, { "epoch": 0.66, "learning_rate": 5.3952944107758905e-05, "loss": 2.2443, "step": 105600 }, { "epoch": 0.66, "learning_rate": 5.3946709832724495e-05, "loss": 2.2507, "step": 105608 }, { "epoch": 0.66, "learning_rate": 5.3940475708175565e-05, "loss": 2.2622, "step": 105616 }, { "epoch": 0.66, "learning_rate": 5.393424173426708e-05, "loss": 2.251, "step": 105624 }, { "epoch": 0.66, "learning_rate": 5.392800791115404e-05, "loss": 2.261, "step": 105632 }, { "epoch": 0.66, "learning_rate": 5.392177423899139e-05, "loss": 2.2623, "step": 105640 }, { "epoch": 0.66, "learning_rate": 5.39155407179341e-05, "loss": 2.2609, "step": 105648 }, { "epoch": 0.66, "learning_rate": 5.390930734813716e-05, "loss": 2.2545, "step": 105656 }, { "epoch": 0.66, "learning_rate": 5.3903074129755545e-05, "loss": 2.2417, "step": 105664 }, { "epoch": 0.66, "learning_rate": 5.389684106294417e-05, "loss": 2.2433, "step": 105672 }, { "epoch": 0.66, "learning_rate": 5.3890608147858e-05, "loss": 2.2421, "step": 105680 }, { "epoch": 0.66, "learning_rate": 5.388437538465203e-05, "loss": 2.2513, "step": 105688 }, { "epoch": 0.66, "learning_rate": 5.3878142773481156e-05, "loss": 2.2786, "step": 105696 }, { "epoch": 0.66, "learning_rate": 5.387191031450034e-05, "loss": 2.2598, "step": 105704 }, { "epoch": 0.66, "learning_rate": 5.3865678007864506e-05, "loss": 2.2572, "step": 105712 }, { "epoch": 0.66, "learning_rate": 5.385944585372864e-05, "loss": 2.2438, "step": 105720 }, { "epoch": 0.66, "learning_rate": 5.385321385224762e-05, "loss": 2.2429, "step": 105728 }, { "epoch": 0.66, "learning_rate": 5.384698200357638e-05, "loss": 2.2575, "step": 105736 }, { "epoch": 0.66, "learning_rate": 5.384075030786988e-05, "loss": 2.2481, "step": 105744 }, { "epoch": 0.66, "learning_rate": 5.3834518765283e-05, "loss": 2.2525, "step": 105752 }, { "epoch": 0.66, "learning_rate": 5.38282873759707e-05, "loss": 2.2427, "step": 105760 }, { "epoch": 0.66, "learning_rate": 5.382205614008785e-05, "loss": 2.2415, "step": 105768 }, { "epoch": 0.66, "learning_rate": 5.3815825057789374e-05, "loss": 2.262, "step": 105776 }, { "epoch": 0.66, "learning_rate": 5.380959412923019e-05, "loss": 2.235, "step": 105784 }, { "epoch": 0.66, "learning_rate": 5.3803363354565186e-05, "loss": 2.2395, "step": 105792 }, { "epoch": 0.66, "learning_rate": 5.3797132733949266e-05, "loss": 2.2272, "step": 105800 }, { "epoch": 0.66, "learning_rate": 5.379090226753733e-05, "loss": 2.2473, "step": 105808 }, { "epoch": 0.66, "learning_rate": 5.378467195548425e-05, "loss": 2.2453, "step": 105816 }, { "epoch": 0.66, "learning_rate": 5.377844179794492e-05, "loss": 2.2481, "step": 105824 }, { "epoch": 0.66, "learning_rate": 5.3772211795074235e-05, "loss": 2.2467, "step": 105832 }, { "epoch": 0.66, "learning_rate": 5.3765981947027045e-05, "loss": 2.2528, "step": 105840 }, { "epoch": 0.66, "learning_rate": 5.3759752253958274e-05, "loss": 2.2342, "step": 105848 }, { "epoch": 0.66, "learning_rate": 5.375352271602274e-05, "loss": 2.2593, "step": 105856 }, { "epoch": 0.66, "learning_rate": 5.374729333337532e-05, "loss": 2.2613, "step": 105864 }, { "epoch": 0.66, "learning_rate": 5.374106410617091e-05, "loss": 2.2522, "step": 105872 }, { "epoch": 0.66, "learning_rate": 5.373483503456436e-05, "loss": 2.2443, "step": 105880 }, { "epoch": 0.66, "learning_rate": 5.372860611871049e-05, "loss": 2.2659, "step": 105888 }, { "epoch": 0.66, "learning_rate": 5.3722377358764176e-05, "loss": 2.2505, "step": 105896 }, { "epoch": 0.66, "learning_rate": 5.371614875488029e-05, "loss": 2.2427, "step": 105904 }, { "epoch": 0.66, "learning_rate": 5.3709920307213626e-05, "loss": 2.2464, "step": 105912 }, { "epoch": 0.66, "learning_rate": 5.370369201591906e-05, "loss": 2.2453, "step": 105920 }, { "epoch": 0.66, "learning_rate": 5.36974638811514e-05, "loss": 2.2518, "step": 105928 }, { "epoch": 0.66, "learning_rate": 5.3691235903065526e-05, "loss": 2.2454, "step": 105936 }, { "epoch": 0.66, "learning_rate": 5.368500808181622e-05, "loss": 2.2568, "step": 105944 }, { "epoch": 0.66, "learning_rate": 5.367878041755832e-05, "loss": 2.2488, "step": 105952 }, { "epoch": 0.66, "learning_rate": 5.367255291044664e-05, "loss": 2.2361, "step": 105960 }, { "epoch": 0.66, "learning_rate": 5.3666325560636024e-05, "loss": 2.2468, "step": 105968 }, { "epoch": 0.66, "learning_rate": 5.3660098368281244e-05, "loss": 2.2579, "step": 105976 }, { "epoch": 0.66, "learning_rate": 5.3653871333537145e-05, "loss": 2.2424, "step": 105984 }, { "epoch": 0.66, "learning_rate": 5.36476444565585e-05, "loss": 2.2493, "step": 105992 }, { "epoch": 0.66, "learning_rate": 5.3641417737500146e-05, "loss": 2.2524, "step": 106000 }, { "epoch": 0.66, "learning_rate": 5.3635191176516855e-05, "loss": 2.2367, "step": 106008 }, { "epoch": 0.66, "learning_rate": 5.3628964773763424e-05, "loss": 2.2207, "step": 106016 }, { "epoch": 0.66, "learning_rate": 5.362273852939463e-05, "loss": 2.2342, "step": 106024 }, { "epoch": 0.66, "learning_rate": 5.361651244356529e-05, "loss": 2.2267, "step": 106032 }, { "epoch": 0.66, "learning_rate": 5.3610286516430166e-05, "loss": 2.2497, "step": 106040 }, { "epoch": 0.66, "learning_rate": 5.360406074814403e-05, "loss": 2.2328, "step": 106048 }, { "epoch": 0.66, "learning_rate": 5.359783513886165e-05, "loss": 2.2402, "step": 106056 }, { "epoch": 0.66, "learning_rate": 5.359160968873782e-05, "loss": 2.2471, "step": 106064 }, { "epoch": 0.66, "learning_rate": 5.358538439792731e-05, "loss": 2.2417, "step": 106072 }, { "epoch": 0.66, "learning_rate": 5.3579159266584834e-05, "loss": 2.252, "step": 106080 }, { "epoch": 0.66, "learning_rate": 5.357293429486518e-05, "loss": 2.2416, "step": 106088 }, { "epoch": 0.66, "learning_rate": 5.356670948292313e-05, "loss": 2.2405, "step": 106096 }, { "epoch": 0.66, "learning_rate": 5.356048483091338e-05, "loss": 2.2501, "step": 106104 }, { "epoch": 0.66, "learning_rate": 5.355426033899069e-05, "loss": 2.2331, "step": 106112 }, { "epoch": 0.66, "learning_rate": 5.354803600730984e-05, "loss": 2.2477, "step": 106120 }, { "epoch": 0.66, "learning_rate": 5.354181183602552e-05, "loss": 2.2532, "step": 106128 }, { "epoch": 0.66, "learning_rate": 5.3535587825292485e-05, "loss": 2.2284, "step": 106136 }, { "epoch": 0.66, "learning_rate": 5.352936397526544e-05, "loss": 2.2576, "step": 106144 }, { "epoch": 0.66, "learning_rate": 5.352314028609918e-05, "loss": 2.2397, "step": 106152 }, { "epoch": 0.66, "learning_rate": 5.3516916757948364e-05, "loss": 2.2287, "step": 106160 }, { "epoch": 0.66, "learning_rate": 5.3510693390967705e-05, "loss": 2.258, "step": 106168 }, { "epoch": 0.66, "learning_rate": 5.350447018531195e-05, "loss": 2.2459, "step": 106176 }, { "epoch": 0.66, "learning_rate": 5.349824714113579e-05, "loss": 2.2329, "step": 106184 }, { "epoch": 0.66, "learning_rate": 5.349202425859394e-05, "loss": 2.2466, "step": 106192 }, { "epoch": 0.66, "learning_rate": 5.3485801537841105e-05, "loss": 2.2569, "step": 106200 }, { "epoch": 0.66, "learning_rate": 5.3479578979031955e-05, "loss": 2.2581, "step": 106208 }, { "epoch": 0.66, "learning_rate": 5.347335658232121e-05, "loss": 2.2484, "step": 106216 }, { "epoch": 0.66, "learning_rate": 5.3467134347863544e-05, "loss": 2.2539, "step": 106224 }, { "epoch": 0.66, "learning_rate": 5.346091227581368e-05, "loss": 2.2275, "step": 106232 }, { "epoch": 0.66, "learning_rate": 5.3454690366326247e-05, "loss": 2.2476, "step": 106240 }, { "epoch": 0.66, "learning_rate": 5.344846861955595e-05, "loss": 2.2551, "step": 106248 }, { "epoch": 0.66, "learning_rate": 5.3442247035657475e-05, "loss": 2.2348, "step": 106256 }, { "epoch": 0.66, "learning_rate": 5.343602561478545e-05, "loss": 2.2449, "step": 106264 }, { "epoch": 0.66, "learning_rate": 5.342980435709457e-05, "loss": 2.2469, "step": 106272 }, { "epoch": 0.66, "learning_rate": 5.3423583262739484e-05, "loss": 2.2382, "step": 106280 }, { "epoch": 0.66, "learning_rate": 5.3417362331874885e-05, "loss": 2.2528, "step": 106288 }, { "epoch": 0.66, "learning_rate": 5.3411141564655364e-05, "loss": 2.2409, "step": 106296 }, { "epoch": 0.66, "learning_rate": 5.340492096123562e-05, "loss": 2.2628, "step": 106304 }, { "epoch": 0.66, "learning_rate": 5.33987005217703e-05, "loss": 2.2483, "step": 106312 }, { "epoch": 0.66, "learning_rate": 5.3392480246413986e-05, "loss": 2.2388, "step": 106320 }, { "epoch": 0.66, "learning_rate": 5.338626013532138e-05, "loss": 2.2499, "step": 106328 }, { "epoch": 0.66, "learning_rate": 5.338004018864708e-05, "loss": 2.2473, "step": 106336 }, { "epoch": 0.66, "learning_rate": 5.337382040654573e-05, "loss": 2.2528, "step": 106344 }, { "epoch": 0.66, "learning_rate": 5.336760078917194e-05, "loss": 2.2326, "step": 106352 }, { "epoch": 0.66, "learning_rate": 5.336138133668034e-05, "loss": 2.2514, "step": 106360 }, { "epoch": 0.66, "learning_rate": 5.3355162049225546e-05, "loss": 2.2477, "step": 106368 }, { "epoch": 0.66, "learning_rate": 5.3348942926962176e-05, "loss": 2.2452, "step": 106376 }, { "epoch": 0.66, "learning_rate": 5.334272397004483e-05, "loss": 2.2355, "step": 106384 }, { "epoch": 0.66, "learning_rate": 5.33365051786281e-05, "loss": 2.2374, "step": 106392 }, { "epoch": 0.67, "learning_rate": 5.3330286552866606e-05, "loss": 2.2272, "step": 106400 }, { "epoch": 0.67, "learning_rate": 5.332406809291494e-05, "loss": 2.2386, "step": 106408 }, { "epoch": 0.67, "learning_rate": 5.331784979892769e-05, "loss": 2.2478, "step": 106416 }, { "epoch": 0.67, "learning_rate": 5.331163167105944e-05, "loss": 2.2541, "step": 106424 }, { "epoch": 0.67, "learning_rate": 5.330541370946478e-05, "loss": 2.2379, "step": 106432 }, { "epoch": 0.67, "learning_rate": 5.3299195914298286e-05, "loss": 2.2394, "step": 106440 }, { "epoch": 0.67, "learning_rate": 5.329297828571453e-05, "loss": 2.2435, "step": 106448 }, { "epoch": 0.67, "learning_rate": 5.328676082386809e-05, "loss": 2.2293, "step": 106456 }, { "epoch": 0.67, "learning_rate": 5.328054352891352e-05, "loss": 2.2555, "step": 106464 }, { "epoch": 0.67, "learning_rate": 5.327432640100541e-05, "loss": 2.241, "step": 106472 }, { "epoch": 0.67, "learning_rate": 5.3268109440298274e-05, "loss": 2.2575, "step": 106480 }, { "epoch": 0.67, "learning_rate": 5.326189264694672e-05, "loss": 2.2305, "step": 106488 }, { "epoch": 0.67, "learning_rate": 5.325567602110525e-05, "loss": 2.2451, "step": 106496 }, { "epoch": 0.67, "learning_rate": 5.324945956292846e-05, "loss": 2.236, "step": 106504 }, { "epoch": 0.67, "learning_rate": 5.324324327257082e-05, "loss": 2.2498, "step": 106512 }, { "epoch": 0.67, "learning_rate": 5.323702715018694e-05, "loss": 2.2475, "step": 106520 }, { "epoch": 0.67, "learning_rate": 5.323081119593133e-05, "loss": 2.2482, "step": 106528 }, { "epoch": 0.67, "learning_rate": 5.3224595409958497e-05, "loss": 2.25, "step": 106536 }, { "epoch": 0.67, "learning_rate": 5.3218379792422966e-05, "loss": 2.2473, "step": 106544 }, { "epoch": 0.67, "learning_rate": 5.321216434347931e-05, "loss": 2.2473, "step": 106552 }, { "epoch": 0.67, "learning_rate": 5.3205949063282e-05, "loss": 2.2631, "step": 106560 }, { "epoch": 0.67, "learning_rate": 5.319973395198554e-05, "loss": 2.2586, "step": 106568 }, { "epoch": 0.67, "learning_rate": 5.3193519009744474e-05, "loss": 2.2473, "step": 106576 }, { "epoch": 0.67, "learning_rate": 5.318730423671329e-05, "loss": 2.2635, "step": 106584 }, { "epoch": 0.67, "learning_rate": 5.318108963304648e-05, "loss": 2.2503, "step": 106592 }, { "epoch": 0.67, "learning_rate": 5.3174875198898545e-05, "loss": 2.2422, "step": 106600 }, { "epoch": 0.67, "learning_rate": 5.316866093442399e-05, "loss": 2.2463, "step": 106608 }, { "epoch": 0.67, "learning_rate": 5.316244683977727e-05, "loss": 2.2246, "step": 106616 }, { "epoch": 0.67, "learning_rate": 5.3156232915112894e-05, "loss": 2.2385, "step": 106624 }, { "epoch": 0.67, "learning_rate": 5.3150019160585354e-05, "loss": 2.2451, "step": 106632 }, { "epoch": 0.67, "learning_rate": 5.314380557634909e-05, "loss": 2.2407, "step": 106640 }, { "epoch": 0.67, "learning_rate": 5.3137592162558595e-05, "loss": 2.2343, "step": 106648 }, { "epoch": 0.67, "learning_rate": 5.3131378919368325e-05, "loss": 2.2464, "step": 106656 }, { "epoch": 0.67, "learning_rate": 5.312516584693275e-05, "loss": 2.2498, "step": 106664 }, { "epoch": 0.67, "learning_rate": 5.3118952945406316e-05, "loss": 2.2477, "step": 106672 }, { "epoch": 0.67, "learning_rate": 5.311274021494348e-05, "loss": 2.2503, "step": 106680 }, { "epoch": 0.67, "learning_rate": 5.3106527655698726e-05, "loss": 2.2436, "step": 106688 }, { "epoch": 0.67, "learning_rate": 5.310031526782644e-05, "loss": 2.2494, "step": 106696 }, { "epoch": 0.67, "learning_rate": 5.309410305148108e-05, "loss": 2.2491, "step": 106704 }, { "epoch": 0.67, "learning_rate": 5.308789100681712e-05, "loss": 2.2363, "step": 106712 }, { "epoch": 0.67, "learning_rate": 5.308167913398896e-05, "loss": 2.2387, "step": 106720 }, { "epoch": 0.67, "learning_rate": 5.3075467433151026e-05, "loss": 2.2503, "step": 106728 }, { "epoch": 0.67, "learning_rate": 5.306925590445775e-05, "loss": 2.2328, "step": 106736 }, { "epoch": 0.67, "learning_rate": 5.306304454806356e-05, "loss": 2.2539, "step": 106744 }, { "epoch": 0.67, "learning_rate": 5.3056833364122835e-05, "loss": 2.2502, "step": 106752 }, { "epoch": 0.67, "learning_rate": 5.305062235279004e-05, "loss": 2.249, "step": 106760 }, { "epoch": 0.67, "learning_rate": 5.304441151421952e-05, "loss": 2.2498, "step": 106768 }, { "epoch": 0.67, "learning_rate": 5.303820084856574e-05, "loss": 2.2412, "step": 106776 }, { "epoch": 0.67, "learning_rate": 5.3031990355983054e-05, "loss": 2.2648, "step": 106784 }, { "epoch": 0.67, "learning_rate": 5.302578003662588e-05, "loss": 2.2543, "step": 106792 }, { "epoch": 0.67, "learning_rate": 5.30195698906486e-05, "loss": 2.2375, "step": 106800 }, { "epoch": 0.67, "learning_rate": 5.301335991820557e-05, "loss": 2.2364, "step": 106808 }, { "epoch": 0.67, "learning_rate": 5.300715011945121e-05, "loss": 2.2442, "step": 106816 }, { "epoch": 0.67, "learning_rate": 5.3000940494539894e-05, "loss": 2.2537, "step": 106824 }, { "epoch": 0.67, "learning_rate": 5.299473104362598e-05, "loss": 2.2396, "step": 106832 }, { "epoch": 0.67, "learning_rate": 5.298852176686382e-05, "loss": 2.2425, "step": 106840 }, { "epoch": 0.67, "learning_rate": 5.298231266440781e-05, "loss": 2.2447, "step": 106848 }, { "epoch": 0.67, "learning_rate": 5.29761037364123e-05, "loss": 2.239, "step": 106856 }, { "epoch": 0.67, "learning_rate": 5.296989498303162e-05, "loss": 2.2459, "step": 106864 }, { "epoch": 0.67, "learning_rate": 5.2963686404420154e-05, "loss": 2.228, "step": 106872 }, { "epoch": 0.67, "learning_rate": 5.295747800073223e-05, "loss": 2.2536, "step": 106880 }, { "epoch": 0.67, "learning_rate": 5.295126977212219e-05, "loss": 2.2423, "step": 106888 }, { "epoch": 0.67, "learning_rate": 5.294506171874438e-05, "loss": 2.2481, "step": 106896 }, { "epoch": 0.67, "learning_rate": 5.293885384075315e-05, "loss": 2.2603, "step": 106904 }, { "epoch": 0.67, "learning_rate": 5.293264613830277e-05, "loss": 2.2475, "step": 106912 }, { "epoch": 0.67, "learning_rate": 5.29264386115476e-05, "loss": 2.2318, "step": 106920 }, { "epoch": 0.67, "learning_rate": 5.292023126064196e-05, "loss": 2.2469, "step": 106928 }, { "epoch": 0.67, "learning_rate": 5.29140240857402e-05, "loss": 2.2387, "step": 106936 }, { "epoch": 0.67, "learning_rate": 5.290781708699657e-05, "loss": 2.2545, "step": 106944 }, { "epoch": 0.67, "learning_rate": 5.290161026456539e-05, "loss": 2.2453, "step": 106952 }, { "epoch": 0.67, "learning_rate": 5.289540361860099e-05, "loss": 2.2577, "step": 106960 }, { "epoch": 0.67, "learning_rate": 5.288919714925766e-05, "loss": 2.2478, "step": 106968 }, { "epoch": 0.67, "learning_rate": 5.2882990856689686e-05, "loss": 2.2463, "step": 106976 }, { "epoch": 0.67, "learning_rate": 5.2876784741051336e-05, "loss": 2.2451, "step": 106984 }, { "epoch": 0.67, "learning_rate": 5.287057880249694e-05, "loss": 2.2404, "step": 106992 }, { "epoch": 0.67, "learning_rate": 5.286437304118075e-05, "loss": 2.2401, "step": 107000 }, { "epoch": 0.67, "learning_rate": 5.285816745725703e-05, "loss": 2.2451, "step": 107008 }, { "epoch": 0.67, "learning_rate": 5.28519620508801e-05, "loss": 2.2519, "step": 107016 }, { "epoch": 0.67, "learning_rate": 5.284575682220416e-05, "loss": 2.2466, "step": 107024 }, { "epoch": 0.67, "learning_rate": 5.2839551771383534e-05, "loss": 2.2522, "step": 107032 }, { "epoch": 0.67, "learning_rate": 5.283334689857244e-05, "loss": 2.2386, "step": 107040 }, { "epoch": 0.67, "learning_rate": 5.282714220392515e-05, "loss": 2.2453, "step": 107048 }, { "epoch": 0.67, "learning_rate": 5.282093768759592e-05, "loss": 2.2382, "step": 107056 }, { "epoch": 0.67, "learning_rate": 5.281473334973897e-05, "loss": 2.2464, "step": 107064 }, { "epoch": 0.67, "learning_rate": 5.280852919050856e-05, "loss": 2.2494, "step": 107072 }, { "epoch": 0.67, "learning_rate": 5.280232521005892e-05, "loss": 2.2485, "step": 107080 }, { "epoch": 0.67, "learning_rate": 5.2796121408544284e-05, "loss": 2.2541, "step": 107088 }, { "epoch": 0.67, "learning_rate": 5.2789917786118906e-05, "loss": 2.2347, "step": 107096 }, { "epoch": 0.67, "learning_rate": 5.278371434293694e-05, "loss": 2.2377, "step": 107104 }, { "epoch": 0.67, "learning_rate": 5.277751107915265e-05, "loss": 2.2443, "step": 107112 }, { "epoch": 0.67, "learning_rate": 5.277130799492025e-05, "loss": 2.2503, "step": 107120 }, { "epoch": 0.67, "learning_rate": 5.276510509039396e-05, "loss": 2.2288, "step": 107128 }, { "epoch": 0.67, "learning_rate": 5.2758902365727955e-05, "loss": 2.2391, "step": 107136 }, { "epoch": 0.67, "learning_rate": 5.275269982107645e-05, "loss": 2.2287, "step": 107144 }, { "epoch": 0.67, "learning_rate": 5.274649745659366e-05, "loss": 2.2493, "step": 107152 }, { "epoch": 0.67, "learning_rate": 5.2740295272433735e-05, "loss": 2.2337, "step": 107160 }, { "epoch": 0.67, "learning_rate": 5.273409326875087e-05, "loss": 2.2474, "step": 107168 }, { "epoch": 0.67, "learning_rate": 5.272789144569929e-05, "loss": 2.2354, "step": 107176 }, { "epoch": 0.67, "learning_rate": 5.272168980343315e-05, "loss": 2.2308, "step": 107184 }, { "epoch": 0.67, "learning_rate": 5.27154883421066e-05, "loss": 2.2467, "step": 107192 }, { "epoch": 0.67, "learning_rate": 5.270928706187381e-05, "loss": 2.2419, "step": 107200 }, { "epoch": 0.67, "learning_rate": 5.2703085962889e-05, "loss": 2.2448, "step": 107208 }, { "epoch": 0.67, "learning_rate": 5.2696885045306274e-05, "loss": 2.2428, "step": 107216 }, { "epoch": 0.67, "learning_rate": 5.269068430927979e-05, "loss": 2.2287, "step": 107224 }, { "epoch": 0.67, "learning_rate": 5.2684483754963746e-05, "loss": 2.2458, "step": 107232 }, { "epoch": 0.67, "learning_rate": 5.267828338251224e-05, "loss": 2.2387, "step": 107240 }, { "epoch": 0.67, "learning_rate": 5.2672083192079426e-05, "loss": 2.2402, "step": 107248 }, { "epoch": 0.67, "learning_rate": 5.266588318381945e-05, "loss": 2.2392, "step": 107256 }, { "epoch": 0.67, "learning_rate": 5.265968335788645e-05, "loss": 2.2389, "step": 107264 }, { "epoch": 0.67, "learning_rate": 5.265348371443453e-05, "loss": 2.2454, "step": 107272 }, { "epoch": 0.67, "learning_rate": 5.264728425361782e-05, "loss": 2.247, "step": 107280 }, { "epoch": 0.67, "learning_rate": 5.264108497559048e-05, "loss": 2.2452, "step": 107288 }, { "epoch": 0.67, "learning_rate": 5.263488588050658e-05, "loss": 2.2464, "step": 107296 }, { "epoch": 0.67, "learning_rate": 5.2628686968520235e-05, "loss": 2.2383, "step": 107304 }, { "epoch": 0.67, "learning_rate": 5.2622488239785575e-05, "loss": 2.2512, "step": 107312 }, { "epoch": 0.67, "learning_rate": 5.261628969445667e-05, "loss": 2.2438, "step": 107320 }, { "epoch": 0.67, "learning_rate": 5.2610091332687615e-05, "loss": 2.2564, "step": 107328 }, { "epoch": 0.67, "learning_rate": 5.2603893154632546e-05, "loss": 2.2349, "step": 107336 }, { "epoch": 0.67, "learning_rate": 5.259769516044553e-05, "loss": 2.2547, "step": 107344 }, { "epoch": 0.67, "learning_rate": 5.2591497350280614e-05, "loss": 2.2296, "step": 107352 }, { "epoch": 0.67, "learning_rate": 5.2585299724291914e-05, "loss": 2.2388, "step": 107360 }, { "epoch": 0.67, "learning_rate": 5.257910228263352e-05, "loss": 2.2603, "step": 107368 }, { "epoch": 0.67, "learning_rate": 5.2572905025459466e-05, "loss": 2.2363, "step": 107376 }, { "epoch": 0.67, "learning_rate": 5.25667079529238e-05, "loss": 2.2421, "step": 107384 }, { "epoch": 0.67, "learning_rate": 5.256051106518064e-05, "loss": 2.2502, "step": 107392 }, { "epoch": 0.67, "learning_rate": 5.2554314362383996e-05, "loss": 2.239, "step": 107400 }, { "epoch": 0.67, "learning_rate": 5.2548117844687925e-05, "loss": 2.2325, "step": 107408 }, { "epoch": 0.67, "learning_rate": 5.2541921512246485e-05, "loss": 2.2479, "step": 107416 }, { "epoch": 0.67, "learning_rate": 5.253572536521372e-05, "loss": 2.23, "step": 107424 }, { "epoch": 0.67, "learning_rate": 5.252952940374365e-05, "loss": 2.242, "step": 107432 }, { "epoch": 0.67, "learning_rate": 5.2523333627990325e-05, "loss": 2.235, "step": 107440 }, { "epoch": 0.67, "learning_rate": 5.251713803810777e-05, "loss": 2.2521, "step": 107448 }, { "epoch": 0.67, "learning_rate": 5.2510942634249984e-05, "loss": 2.2306, "step": 107456 }, { "epoch": 0.67, "learning_rate": 5.250474741657102e-05, "loss": 2.249, "step": 107464 }, { "epoch": 0.67, "learning_rate": 5.249855238522487e-05, "loss": 2.2573, "step": 107472 }, { "epoch": 0.67, "learning_rate": 5.249235754036556e-05, "loss": 2.2298, "step": 107480 }, { "epoch": 0.67, "learning_rate": 5.248616288214707e-05, "loss": 2.2541, "step": 107488 }, { "epoch": 0.67, "learning_rate": 5.247996841072342e-05, "loss": 2.2371, "step": 107496 }, { "epoch": 0.67, "learning_rate": 5.2473774126248595e-05, "loss": 2.2438, "step": 107504 }, { "epoch": 0.67, "learning_rate": 5.24675800288766e-05, "loss": 2.2407, "step": 107512 }, { "epoch": 0.67, "learning_rate": 5.246138611876139e-05, "loss": 2.247, "step": 107520 }, { "epoch": 0.67, "learning_rate": 5.2455192396057004e-05, "loss": 2.253, "step": 107528 }, { "epoch": 0.67, "learning_rate": 5.244899886091734e-05, "loss": 2.2651, "step": 107536 }, { "epoch": 0.67, "learning_rate": 5.244280551349643e-05, "loss": 2.2462, "step": 107544 }, { "epoch": 0.67, "learning_rate": 5.243661235394821e-05, "loss": 2.2551, "step": 107552 }, { "epoch": 0.67, "learning_rate": 5.2430419382426686e-05, "loss": 2.2501, "step": 107560 }, { "epoch": 0.67, "learning_rate": 5.242422659908576e-05, "loss": 2.2573, "step": 107568 }, { "epoch": 0.67, "learning_rate": 5.241803400407941e-05, "loss": 2.2378, "step": 107576 }, { "epoch": 0.67, "learning_rate": 5.241184159756161e-05, "loss": 2.2518, "step": 107584 }, { "epoch": 0.67, "learning_rate": 5.240564937968626e-05, "loss": 2.2512, "step": 107592 }, { "epoch": 0.67, "learning_rate": 5.2399457350607314e-05, "loss": 2.2475, "step": 107600 }, { "epoch": 0.67, "learning_rate": 5.239326551047873e-05, "loss": 2.246, "step": 107608 }, { "epoch": 0.67, "learning_rate": 5.2387073859454406e-05, "loss": 2.2398, "step": 107616 }, { "epoch": 0.67, "learning_rate": 5.238088239768828e-05, "loss": 2.2579, "step": 107624 }, { "epoch": 0.67, "learning_rate": 5.2374691125334266e-05, "loss": 2.2408, "step": 107632 }, { "epoch": 0.67, "learning_rate": 5.23685000425463e-05, "loss": 2.2442, "step": 107640 }, { "epoch": 0.67, "learning_rate": 5.236230914947826e-05, "loss": 2.2504, "step": 107648 }, { "epoch": 0.67, "learning_rate": 5.235611844628408e-05, "loss": 2.239, "step": 107656 }, { "epoch": 0.67, "learning_rate": 5.234992793311767e-05, "loss": 2.2504, "step": 107664 }, { "epoch": 0.67, "learning_rate": 5.2343737610132895e-05, "loss": 2.2481, "step": 107672 }, { "epoch": 0.67, "learning_rate": 5.233754747748366e-05, "loss": 2.2541, "step": 107680 }, { "epoch": 0.67, "learning_rate": 5.2331357535323854e-05, "loss": 2.252, "step": 107688 }, { "epoch": 0.67, "learning_rate": 5.2325167783807374e-05, "loss": 2.2487, "step": 107696 }, { "epoch": 0.67, "learning_rate": 5.2318978223088066e-05, "loss": 2.2578, "step": 107704 }, { "epoch": 0.67, "learning_rate": 5.231278885331983e-05, "loss": 2.2567, "step": 107712 }, { "epoch": 0.67, "learning_rate": 5.2306599674656534e-05, "loss": 2.2408, "step": 107720 }, { "epoch": 0.67, "learning_rate": 5.230041068725202e-05, "loss": 2.2462, "step": 107728 }, { "epoch": 0.67, "learning_rate": 5.2294221891260165e-05, "loss": 2.2605, "step": 107736 }, { "epoch": 0.67, "learning_rate": 5.228803328683483e-05, "loss": 2.2536, "step": 107744 }, { "epoch": 0.67, "learning_rate": 5.2281844874129835e-05, "loss": 2.2602, "step": 107752 }, { "epoch": 0.67, "learning_rate": 5.2275656653299034e-05, "loss": 2.24, "step": 107760 }, { "epoch": 0.67, "learning_rate": 5.226946862449629e-05, "loss": 2.2392, "step": 107768 }, { "epoch": 0.67, "learning_rate": 5.226328078787544e-05, "loss": 2.2423, "step": 107776 }, { "epoch": 0.67, "learning_rate": 5.225709314359027e-05, "loss": 2.2349, "step": 107784 }, { "epoch": 0.67, "learning_rate": 5.2250905691794636e-05, "loss": 2.2346, "step": 107792 }, { "epoch": 0.67, "learning_rate": 5.224471843264238e-05, "loss": 2.2555, "step": 107800 }, { "epoch": 0.67, "learning_rate": 5.223853136628727e-05, "loss": 2.2434, "step": 107808 }, { "epoch": 0.67, "learning_rate": 5.2232344492883144e-05, "loss": 2.2386, "step": 107816 }, { "epoch": 0.67, "learning_rate": 5.22261578125838e-05, "loss": 2.2369, "step": 107824 }, { "epoch": 0.67, "learning_rate": 5.2219971325543085e-05, "loss": 2.2414, "step": 107832 }, { "epoch": 0.67, "learning_rate": 5.221378503191472e-05, "loss": 2.2342, "step": 107840 }, { "epoch": 0.67, "learning_rate": 5.220759893185252e-05, "loss": 2.2489, "step": 107848 }, { "epoch": 0.67, "learning_rate": 5.2201413025510315e-05, "loss": 2.2451, "step": 107856 }, { "epoch": 0.67, "learning_rate": 5.219522731304185e-05, "loss": 2.242, "step": 107864 }, { "epoch": 0.67, "learning_rate": 5.218904179460089e-05, "loss": 2.2308, "step": 107872 }, { "epoch": 0.67, "learning_rate": 5.2182856470341245e-05, "loss": 2.2543, "step": 107880 }, { "epoch": 0.67, "learning_rate": 5.217667134041666e-05, "loss": 2.2383, "step": 107888 }, { "epoch": 0.67, "learning_rate": 5.217048640498091e-05, "loss": 2.2345, "step": 107896 }, { "epoch": 0.67, "learning_rate": 5.216430166418774e-05, "loss": 2.2477, "step": 107904 }, { "epoch": 0.67, "learning_rate": 5.2158117118190916e-05, "loss": 2.2362, "step": 107912 }, { "epoch": 0.67, "learning_rate": 5.215193276714417e-05, "loss": 2.2435, "step": 107920 }, { "epoch": 0.67, "learning_rate": 5.214574861120127e-05, "loss": 2.2524, "step": 107928 }, { "epoch": 0.67, "learning_rate": 5.213956465051595e-05, "loss": 2.2434, "step": 107936 }, { "epoch": 0.67, "learning_rate": 5.21333808852419e-05, "loss": 2.2569, "step": 107944 }, { "epoch": 0.67, "learning_rate": 5.212719731553291e-05, "loss": 2.2267, "step": 107952 }, { "epoch": 0.67, "learning_rate": 5.2121013941542675e-05, "loss": 2.2345, "step": 107960 }, { "epoch": 0.67, "learning_rate": 5.211483076342491e-05, "loss": 2.2596, "step": 107968 }, { "epoch": 0.67, "learning_rate": 5.210864778133333e-05, "loss": 2.2473, "step": 107976 }, { "epoch": 0.67, "learning_rate": 5.2102464995421654e-05, "loss": 2.2535, "step": 107984 }, { "epoch": 0.67, "learning_rate": 5.209628240584361e-05, "loss": 2.2541, "step": 107992 }, { "epoch": 0.68, "learning_rate": 5.209010001275285e-05, "loss": 2.2342, "step": 108000 }, { "epoch": 0.68, "learning_rate": 5.208391781630307e-05, "loss": 2.243, "step": 108008 }, { "epoch": 0.68, "learning_rate": 5.207773581664803e-05, "loss": 2.2403, "step": 108016 }, { "epoch": 0.68, "learning_rate": 5.2071554013941334e-05, "loss": 2.2519, "step": 108024 }, { "epoch": 0.68, "learning_rate": 5.2065372408336696e-05, "loss": 2.2556, "step": 108032 }, { "epoch": 0.68, "learning_rate": 5.2059190999987796e-05, "loss": 2.2471, "step": 108040 }, { "epoch": 0.68, "learning_rate": 5.20530097890483e-05, "loss": 2.2296, "step": 108048 }, { "epoch": 0.68, "learning_rate": 5.204682877567187e-05, "loss": 2.2438, "step": 108056 }, { "epoch": 0.68, "learning_rate": 5.204064796001218e-05, "loss": 2.2287, "step": 108064 }, { "epoch": 0.68, "learning_rate": 5.203446734222286e-05, "loss": 2.2427, "step": 108072 }, { "epoch": 0.68, "learning_rate": 5.202828692245758e-05, "loss": 2.2481, "step": 108080 }, { "epoch": 0.68, "learning_rate": 5.202210670086998e-05, "loss": 2.2385, "step": 108088 }, { "epoch": 0.68, "learning_rate": 5.2015926677613716e-05, "loss": 2.2479, "step": 108096 }, { "epoch": 0.68, "learning_rate": 5.200974685284239e-05, "loss": 2.2634, "step": 108104 }, { "epoch": 0.68, "learning_rate": 5.200356722670967e-05, "loss": 2.243, "step": 108112 }, { "epoch": 0.68, "learning_rate": 5.199738779936916e-05, "loss": 2.2223, "step": 108120 }, { "epoch": 0.68, "learning_rate": 5.199120857097448e-05, "loss": 2.2586, "step": 108128 }, { "epoch": 0.68, "learning_rate": 5.1985029541679254e-05, "loss": 2.2535, "step": 108136 }, { "epoch": 0.68, "learning_rate": 5.1978850711637104e-05, "loss": 2.2574, "step": 108144 }, { "epoch": 0.68, "learning_rate": 5.1972672081001627e-05, "loss": 2.2357, "step": 108152 }, { "epoch": 0.68, "learning_rate": 5.196649364992641e-05, "loss": 2.2511, "step": 108160 }, { "epoch": 0.68, "learning_rate": 5.1960315418565063e-05, "loss": 2.2481, "step": 108168 }, { "epoch": 0.68, "learning_rate": 5.195413738707118e-05, "loss": 2.2447, "step": 108176 }, { "epoch": 0.68, "learning_rate": 5.1947959555598366e-05, "loss": 2.2513, "step": 108184 }, { "epoch": 0.68, "learning_rate": 5.1941781924300146e-05, "loss": 2.2449, "step": 108192 }, { "epoch": 0.68, "learning_rate": 5.193560449333015e-05, "loss": 2.2392, "step": 108200 }, { "epoch": 0.68, "learning_rate": 5.192942726284193e-05, "loss": 2.2463, "step": 108208 }, { "epoch": 0.68, "learning_rate": 5.192325023298905e-05, "loss": 2.2338, "step": 108216 }, { "epoch": 0.68, "learning_rate": 5.1917073403925067e-05, "loss": 2.2368, "step": 108224 }, { "epoch": 0.68, "learning_rate": 5.191089677580356e-05, "loss": 2.2345, "step": 108232 }, { "epoch": 0.68, "learning_rate": 5.190472034877807e-05, "loss": 2.242, "step": 108240 }, { "epoch": 0.68, "learning_rate": 5.1898544123002125e-05, "loss": 2.2567, "step": 108248 }, { "epoch": 0.68, "learning_rate": 5.189236809862929e-05, "loss": 2.2407, "step": 108256 }, { "epoch": 0.68, "learning_rate": 5.188619227581311e-05, "loss": 2.2398, "step": 108264 }, { "epoch": 0.68, "learning_rate": 5.188001665470708e-05, "loss": 2.2386, "step": 108272 }, { "epoch": 0.68, "learning_rate": 5.187384123546475e-05, "loss": 2.2398, "step": 108280 }, { "epoch": 0.68, "learning_rate": 5.186766601823965e-05, "loss": 2.2385, "step": 108288 }, { "epoch": 0.68, "learning_rate": 5.186149100318526e-05, "loss": 2.2321, "step": 108296 }, { "epoch": 0.68, "learning_rate": 5.185531619045513e-05, "loss": 2.2337, "step": 108304 }, { "epoch": 0.68, "learning_rate": 5.184914158020275e-05, "loss": 2.2455, "step": 108312 }, { "epoch": 0.68, "learning_rate": 5.1842967172581636e-05, "loss": 2.252, "step": 108320 }, { "epoch": 0.68, "learning_rate": 5.183679296774526e-05, "loss": 2.2442, "step": 108328 }, { "epoch": 0.68, "learning_rate": 5.1830618965847134e-05, "loss": 2.235, "step": 108336 }, { "epoch": 0.68, "learning_rate": 5.1824445167040746e-05, "loss": 2.2358, "step": 108344 }, { "epoch": 0.68, "learning_rate": 5.181827157147956e-05, "loss": 2.2614, "step": 108352 }, { "epoch": 0.68, "learning_rate": 5.181209817931705e-05, "loss": 2.2345, "step": 108360 }, { "epoch": 0.68, "learning_rate": 5.180592499070672e-05, "loss": 2.232, "step": 108368 }, { "epoch": 0.68, "learning_rate": 5.179975200580199e-05, "loss": 2.234, "step": 108376 }, { "epoch": 0.68, "learning_rate": 5.179357922475636e-05, "loss": 2.2424, "step": 108384 }, { "epoch": 0.68, "learning_rate": 5.178740664772326e-05, "loss": 2.2437, "step": 108392 }, { "epoch": 0.68, "learning_rate": 5.178123427485617e-05, "loss": 2.2427, "step": 108400 }, { "epoch": 0.68, "learning_rate": 5.177506210630851e-05, "loss": 2.2407, "step": 108408 }, { "epoch": 0.68, "learning_rate": 5.1768890142233716e-05, "loss": 2.2352, "step": 108416 }, { "epoch": 0.68, "learning_rate": 5.176271838278527e-05, "loss": 2.2305, "step": 108424 }, { "epoch": 0.68, "learning_rate": 5.175654682811655e-05, "loss": 2.238, "step": 108432 }, { "epoch": 0.68, "learning_rate": 5.175037547838098e-05, "loss": 2.2306, "step": 108440 }, { "epoch": 0.68, "learning_rate": 5.174420433373204e-05, "loss": 2.2458, "step": 108448 }, { "epoch": 0.68, "learning_rate": 5.1738033394323085e-05, "loss": 2.2426, "step": 108456 }, { "epoch": 0.68, "learning_rate": 5.173186266030754e-05, "loss": 2.2567, "step": 108464 }, { "epoch": 0.68, "learning_rate": 5.172569213183882e-05, "loss": 2.2534, "step": 108472 }, { "epoch": 0.68, "learning_rate": 5.1719521809070336e-05, "loss": 2.2528, "step": 108480 }, { "epoch": 0.68, "learning_rate": 5.171335169215545e-05, "loss": 2.247, "step": 108488 }, { "epoch": 0.68, "learning_rate": 5.1707181781247584e-05, "loss": 2.2624, "step": 108496 }, { "epoch": 0.68, "learning_rate": 5.170101207650011e-05, "loss": 2.2456, "step": 108504 }, { "epoch": 0.68, "learning_rate": 5.1694842578066397e-05, "loss": 2.2419, "step": 108512 }, { "epoch": 0.68, "learning_rate": 5.168867328609983e-05, "loss": 2.2347, "step": 108520 }, { "epoch": 0.68, "learning_rate": 5.168250420075378e-05, "loss": 2.251, "step": 108528 }, { "epoch": 0.68, "learning_rate": 5.1676335322181613e-05, "loss": 2.2219, "step": 108536 }, { "epoch": 0.68, "learning_rate": 5.167016665053668e-05, "loss": 2.2462, "step": 108544 }, { "epoch": 0.68, "learning_rate": 5.166399818597234e-05, "loss": 2.2306, "step": 108552 }, { "epoch": 0.68, "learning_rate": 5.165782992864194e-05, "loss": 2.2367, "step": 108560 }, { "epoch": 0.68, "learning_rate": 5.165166187869883e-05, "loss": 2.2296, "step": 108568 }, { "epoch": 0.68, "learning_rate": 5.1645494036296326e-05, "loss": 2.2453, "step": 108576 }, { "epoch": 0.68, "learning_rate": 5.1639326401587804e-05, "loss": 2.2515, "step": 108584 }, { "epoch": 0.68, "learning_rate": 5.1633158974726536e-05, "loss": 2.2376, "step": 108592 }, { "epoch": 0.68, "learning_rate": 5.16269917558659e-05, "loss": 2.242, "step": 108600 }, { "epoch": 0.68, "learning_rate": 5.162082474515917e-05, "loss": 2.2501, "step": 108608 }, { "epoch": 0.68, "learning_rate": 5.1614657942759706e-05, "loss": 2.2362, "step": 108616 }, { "epoch": 0.68, "learning_rate": 5.160849134882075e-05, "loss": 2.2622, "step": 108624 }, { "epoch": 0.68, "learning_rate": 5.160232496349564e-05, "loss": 2.239, "step": 108632 }, { "epoch": 0.68, "learning_rate": 5.159615878693771e-05, "loss": 2.2518, "step": 108640 }, { "epoch": 0.68, "learning_rate": 5.158999281930019e-05, "loss": 2.271, "step": 108648 }, { "epoch": 0.68, "learning_rate": 5.158382706073639e-05, "loss": 2.2458, "step": 108656 }, { "epoch": 0.68, "learning_rate": 5.15776615113996e-05, "loss": 2.2495, "step": 108664 }, { "epoch": 0.68, "learning_rate": 5.15714961714431e-05, "loss": 2.2411, "step": 108672 }, { "epoch": 0.68, "learning_rate": 5.156533104102013e-05, "loss": 2.2437, "step": 108680 }, { "epoch": 0.68, "learning_rate": 5.1559166120284e-05, "loss": 2.2347, "step": 108688 }, { "epoch": 0.68, "learning_rate": 5.1553001409387925e-05, "loss": 2.2444, "step": 108696 }, { "epoch": 0.68, "learning_rate": 5.15468369084852e-05, "loss": 2.253, "step": 108704 }, { "epoch": 0.68, "learning_rate": 5.1540672617729036e-05, "loss": 2.2491, "step": 108712 }, { "epoch": 0.68, "learning_rate": 5.153450853727273e-05, "loss": 2.2399, "step": 108720 }, { "epoch": 0.68, "learning_rate": 5.152834466726947e-05, "loss": 2.2418, "step": 108728 }, { "epoch": 0.68, "learning_rate": 5.1522181007872515e-05, "loss": 2.2337, "step": 108736 }, { "epoch": 0.68, "learning_rate": 5.15160175592351e-05, "loss": 2.2456, "step": 108744 }, { "epoch": 0.68, "learning_rate": 5.150985432151043e-05, "loss": 2.2418, "step": 108752 }, { "epoch": 0.68, "learning_rate": 5.150369129485173e-05, "loss": 2.2336, "step": 108760 }, { "epoch": 0.68, "learning_rate": 5.149752847941223e-05, "loss": 2.2402, "step": 108768 }, { "epoch": 0.68, "learning_rate": 5.149136587534513e-05, "loss": 2.2486, "step": 108776 }, { "epoch": 0.68, "learning_rate": 5.148520348280361e-05, "loss": 2.2404, "step": 108784 }, { "epoch": 0.68, "learning_rate": 5.14790413019409e-05, "loss": 2.2446, "step": 108792 }, { "epoch": 0.68, "learning_rate": 5.147287933291018e-05, "loss": 2.2257, "step": 108800 }, { "epoch": 0.68, "learning_rate": 5.1466717575864646e-05, "loss": 2.2374, "step": 108808 }, { "epoch": 0.68, "learning_rate": 5.146055603095744e-05, "loss": 2.247, "step": 108816 }, { "epoch": 0.68, "learning_rate": 5.145439469834179e-05, "loss": 2.2362, "step": 108824 }, { "epoch": 0.68, "learning_rate": 5.1448233578170856e-05, "loss": 2.2275, "step": 108832 }, { "epoch": 0.68, "learning_rate": 5.144207267059778e-05, "loss": 2.2342, "step": 108840 }, { "epoch": 0.68, "learning_rate": 5.143591197577573e-05, "loss": 2.2506, "step": 108848 }, { "epoch": 0.68, "learning_rate": 5.142975149385789e-05, "loss": 2.249, "step": 108856 }, { "epoch": 0.68, "learning_rate": 5.142359122499738e-05, "loss": 2.247, "step": 108864 }, { "epoch": 0.68, "learning_rate": 5.141743116934734e-05, "loss": 2.2444, "step": 108872 }, { "epoch": 0.68, "learning_rate": 5.1411271327060936e-05, "loss": 2.2513, "step": 108880 }, { "epoch": 0.68, "learning_rate": 5.1405111698291296e-05, "loss": 2.2437, "step": 108888 }, { "epoch": 0.68, "learning_rate": 5.1398952283191536e-05, "loss": 2.2307, "step": 108896 }, { "epoch": 0.68, "learning_rate": 5.13927930819148e-05, "loss": 2.2518, "step": 108904 }, { "epoch": 0.68, "learning_rate": 5.13866340946142e-05, "loss": 2.2552, "step": 108912 }, { "epoch": 0.68, "learning_rate": 5.138047532144281e-05, "loss": 2.2477, "step": 108920 }, { "epoch": 0.68, "learning_rate": 5.137431676255379e-05, "loss": 2.2486, "step": 108928 }, { "epoch": 0.68, "learning_rate": 5.136815841810022e-05, "loss": 2.2612, "step": 108936 }, { "epoch": 0.68, "learning_rate": 5.13620002882352e-05, "loss": 2.2367, "step": 108944 }, { "epoch": 0.68, "learning_rate": 5.1355842373111815e-05, "loss": 2.242, "step": 108952 }, { "epoch": 0.68, "learning_rate": 5.134968467288317e-05, "loss": 2.256, "step": 108960 }, { "epoch": 0.68, "learning_rate": 5.134352718770233e-05, "loss": 2.2487, "step": 108968 }, { "epoch": 0.68, "learning_rate": 5.1337369917722376e-05, "loss": 2.2453, "step": 108976 }, { "epoch": 0.68, "learning_rate": 5.133121286309638e-05, "loss": 2.2613, "step": 108984 }, { "epoch": 0.68, "learning_rate": 5.1325056023977416e-05, "loss": 2.2421, "step": 108992 }, { "epoch": 0.68, "learning_rate": 5.1318899400518504e-05, "loss": 2.2389, "step": 109000 }, { "epoch": 0.68, "learning_rate": 5.1312742992872745e-05, "loss": 2.2503, "step": 109008 }, { "epoch": 0.68, "learning_rate": 5.130658680119316e-05, "loss": 2.2445, "step": 109016 }, { "epoch": 0.68, "learning_rate": 5.1300430825632826e-05, "loss": 2.228, "step": 109024 }, { "epoch": 0.68, "learning_rate": 5.129427506634473e-05, "loss": 2.2521, "step": 109032 }, { "epoch": 0.68, "learning_rate": 5.128811952348194e-05, "loss": 2.2573, "step": 109040 }, { "epoch": 0.68, "learning_rate": 5.12819641971975e-05, "loss": 2.2569, "step": 109048 }, { "epoch": 0.68, "learning_rate": 5.1275809087644375e-05, "loss": 2.2354, "step": 109056 }, { "epoch": 0.68, "learning_rate": 5.126965419497562e-05, "loss": 2.2492, "step": 109064 }, { "epoch": 0.68, "learning_rate": 5.126349951934426e-05, "loss": 2.2326, "step": 109072 }, { "epoch": 0.68, "learning_rate": 5.125734506090327e-05, "loss": 2.2545, "step": 109080 }, { "epoch": 0.68, "learning_rate": 5.125119081980567e-05, "loss": 2.2438, "step": 109088 }, { "epoch": 0.68, "learning_rate": 5.1245036796204424e-05, "loss": 2.2468, "step": 109096 }, { "epoch": 0.68, "learning_rate": 5.123888299025259e-05, "loss": 2.2616, "step": 109104 }, { "epoch": 0.68, "learning_rate": 5.1232729402103075e-05, "loss": 2.2424, "step": 109112 }, { "epoch": 0.68, "learning_rate": 5.122657603190889e-05, "loss": 2.2483, "step": 109120 }, { "epoch": 0.68, "learning_rate": 5.1220422879823024e-05, "loss": 2.2366, "step": 109128 }, { "epoch": 0.68, "learning_rate": 5.121426994599843e-05, "loss": 2.237, "step": 109136 }, { "epoch": 0.68, "learning_rate": 5.1208117230588045e-05, "loss": 2.2192, "step": 109144 }, { "epoch": 0.68, "learning_rate": 5.1201964733744876e-05, "loss": 2.2275, "step": 109152 }, { "epoch": 0.68, "learning_rate": 5.119581245562185e-05, "loss": 2.2356, "step": 109160 }, { "epoch": 0.68, "learning_rate": 5.11896603963719e-05, "loss": 2.2611, "step": 109168 }, { "epoch": 0.68, "learning_rate": 5.118350855614799e-05, "loss": 2.2623, "step": 109176 }, { "epoch": 0.68, "learning_rate": 5.117735693510306e-05, "loss": 2.2605, "step": 109184 }, { "epoch": 0.68, "learning_rate": 5.117120553339001e-05, "loss": 2.2348, "step": 109192 }, { "epoch": 0.68, "learning_rate": 5.116505435116178e-05, "loss": 2.2452, "step": 109200 }, { "epoch": 0.68, "learning_rate": 5.1158903388571313e-05, "loss": 2.2444, "step": 109208 }, { "epoch": 0.68, "learning_rate": 5.115275264577146e-05, "loss": 2.2327, "step": 109216 }, { "epoch": 0.68, "learning_rate": 5.11466021229152e-05, "loss": 2.2259, "step": 109224 }, { "epoch": 0.68, "learning_rate": 5.114045182015539e-05, "loss": 2.2309, "step": 109232 }, { "epoch": 0.68, "learning_rate": 5.113430173764495e-05, "loss": 2.2492, "step": 109240 }, { "epoch": 0.68, "learning_rate": 5.112815187553675e-05, "loss": 2.2139, "step": 109248 }, { "epoch": 0.68, "learning_rate": 5.11220022339837e-05, "loss": 2.236, "step": 109256 }, { "epoch": 0.68, "learning_rate": 5.1115852813138685e-05, "loss": 2.2414, "step": 109264 }, { "epoch": 0.68, "learning_rate": 5.1109703613154544e-05, "loss": 2.2513, "step": 109272 }, { "epoch": 0.68, "learning_rate": 5.110355463418418e-05, "loss": 2.2361, "step": 109280 }, { "epoch": 0.68, "learning_rate": 5.1097405876380454e-05, "loss": 2.2272, "step": 109288 }, { "epoch": 0.68, "learning_rate": 5.1091257339896194e-05, "loss": 2.2373, "step": 109296 }, { "epoch": 0.68, "learning_rate": 5.1085109024884284e-05, "loss": 2.2335, "step": 109304 }, { "epoch": 0.68, "learning_rate": 5.107896093149757e-05, "loss": 2.2647, "step": 109312 }, { "epoch": 0.68, "learning_rate": 5.1072813059888894e-05, "loss": 2.2577, "step": 109320 }, { "epoch": 0.68, "learning_rate": 5.1066665410211064e-05, "loss": 2.2502, "step": 109328 }, { "epoch": 0.68, "learning_rate": 5.106051798261695e-05, "loss": 2.2464, "step": 109336 }, { "epoch": 0.68, "learning_rate": 5.105437077725936e-05, "loss": 2.2311, "step": 109344 }, { "epoch": 0.68, "learning_rate": 5.1048223794291126e-05, "loss": 2.242, "step": 109352 }, { "epoch": 0.68, "learning_rate": 5.1042077033865035e-05, "loss": 2.2425, "step": 109360 }, { "epoch": 0.68, "learning_rate": 5.103593049613391e-05, "loss": 2.238, "step": 109368 }, { "epoch": 0.68, "learning_rate": 5.1029784181250584e-05, "loss": 2.2447, "step": 109376 }, { "epoch": 0.68, "learning_rate": 5.102363808936781e-05, "loss": 2.2479, "step": 109384 }, { "epoch": 0.68, "learning_rate": 5.101749222063841e-05, "loss": 2.2396, "step": 109392 }, { "epoch": 0.68, "learning_rate": 5.101134657521516e-05, "loss": 2.2243, "step": 109400 }, { "epoch": 0.68, "learning_rate": 5.100520115325084e-05, "loss": 2.2265, "step": 109408 }, { "epoch": 0.68, "learning_rate": 5.0999055954898224e-05, "loss": 2.2445, "step": 109416 }, { "epoch": 0.68, "learning_rate": 5.0992910980310104e-05, "loss": 2.2482, "step": 109424 }, { "epoch": 0.68, "learning_rate": 5.09867662296392e-05, "loss": 2.2301, "step": 109432 }, { "epoch": 0.68, "learning_rate": 5.0980621703038324e-05, "loss": 2.2461, "step": 109440 }, { "epoch": 0.68, "learning_rate": 5.097447740066019e-05, "loss": 2.2419, "step": 109448 }, { "epoch": 0.68, "learning_rate": 5.096833332265758e-05, "loss": 2.2359, "step": 109456 }, { "epoch": 0.68, "learning_rate": 5.09621894691832e-05, "loss": 2.2271, "step": 109464 }, { "epoch": 0.68, "learning_rate": 5.095604584038979e-05, "loss": 2.2401, "step": 109472 }, { "epoch": 0.68, "learning_rate": 5.094990243643012e-05, "loss": 2.2316, "step": 109480 }, { "epoch": 0.68, "learning_rate": 5.094375925745689e-05, "loss": 2.2398, "step": 109488 }, { "epoch": 0.68, "learning_rate": 5.0937616303622804e-05, "loss": 2.2407, "step": 109496 }, { "epoch": 0.68, "learning_rate": 5.093147357508061e-05, "loss": 2.2305, "step": 109504 }, { "epoch": 0.68, "learning_rate": 5.0925331071982984e-05, "loss": 2.2319, "step": 109512 }, { "epoch": 0.68, "learning_rate": 5.091918879448265e-05, "loss": 2.2279, "step": 109520 }, { "epoch": 0.68, "learning_rate": 5.091304674273231e-05, "loss": 2.2373, "step": 109528 }, { "epoch": 0.68, "learning_rate": 5.090690491688465e-05, "loss": 2.2472, "step": 109536 }, { "epoch": 0.68, "learning_rate": 5.0900763317092345e-05, "loss": 2.2416, "step": 109544 }, { "epoch": 0.68, "learning_rate": 5.089462194350808e-05, "loss": 2.2317, "step": 109552 }, { "epoch": 0.68, "learning_rate": 5.0888480796284545e-05, "loss": 2.2386, "step": 109560 }, { "epoch": 0.68, "learning_rate": 5.0882339875574406e-05, "loss": 2.2303, "step": 109568 }, { "epoch": 0.68, "learning_rate": 5.0876199181530304e-05, "loss": 2.2415, "step": 109576 }, { "epoch": 0.68, "learning_rate": 5.0870058714304915e-05, "loss": 2.2357, "step": 109584 }, { "epoch": 0.68, "learning_rate": 5.0863918474050895e-05, "loss": 2.2265, "step": 109592 }, { "epoch": 0.69, "learning_rate": 5.08577784609209e-05, "loss": 2.2499, "step": 109600 }, { "epoch": 0.69, "learning_rate": 5.0851638675067536e-05, "loss": 2.2472, "step": 109608 }, { "epoch": 0.69, "learning_rate": 5.084549911664348e-05, "loss": 2.2303, "step": 109616 }, { "epoch": 0.69, "learning_rate": 5.083935978580133e-05, "loss": 2.2423, "step": 109624 }, { "epoch": 0.69, "learning_rate": 5.083322068269373e-05, "loss": 2.2279, "step": 109632 }, { "epoch": 0.69, "learning_rate": 5.082708180747331e-05, "loss": 2.2372, "step": 109640 }, { "epoch": 0.69, "learning_rate": 5.082094316029264e-05, "loss": 2.2377, "step": 109648 }, { "epoch": 0.69, "learning_rate": 5.081480474130435e-05, "loss": 2.2499, "step": 109656 }, { "epoch": 0.69, "learning_rate": 5.080866655066105e-05, "loss": 2.2334, "step": 109664 }, { "epoch": 0.69, "learning_rate": 5.080252858851535e-05, "loss": 2.2371, "step": 109672 }, { "epoch": 0.69, "learning_rate": 5.079639085501979e-05, "loss": 2.2398, "step": 109680 }, { "epoch": 0.69, "learning_rate": 5.0790253350327e-05, "loss": 2.2412, "step": 109688 }, { "epoch": 0.69, "learning_rate": 5.078411607458957e-05, "loss": 2.2387, "step": 109696 }, { "epoch": 0.69, "learning_rate": 5.077797902796002e-05, "loss": 2.2398, "step": 109704 }, { "epoch": 0.69, "learning_rate": 5.0771842210590946e-05, "loss": 2.2519, "step": 109712 }, { "epoch": 0.69, "learning_rate": 5.076570562263489e-05, "loss": 2.2479, "step": 109720 }, { "epoch": 0.69, "learning_rate": 5.075956926424448e-05, "loss": 2.2433, "step": 109728 }, { "epoch": 0.69, "learning_rate": 5.0753433135572195e-05, "loss": 2.2297, "step": 109736 }, { "epoch": 0.69, "learning_rate": 5.0747297236770584e-05, "loss": 2.2227, "step": 109744 }, { "epoch": 0.69, "learning_rate": 5.0741161567992215e-05, "loss": 2.2436, "step": 109752 }, { "epoch": 0.69, "learning_rate": 5.073502612938961e-05, "loss": 2.2512, "step": 109760 }, { "epoch": 0.69, "learning_rate": 5.0728890921115276e-05, "loss": 2.2485, "step": 109768 }, { "epoch": 0.69, "learning_rate": 5.0722755943321774e-05, "loss": 2.2483, "step": 109776 }, { "epoch": 0.69, "learning_rate": 5.071662119616159e-05, "loss": 2.2467, "step": 109784 }, { "epoch": 0.69, "learning_rate": 5.071048667978724e-05, "loss": 2.239, "step": 109792 }, { "epoch": 0.69, "learning_rate": 5.070435239435125e-05, "loss": 2.2544, "step": 109800 }, { "epoch": 0.69, "learning_rate": 5.06982183400061e-05, "loss": 2.2384, "step": 109808 }, { "epoch": 0.69, "learning_rate": 5.069208451690428e-05, "loss": 2.2483, "step": 109816 }, { "epoch": 0.69, "learning_rate": 5.068595092519828e-05, "loss": 2.243, "step": 109824 }, { "epoch": 0.69, "learning_rate": 5.067981756504059e-05, "loss": 2.2459, "step": 109832 }, { "epoch": 0.69, "learning_rate": 5.067368443658367e-05, "loss": 2.2479, "step": 109840 }, { "epoch": 0.69, "learning_rate": 5.0667551539980016e-05, "loss": 2.2442, "step": 109848 }, { "epoch": 0.69, "learning_rate": 5.0661418875382074e-05, "loss": 2.2307, "step": 109856 }, { "epoch": 0.69, "learning_rate": 5.0655286442942305e-05, "loss": 2.2343, "step": 109864 }, { "epoch": 0.69, "learning_rate": 5.064915424281316e-05, "loss": 2.2421, "step": 109872 }, { "epoch": 0.69, "learning_rate": 5.0643022275147075e-05, "loss": 2.2466, "step": 109880 }, { "epoch": 0.69, "learning_rate": 5.063689054009655e-05, "loss": 2.2175, "step": 109888 }, { "epoch": 0.69, "learning_rate": 5.063075903781395e-05, "loss": 2.2506, "step": 109896 }, { "epoch": 0.69, "learning_rate": 5.062462776845172e-05, "loss": 2.2419, "step": 109904 }, { "epoch": 0.69, "learning_rate": 5.061849673216232e-05, "loss": 2.2356, "step": 109912 }, { "epoch": 0.69, "learning_rate": 5.061236592909813e-05, "loss": 2.2455, "step": 109920 }, { "epoch": 0.69, "learning_rate": 5.060623535941158e-05, "loss": 2.222, "step": 109928 }, { "epoch": 0.69, "learning_rate": 5.060010502325505e-05, "loss": 2.2406, "step": 109936 }, { "epoch": 0.69, "learning_rate": 5.0593974920780995e-05, "loss": 2.2374, "step": 109944 }, { "epoch": 0.69, "learning_rate": 5.058784505214177e-05, "loss": 2.2351, "step": 109952 }, { "epoch": 0.69, "learning_rate": 5.058171541748977e-05, "loss": 2.2619, "step": 109960 }, { "epoch": 0.69, "learning_rate": 5.0575586016977385e-05, "loss": 2.2312, "step": 109968 }, { "epoch": 0.69, "learning_rate": 5.056945685075698e-05, "loss": 2.25, "step": 109976 }, { "epoch": 0.69, "learning_rate": 5.0563327918980954e-05, "loss": 2.2467, "step": 109984 }, { "epoch": 0.69, "learning_rate": 5.0557199221801644e-05, "loss": 2.2486, "step": 109992 }, { "epoch": 0.69, "learning_rate": 5.055107075937142e-05, "loss": 2.2411, "step": 110000 }, { "epoch": 0.69, "learning_rate": 5.054494253184263e-05, "loss": 2.2351, "step": 110008 }, { "epoch": 0.69, "learning_rate": 5.053881453936763e-05, "loss": 2.2445, "step": 110016 }, { "epoch": 0.69, "learning_rate": 5.053268678209877e-05, "loss": 2.2243, "step": 110024 }, { "epoch": 0.69, "learning_rate": 5.052655926018839e-05, "loss": 2.2392, "step": 110032 }, { "epoch": 0.69, "learning_rate": 5.052043197378878e-05, "loss": 2.2394, "step": 110040 }, { "epoch": 0.69, "learning_rate": 5.0514304923052334e-05, "loss": 2.24, "step": 110048 }, { "epoch": 0.69, "learning_rate": 5.050817810813129e-05, "loss": 2.2396, "step": 110056 }, { "epoch": 0.69, "learning_rate": 5.050205152917802e-05, "loss": 2.241, "step": 110064 }, { "epoch": 0.69, "learning_rate": 5.049592518634483e-05, "loss": 2.2414, "step": 110072 }, { "epoch": 0.69, "learning_rate": 5.0489799079783995e-05, "loss": 2.2512, "step": 110080 }, { "epoch": 0.69, "learning_rate": 5.048367320964782e-05, "loss": 2.2517, "step": 110088 }, { "epoch": 0.69, "learning_rate": 5.047754757608858e-05, "loss": 2.2315, "step": 110096 }, { "epoch": 0.69, "learning_rate": 5.047142217925862e-05, "loss": 2.2499, "step": 110104 }, { "epoch": 0.69, "learning_rate": 5.046529701931013e-05, "loss": 2.2531, "step": 110112 }, { "epoch": 0.69, "learning_rate": 5.0459172096395436e-05, "loss": 2.249, "step": 110120 }, { "epoch": 0.69, "learning_rate": 5.045304741066682e-05, "loss": 2.223, "step": 110128 }, { "epoch": 0.69, "learning_rate": 5.044692296227649e-05, "loss": 2.2577, "step": 110136 }, { "epoch": 0.69, "learning_rate": 5.0440798751376725e-05, "loss": 2.2527, "step": 110144 }, { "epoch": 0.69, "learning_rate": 5.0434674778119786e-05, "loss": 2.2386, "step": 110152 }, { "epoch": 0.69, "learning_rate": 5.0428551042657914e-05, "loss": 2.2534, "step": 110160 }, { "epoch": 0.69, "learning_rate": 5.0422427545143324e-05, "loss": 2.2497, "step": 110168 }, { "epoch": 0.69, "learning_rate": 5.041630428572825e-05, "loss": 2.2382, "step": 110176 }, { "epoch": 0.69, "learning_rate": 5.041018126456496e-05, "loss": 2.2361, "step": 110184 }, { "epoch": 0.69, "learning_rate": 5.0404058481805614e-05, "loss": 2.2366, "step": 110192 }, { "epoch": 0.69, "learning_rate": 5.039793593760245e-05, "loss": 2.2461, "step": 110200 }, { "epoch": 0.69, "learning_rate": 5.03918136321077e-05, "loss": 2.2436, "step": 110208 }, { "epoch": 0.69, "learning_rate": 5.03856915654735e-05, "loss": 2.2542, "step": 110216 }, { "epoch": 0.69, "learning_rate": 5.037956973785212e-05, "loss": 2.251, "step": 110224 }, { "epoch": 0.69, "learning_rate": 5.0373448149395706e-05, "loss": 2.2448, "step": 110232 }, { "epoch": 0.69, "learning_rate": 5.036732680025644e-05, "loss": 2.2425, "step": 110240 }, { "epoch": 0.69, "learning_rate": 5.036120569058653e-05, "loss": 2.2443, "step": 110248 }, { "epoch": 0.69, "learning_rate": 5.035508482053812e-05, "loss": 2.2454, "step": 110256 }, { "epoch": 0.69, "learning_rate": 5.034896419026339e-05, "loss": 2.2516, "step": 110264 }, { "epoch": 0.69, "learning_rate": 5.0342843799914476e-05, "loss": 2.2495, "step": 110272 }, { "epoch": 0.69, "learning_rate": 5.0336723649643545e-05, "loss": 2.2466, "step": 110280 }, { "epoch": 0.69, "learning_rate": 5.0330603739602766e-05, "loss": 2.2373, "step": 110288 }, { "epoch": 0.69, "learning_rate": 5.032448406994428e-05, "loss": 2.2466, "step": 110296 }, { "epoch": 0.69, "learning_rate": 5.031836464082016e-05, "loss": 2.2342, "step": 110304 }, { "epoch": 0.69, "learning_rate": 5.03122454523826e-05, "loss": 2.2348, "step": 110312 }, { "epoch": 0.69, "learning_rate": 5.0306126504783736e-05, "loss": 2.2528, "step": 110320 }, { "epoch": 0.69, "learning_rate": 5.030000779817563e-05, "loss": 2.2636, "step": 110328 }, { "epoch": 0.69, "learning_rate": 5.02938893327104e-05, "loss": 2.2466, "step": 110336 }, { "epoch": 0.69, "learning_rate": 5.0287771108540195e-05, "loss": 2.2463, "step": 110344 }, { "epoch": 0.69, "learning_rate": 5.028165312581708e-05, "loss": 2.2441, "step": 110352 }, { "epoch": 0.69, "learning_rate": 5.0275535384693165e-05, "loss": 2.2562, "step": 110360 }, { "epoch": 0.69, "learning_rate": 5.026941788532053e-05, "loss": 2.253, "step": 110368 }, { "epoch": 0.69, "learning_rate": 5.026330062785125e-05, "loss": 2.2555, "step": 110376 }, { "epoch": 0.69, "learning_rate": 5.0257183612437405e-05, "loss": 2.2322, "step": 110384 }, { "epoch": 0.69, "learning_rate": 5.025106683923109e-05, "loss": 2.2359, "step": 110392 }, { "epoch": 0.69, "learning_rate": 5.024495030838434e-05, "loss": 2.2468, "step": 110400 }, { "epoch": 0.69, "learning_rate": 5.0238834020049206e-05, "loss": 2.2298, "step": 110408 }, { "epoch": 0.69, "learning_rate": 5.023271797437776e-05, "loss": 2.2458, "step": 110416 }, { "epoch": 0.69, "learning_rate": 5.022660217152204e-05, "loss": 2.2294, "step": 110424 }, { "epoch": 0.69, "learning_rate": 5.02204866116341e-05, "loss": 2.2345, "step": 110432 }, { "epoch": 0.69, "learning_rate": 5.0214371294865944e-05, "loss": 2.2585, "step": 110440 }, { "epoch": 0.69, "learning_rate": 5.020825622136962e-05, "loss": 2.222, "step": 110448 }, { "epoch": 0.69, "learning_rate": 5.0202141391297153e-05, "loss": 2.2288, "step": 110456 }, { "epoch": 0.69, "learning_rate": 5.019602680480053e-05, "loss": 2.2368, "step": 110464 }, { "epoch": 0.69, "learning_rate": 5.01899124620318e-05, "loss": 2.2483, "step": 110472 }, { "epoch": 0.69, "learning_rate": 5.0183798363142954e-05, "loss": 2.2516, "step": 110480 }, { "epoch": 0.69, "learning_rate": 5.0177684508285974e-05, "loss": 2.2443, "step": 110488 }, { "epoch": 0.69, "learning_rate": 5.017157089761284e-05, "loss": 2.2449, "step": 110496 }, { "epoch": 0.69, "learning_rate": 5.016545753127557e-05, "loss": 2.2382, "step": 110504 }, { "epoch": 0.69, "learning_rate": 5.0159344409426134e-05, "loss": 2.2574, "step": 110512 }, { "epoch": 0.69, "learning_rate": 5.0153231532216494e-05, "loss": 2.2289, "step": 110520 }, { "epoch": 0.69, "learning_rate": 5.0147118899798616e-05, "loss": 2.2462, "step": 110528 }, { "epoch": 0.69, "learning_rate": 5.014100651232449e-05, "loss": 2.247, "step": 110536 }, { "epoch": 0.69, "learning_rate": 5.013489436994603e-05, "loss": 2.2488, "step": 110544 }, { "epoch": 0.69, "learning_rate": 5.0128782472815205e-05, "loss": 2.2436, "step": 110552 }, { "epoch": 0.69, "learning_rate": 5.012267082108397e-05, "loss": 2.2419, "step": 110560 }, { "epoch": 0.69, "learning_rate": 5.011655941490423e-05, "loss": 2.258, "step": 110568 }, { "epoch": 0.69, "learning_rate": 5.011044825442793e-05, "loss": 2.253, "step": 110576 }, { "epoch": 0.69, "learning_rate": 5.010433733980701e-05, "loss": 2.2456, "step": 110584 }, { "epoch": 0.69, "learning_rate": 5.009822667119337e-05, "loss": 2.2591, "step": 110592 }, { "epoch": 0.69, "learning_rate": 5.009211624873891e-05, "loss": 2.2537, "step": 110600 }, { "epoch": 0.69, "learning_rate": 5.008600607259557e-05, "loss": 2.2444, "step": 110608 }, { "epoch": 0.69, "learning_rate": 5.007989614291523e-05, "loss": 2.2505, "step": 110616 }, { "epoch": 0.69, "learning_rate": 5.007378645984977e-05, "loss": 2.2457, "step": 110624 }, { "epoch": 0.69, "learning_rate": 5.0067677023551106e-05, "loss": 2.237, "step": 110632 }, { "epoch": 0.69, "learning_rate": 5.0061567834171096e-05, "loss": 2.2478, "step": 110640 }, { "epoch": 0.69, "learning_rate": 5.005545889186164e-05, "loss": 2.239, "step": 110648 }, { "epoch": 0.69, "learning_rate": 5.004935019677457e-05, "loss": 2.2475, "step": 110656 }, { "epoch": 0.69, "learning_rate": 5.0043241749061784e-05, "loss": 2.2508, "step": 110664 }, { "epoch": 0.69, "learning_rate": 5.003713354887514e-05, "loss": 2.2438, "step": 110672 }, { "epoch": 0.69, "learning_rate": 5.003102559636645e-05, "loss": 2.2417, "step": 110680 }, { "epoch": 0.69, "learning_rate": 5.0024917891687585e-05, "loss": 2.2504, "step": 110688 }, { "epoch": 0.69, "learning_rate": 5.001881043499039e-05, "loss": 2.2594, "step": 110696 }, { "epoch": 0.69, "learning_rate": 5.001270322642669e-05, "loss": 2.2296, "step": 110704 }, { "epoch": 0.69, "learning_rate": 5.0006596266148295e-05, "loss": 2.2494, "step": 110712 }, { "epoch": 0.69, "learning_rate": 5.000048955430703e-05, "loss": 2.2293, "step": 110720 }, { "epoch": 0.69, "learning_rate": 4.999438309105475e-05, "loss": 2.2431, "step": 110728 }, { "epoch": 0.69, "learning_rate": 4.9988276876543214e-05, "loss": 2.249, "step": 110736 }, { "epoch": 0.69, "learning_rate": 4.998217091092422e-05, "loss": 2.239, "step": 110744 }, { "epoch": 0.69, "learning_rate": 4.997606519434961e-05, "loss": 2.2405, "step": 110752 }, { "epoch": 0.69, "learning_rate": 4.996995972697113e-05, "loss": 2.2425, "step": 110760 }, { "epoch": 0.69, "learning_rate": 4.9963854508940565e-05, "loss": 2.2514, "step": 110768 }, { "epoch": 0.69, "learning_rate": 4.99577495404097e-05, "loss": 2.2447, "step": 110776 }, { "epoch": 0.69, "learning_rate": 4.995164482153034e-05, "loss": 2.2379, "step": 110784 }, { "epoch": 0.69, "learning_rate": 4.99455403524542e-05, "loss": 2.2483, "step": 110792 }, { "epoch": 0.69, "learning_rate": 4.993943613333305e-05, "loss": 2.2136, "step": 110800 }, { "epoch": 0.69, "learning_rate": 4.993333216431866e-05, "loss": 2.2412, "step": 110808 }, { "epoch": 0.69, "learning_rate": 4.9927228445562744e-05, "loss": 2.2345, "step": 110816 }, { "epoch": 0.69, "learning_rate": 4.9921124977217064e-05, "loss": 2.2569, "step": 110824 }, { "epoch": 0.69, "learning_rate": 4.991502175943336e-05, "loss": 2.2343, "step": 110832 }, { "epoch": 0.69, "learning_rate": 4.9908918792363335e-05, "loss": 2.2472, "step": 110840 }, { "epoch": 0.69, "learning_rate": 4.990281607615872e-05, "loss": 2.2344, "step": 110848 }, { "epoch": 0.69, "learning_rate": 4.989671361097123e-05, "loss": 2.2304, "step": 110856 }, { "epoch": 0.69, "learning_rate": 4.989061139695258e-05, "loss": 2.2386, "step": 110864 }, { "epoch": 0.69, "learning_rate": 4.9884509434254464e-05, "loss": 2.2461, "step": 110872 }, { "epoch": 0.69, "learning_rate": 4.987840772302857e-05, "loss": 2.2413, "step": 110880 }, { "epoch": 0.69, "learning_rate": 4.987230626342662e-05, "loss": 2.2426, "step": 110888 }, { "epoch": 0.69, "learning_rate": 4.986620505560024e-05, "loss": 2.2354, "step": 110896 }, { "epoch": 0.69, "learning_rate": 4.986010409970115e-05, "loss": 2.2422, "step": 110904 }, { "epoch": 0.69, "learning_rate": 4.985400339588103e-05, "loss": 2.2433, "step": 110912 }, { "epoch": 0.69, "learning_rate": 4.98479029442915e-05, "loss": 2.2198, "step": 110920 }, { "epoch": 0.69, "learning_rate": 4.9841802745084245e-05, "loss": 2.25, "step": 110928 }, { "epoch": 0.69, "learning_rate": 4.983570279841092e-05, "loss": 2.2316, "step": 110936 }, { "epoch": 0.69, "learning_rate": 4.9829603104423173e-05, "loss": 2.2477, "step": 110944 }, { "epoch": 0.69, "learning_rate": 4.982350366327262e-05, "loss": 2.2489, "step": 110952 }, { "epoch": 0.69, "learning_rate": 4.9817404475110896e-05, "loss": 2.2348, "step": 110960 }, { "epoch": 0.69, "learning_rate": 4.981130554008966e-05, "loss": 2.2505, "step": 110968 }, { "epoch": 0.69, "learning_rate": 4.980520685836051e-05, "loss": 2.2339, "step": 110976 }, { "epoch": 0.69, "learning_rate": 4.9799108430075054e-05, "loss": 2.2421, "step": 110984 }, { "epoch": 0.69, "learning_rate": 4.97930102553849e-05, "loss": 2.2417, "step": 110992 }, { "epoch": 0.69, "learning_rate": 4.9786912334441685e-05, "loss": 2.2277, "step": 111000 }, { "epoch": 0.69, "learning_rate": 4.9780814667396945e-05, "loss": 2.2452, "step": 111008 }, { "epoch": 0.69, "learning_rate": 4.97747172544023e-05, "loss": 2.2373, "step": 111016 }, { "epoch": 0.69, "learning_rate": 4.976862009560935e-05, "loss": 2.2485, "step": 111024 }, { "epoch": 0.69, "learning_rate": 4.9762523191169644e-05, "loss": 2.2458, "step": 111032 }, { "epoch": 0.69, "learning_rate": 4.9756426541234756e-05, "loss": 2.2357, "step": 111040 }, { "epoch": 0.69, "learning_rate": 4.9750330145956265e-05, "loss": 2.2588, "step": 111048 }, { "epoch": 0.69, "learning_rate": 4.974423400548571e-05, "loss": 2.2373, "step": 111056 }, { "epoch": 0.69, "learning_rate": 4.9738138119974636e-05, "loss": 2.2319, "step": 111064 }, { "epoch": 0.69, "learning_rate": 4.9732042489574614e-05, "loss": 2.2321, "step": 111072 }, { "epoch": 0.69, "learning_rate": 4.9725947114437166e-05, "loss": 2.2416, "step": 111080 }, { "epoch": 0.69, "learning_rate": 4.971985199471382e-05, "loss": 2.2471, "step": 111088 }, { "epoch": 0.69, "learning_rate": 4.97137571305561e-05, "loss": 2.2404, "step": 111096 }, { "epoch": 0.69, "learning_rate": 4.970766252211556e-05, "loss": 2.2333, "step": 111104 }, { "epoch": 0.69, "learning_rate": 4.970156816954366e-05, "loss": 2.2383, "step": 111112 }, { "epoch": 0.69, "learning_rate": 4.9695474072991934e-05, "loss": 2.243, "step": 111120 }, { "epoch": 0.69, "learning_rate": 4.968938023261188e-05, "loss": 2.232, "step": 111128 }, { "epoch": 0.69, "learning_rate": 4.968328664855501e-05, "loss": 2.2548, "step": 111136 }, { "epoch": 0.69, "learning_rate": 4.967719332097276e-05, "loss": 2.2474, "step": 111144 }, { "epoch": 0.69, "learning_rate": 4.9671100250016655e-05, "loss": 2.2509, "step": 111152 }, { "epoch": 0.69, "learning_rate": 4.966500743583817e-05, "loss": 2.2359, "step": 111160 }, { "epoch": 0.69, "learning_rate": 4.9658914878588744e-05, "loss": 2.2493, "step": 111168 }, { "epoch": 0.69, "learning_rate": 4.9652822578419853e-05, "loss": 2.2416, "step": 111176 }, { "epoch": 0.69, "learning_rate": 4.964673053548297e-05, "loss": 2.2335, "step": 111184 }, { "epoch": 0.69, "learning_rate": 4.9640638749929515e-05, "loss": 2.2377, "step": 111192 }, { "epoch": 0.69, "learning_rate": 4.9634547221910946e-05, "loss": 2.2161, "step": 111200 }, { "epoch": 0.7, "learning_rate": 4.9628455951578685e-05, "loss": 2.2277, "step": 111208 }, { "epoch": 0.7, "learning_rate": 4.962236493908419e-05, "loss": 2.2536, "step": 111216 }, { "epoch": 0.7, "learning_rate": 4.961627418457886e-05, "loss": 2.2372, "step": 111224 }, { "epoch": 0.7, "learning_rate": 4.961018368821411e-05, "loss": 2.2548, "step": 111232 }, { "epoch": 0.7, "learning_rate": 4.960409345014137e-05, "loss": 2.244, "step": 111240 }, { "epoch": 0.7, "learning_rate": 4.9598003470512027e-05, "loss": 2.2403, "step": 111248 }, { "epoch": 0.7, "learning_rate": 4.9591913749477484e-05, "loss": 2.2403, "step": 111256 }, { "epoch": 0.7, "learning_rate": 4.9585824287189144e-05, "loss": 2.2535, "step": 111264 }, { "epoch": 0.7, "learning_rate": 4.957973508379837e-05, "loss": 2.2478, "step": 111272 }, { "epoch": 0.7, "learning_rate": 4.9573646139456556e-05, "loss": 2.227, "step": 111280 }, { "epoch": 0.7, "learning_rate": 4.9567557454315065e-05, "loss": 2.2244, "step": 111288 }, { "epoch": 0.7, "learning_rate": 4.956146902852527e-05, "loss": 2.2265, "step": 111296 }, { "epoch": 0.7, "learning_rate": 4.955538086223852e-05, "loss": 2.2369, "step": 111304 }, { "epoch": 0.7, "learning_rate": 4.954929295560618e-05, "loss": 2.2461, "step": 111312 }, { "epoch": 0.7, "learning_rate": 4.95432053087796e-05, "loss": 2.2331, "step": 111320 }, { "epoch": 0.7, "learning_rate": 4.953711792191009e-05, "loss": 2.2333, "step": 111328 }, { "epoch": 0.7, "learning_rate": 4.9531030795149e-05, "loss": 2.2499, "step": 111336 }, { "epoch": 0.7, "learning_rate": 4.9524943928647663e-05, "loss": 2.247, "step": 111344 }, { "epoch": 0.7, "learning_rate": 4.9518857322557424e-05, "loss": 2.2236, "step": 111352 }, { "epoch": 0.7, "learning_rate": 4.9512770977029536e-05, "loss": 2.2319, "step": 111360 }, { "epoch": 0.7, "learning_rate": 4.9506684892215346e-05, "loss": 2.2182, "step": 111368 }, { "epoch": 0.7, "learning_rate": 4.9500599068266155e-05, "loss": 2.2415, "step": 111376 }, { "epoch": 0.7, "learning_rate": 4.949451350533324e-05, "loss": 2.2534, "step": 111384 }, { "epoch": 0.7, "learning_rate": 4.948842820356789e-05, "loss": 2.2381, "step": 111392 }, { "epoch": 0.7, "learning_rate": 4.948234316312141e-05, "loss": 2.2186, "step": 111400 }, { "epoch": 0.7, "learning_rate": 4.947625838414506e-05, "loss": 2.2254, "step": 111408 }, { "epoch": 0.7, "learning_rate": 4.947017386679009e-05, "loss": 2.2459, "step": 111416 }, { "epoch": 0.7, "learning_rate": 4.946408961120779e-05, "loss": 2.2477, "step": 111424 }, { "epoch": 0.7, "learning_rate": 4.945800561754941e-05, "loss": 2.2292, "step": 111432 }, { "epoch": 0.7, "learning_rate": 4.9451921885966184e-05, "loss": 2.2427, "step": 111440 }, { "epoch": 0.7, "learning_rate": 4.944583841660937e-05, "loss": 2.2378, "step": 111448 }, { "epoch": 0.7, "learning_rate": 4.9439755209630196e-05, "loss": 2.2292, "step": 111456 }, { "epoch": 0.7, "learning_rate": 4.9433672265179884e-05, "loss": 2.2436, "step": 111464 }, { "epoch": 0.7, "learning_rate": 4.9427589583409674e-05, "loss": 2.2393, "step": 111472 }, { "epoch": 0.7, "learning_rate": 4.942150716447076e-05, "loss": 2.2381, "step": 111480 }, { "epoch": 0.7, "learning_rate": 4.9415425008514385e-05, "loss": 2.2245, "step": 111488 }, { "epoch": 0.7, "learning_rate": 4.940934311569172e-05, "loss": 2.2528, "step": 111496 }, { "epoch": 0.7, "learning_rate": 4.9403261486153966e-05, "loss": 2.2387, "step": 111504 }, { "epoch": 0.7, "learning_rate": 4.9397180120052345e-05, "loss": 2.245, "step": 111512 }, { "epoch": 0.7, "learning_rate": 4.939109901753799e-05, "loss": 2.2375, "step": 111520 }, { "epoch": 0.7, "learning_rate": 4.938501817876211e-05, "loss": 2.2598, "step": 111528 }, { "epoch": 0.7, "learning_rate": 4.937893760387589e-05, "loss": 2.2504, "step": 111536 }, { "epoch": 0.7, "learning_rate": 4.937285729303045e-05, "loss": 2.2354, "step": 111544 }, { "epoch": 0.7, "learning_rate": 4.936677724637697e-05, "loss": 2.2452, "step": 111552 }, { "epoch": 0.7, "learning_rate": 4.93606974640666e-05, "loss": 2.2374, "step": 111560 }, { "epoch": 0.7, "learning_rate": 4.935461794625051e-05, "loss": 2.2466, "step": 111568 }, { "epoch": 0.7, "learning_rate": 4.9348538693079784e-05, "loss": 2.2473, "step": 111576 }, { "epoch": 0.7, "learning_rate": 4.9342459704705586e-05, "loss": 2.2582, "step": 111584 }, { "epoch": 0.7, "learning_rate": 4.933638098127905e-05, "loss": 2.2432, "step": 111592 }, { "epoch": 0.7, "learning_rate": 4.9330302522951274e-05, "loss": 2.2404, "step": 111600 }, { "epoch": 0.7, "learning_rate": 4.932422432987336e-05, "loss": 2.2429, "step": 111608 }, { "epoch": 0.7, "learning_rate": 4.931814640219644e-05, "loss": 2.2491, "step": 111616 }, { "epoch": 0.7, "learning_rate": 4.9312068740071596e-05, "loss": 2.2417, "step": 111624 }, { "epoch": 0.7, "learning_rate": 4.930599134364992e-05, "loss": 2.2216, "step": 111632 }, { "epoch": 0.7, "learning_rate": 4.92999142130825e-05, "loss": 2.2511, "step": 111640 }, { "epoch": 0.7, "learning_rate": 4.9293837348520414e-05, "loss": 2.235, "step": 111648 }, { "epoch": 0.7, "learning_rate": 4.928776075011473e-05, "loss": 2.2393, "step": 111656 }, { "epoch": 0.7, "learning_rate": 4.928168441801652e-05, "loss": 2.2621, "step": 111664 }, { "epoch": 0.7, "learning_rate": 4.927560835237685e-05, "loss": 2.2513, "step": 111672 }, { "epoch": 0.7, "learning_rate": 4.926953255334674e-05, "loss": 2.2542, "step": 111680 }, { "epoch": 0.7, "learning_rate": 4.926345702107725e-05, "loss": 2.244, "step": 111688 }, { "epoch": 0.7, "learning_rate": 4.9257381755719436e-05, "loss": 2.2561, "step": 111696 }, { "epoch": 0.7, "learning_rate": 4.925130675742431e-05, "loss": 2.2299, "step": 111704 }, { "epoch": 0.7, "learning_rate": 4.9245232026342916e-05, "loss": 2.23, "step": 111712 }, { "epoch": 0.7, "learning_rate": 4.923915756262625e-05, "loss": 2.2497, "step": 111720 }, { "epoch": 0.7, "learning_rate": 4.923308336642535e-05, "loss": 2.2485, "step": 111728 }, { "epoch": 0.7, "learning_rate": 4.922700943789118e-05, "loss": 2.2458, "step": 111736 }, { "epoch": 0.7, "learning_rate": 4.9220935777174776e-05, "loss": 2.2267, "step": 111744 }, { "epoch": 0.7, "learning_rate": 4.9214862384427134e-05, "loss": 2.2252, "step": 111752 }, { "epoch": 0.7, "learning_rate": 4.920878925979921e-05, "loss": 2.2479, "step": 111760 }, { "epoch": 0.7, "learning_rate": 4.920271640344198e-05, "loss": 2.2453, "step": 111768 }, { "epoch": 0.7, "learning_rate": 4.9196643815506435e-05, "loss": 2.2399, "step": 111776 }, { "epoch": 0.7, "learning_rate": 4.919057149614357e-05, "loss": 2.2408, "step": 111784 }, { "epoch": 0.7, "learning_rate": 4.9184499445504284e-05, "loss": 2.2467, "step": 111792 }, { "epoch": 0.7, "learning_rate": 4.917842766373955e-05, "loss": 2.2616, "step": 111800 }, { "epoch": 0.7, "learning_rate": 4.917235615100034e-05, "loss": 2.2413, "step": 111808 }, { "epoch": 0.7, "learning_rate": 4.916628490743756e-05, "loss": 2.226, "step": 111816 }, { "epoch": 0.7, "learning_rate": 4.9160213933202144e-05, "loss": 2.2451, "step": 111824 }, { "epoch": 0.7, "learning_rate": 4.9154143228445025e-05, "loss": 2.2461, "step": 111832 }, { "epoch": 0.7, "learning_rate": 4.914807279331715e-05, "loss": 2.2455, "step": 111840 }, { "epoch": 0.7, "learning_rate": 4.9142002627969373e-05, "loss": 2.2265, "step": 111848 }, { "epoch": 0.7, "learning_rate": 4.9135932732552635e-05, "loss": 2.2452, "step": 111856 }, { "epoch": 0.7, "learning_rate": 4.912986310721784e-05, "loss": 2.2543, "step": 111864 }, { "epoch": 0.7, "learning_rate": 4.912379375211585e-05, "loss": 2.2351, "step": 111872 }, { "epoch": 0.7, "learning_rate": 4.911772466739758e-05, "loss": 2.2316, "step": 111880 }, { "epoch": 0.7, "learning_rate": 4.91116558532139e-05, "loss": 2.2515, "step": 111888 }, { "epoch": 0.7, "learning_rate": 4.910558730971567e-05, "loss": 2.2552, "step": 111896 }, { "epoch": 0.7, "learning_rate": 4.909951903705376e-05, "loss": 2.2575, "step": 111904 }, { "epoch": 0.7, "learning_rate": 4.909345103537903e-05, "loss": 2.2638, "step": 111912 }, { "epoch": 0.7, "learning_rate": 4.908738330484234e-05, "loss": 2.245, "step": 111920 }, { "epoch": 0.7, "learning_rate": 4.908131584559451e-05, "loss": 2.2562, "step": 111928 }, { "epoch": 0.7, "learning_rate": 4.90752486577864e-05, "loss": 2.2279, "step": 111936 }, { "epoch": 0.7, "learning_rate": 4.906918174156885e-05, "loss": 2.2458, "step": 111944 }, { "epoch": 0.7, "learning_rate": 4.9063115097092645e-05, "loss": 2.2338, "step": 111952 }, { "epoch": 0.7, "learning_rate": 4.905704872450863e-05, "loss": 2.2579, "step": 111960 }, { "epoch": 0.7, "learning_rate": 4.905098262396763e-05, "loss": 2.2262, "step": 111968 }, { "epoch": 0.7, "learning_rate": 4.904491679562042e-05, "loss": 2.2398, "step": 111976 }, { "epoch": 0.7, "learning_rate": 4.903885123961779e-05, "loss": 2.2363, "step": 111984 }, { "epoch": 0.7, "learning_rate": 4.903278595611056e-05, "loss": 2.2466, "step": 111992 }, { "epoch": 0.7, "learning_rate": 4.902672094524952e-05, "loss": 2.2316, "step": 112000 }, { "epoch": 0.7, "learning_rate": 4.902065620718541e-05, "loss": 2.2531, "step": 112008 }, { "epoch": 0.7, "learning_rate": 4.9014591742069016e-05, "loss": 2.2436, "step": 112016 }, { "epoch": 0.7, "learning_rate": 4.900852755005111e-05, "loss": 2.2535, "step": 112024 }, { "epoch": 0.7, "learning_rate": 4.9002463631282444e-05, "loss": 2.2502, "step": 112032 }, { "epoch": 0.7, "learning_rate": 4.899639998591376e-05, "loss": 2.2305, "step": 112040 }, { "epoch": 0.7, "learning_rate": 4.89903366140958e-05, "loss": 2.2427, "step": 112048 }, { "epoch": 0.7, "learning_rate": 4.8984273515979326e-05, "loss": 2.2603, "step": 112056 }, { "epoch": 0.7, "learning_rate": 4.897821069171504e-05, "loss": 2.2485, "step": 112064 }, { "epoch": 0.7, "learning_rate": 4.8972148141453665e-05, "loss": 2.2286, "step": 112072 }, { "epoch": 0.7, "learning_rate": 4.8966085865345946e-05, "loss": 2.2404, "step": 112080 }, { "epoch": 0.7, "learning_rate": 4.896002386354255e-05, "loss": 2.2517, "step": 112088 }, { "epoch": 0.7, "learning_rate": 4.8953962136194206e-05, "loss": 2.2523, "step": 112096 }, { "epoch": 0.7, "learning_rate": 4.8947900683451606e-05, "loss": 2.2352, "step": 112104 }, { "epoch": 0.7, "learning_rate": 4.894183950546543e-05, "loss": 2.2541, "step": 112112 }, { "epoch": 0.7, "learning_rate": 4.893577860238636e-05, "loss": 2.2438, "step": 112120 }, { "epoch": 0.7, "learning_rate": 4.892971797436507e-05, "loss": 2.2396, "step": 112128 }, { "epoch": 0.7, "learning_rate": 4.892365762155226e-05, "loss": 2.2645, "step": 112136 }, { "epoch": 0.7, "learning_rate": 4.8917597544098545e-05, "loss": 2.2509, "step": 112144 }, { "epoch": 0.7, "learning_rate": 4.89115377421546e-05, "loss": 2.2574, "step": 112152 }, { "epoch": 0.7, "learning_rate": 4.8905478215871084e-05, "loss": 2.231, "step": 112160 }, { "epoch": 0.7, "learning_rate": 4.88994189653986e-05, "loss": 2.2372, "step": 112168 }, { "epoch": 0.7, "learning_rate": 4.889335999088782e-05, "loss": 2.2219, "step": 112176 }, { "epoch": 0.7, "learning_rate": 4.888730129248935e-05, "loss": 2.2281, "step": 112184 }, { "epoch": 0.7, "learning_rate": 4.888124287035384e-05, "loss": 2.2266, "step": 112192 }, { "epoch": 0.7, "learning_rate": 4.887518472463186e-05, "loss": 2.2497, "step": 112200 }, { "epoch": 0.7, "learning_rate": 4.8869126855474024e-05, "loss": 2.2431, "step": 112208 }, { "epoch": 0.7, "learning_rate": 4.886306926303097e-05, "loss": 2.2449, "step": 112216 }, { "epoch": 0.7, "learning_rate": 4.885701194745325e-05, "loss": 2.2442, "step": 112224 }, { "epoch": 0.7, "learning_rate": 4.885095490889146e-05, "loss": 2.2368, "step": 112232 }, { "epoch": 0.7, "learning_rate": 4.88448981474962e-05, "loss": 2.2518, "step": 112240 }, { "epoch": 0.7, "learning_rate": 4.8838841663418006e-05, "loss": 2.2379, "step": 112248 }, { "epoch": 0.7, "learning_rate": 4.883278545680746e-05, "loss": 2.2559, "step": 112256 }, { "epoch": 0.7, "learning_rate": 4.882672952781512e-05, "loss": 2.247, "step": 112264 }, { "epoch": 0.7, "learning_rate": 4.882067387659155e-05, "loss": 2.2455, "step": 112272 }, { "epoch": 0.7, "learning_rate": 4.8814618503287266e-05, "loss": 2.2627, "step": 112280 }, { "epoch": 0.7, "learning_rate": 4.8808563408052834e-05, "loss": 2.2468, "step": 112288 }, { "epoch": 0.7, "learning_rate": 4.880250859103877e-05, "loss": 2.2512, "step": 112296 }, { "epoch": 0.7, "learning_rate": 4.879645405239559e-05, "loss": 2.2584, "step": 112304 }, { "epoch": 0.7, "learning_rate": 4.879039979227382e-05, "loss": 2.2619, "step": 112312 }, { "epoch": 0.7, "learning_rate": 4.8784345810823986e-05, "loss": 2.242, "step": 112320 }, { "epoch": 0.7, "learning_rate": 4.877829210819656e-05, "loss": 2.2358, "step": 112328 }, { "epoch": 0.7, "learning_rate": 4.877223868454205e-05, "loss": 2.2388, "step": 112336 }, { "epoch": 0.7, "learning_rate": 4.876618554001094e-05, "loss": 2.2512, "step": 112344 }, { "epoch": 0.7, "learning_rate": 4.876013267475373e-05, "loss": 2.2589, "step": 112352 }, { "epoch": 0.7, "learning_rate": 4.8754080088920875e-05, "loss": 2.2425, "step": 112360 }, { "epoch": 0.7, "learning_rate": 4.874802778266285e-05, "loss": 2.2406, "step": 112368 }, { "epoch": 0.7, "learning_rate": 4.8741975756130144e-05, "loss": 2.2452, "step": 112376 }, { "epoch": 0.7, "learning_rate": 4.8735924009473157e-05, "loss": 2.2527, "step": 112384 }, { "epoch": 0.7, "learning_rate": 4.8729872542842354e-05, "loss": 2.2557, "step": 112392 }, { "epoch": 0.7, "learning_rate": 4.87238213563882e-05, "loss": 2.2513, "step": 112400 }, { "epoch": 0.7, "learning_rate": 4.871777045026112e-05, "loss": 2.244, "step": 112408 }, { "epoch": 0.7, "learning_rate": 4.871171982461152e-05, "loss": 2.2614, "step": 112416 }, { "epoch": 0.7, "learning_rate": 4.870566947958982e-05, "loss": 2.2414, "step": 112424 }, { "epoch": 0.7, "learning_rate": 4.869961941534647e-05, "loss": 2.2573, "step": 112432 }, { "epoch": 0.7, "learning_rate": 4.869356963203184e-05, "loss": 2.2417, "step": 112440 }, { "epoch": 0.7, "learning_rate": 4.8687520129796326e-05, "loss": 2.2339, "step": 112448 }, { "epoch": 0.7, "learning_rate": 4.868147090879035e-05, "loss": 2.225, "step": 112456 }, { "epoch": 0.7, "learning_rate": 4.867542196916426e-05, "loss": 2.2359, "step": 112464 }, { "epoch": 0.7, "learning_rate": 4.866937331106846e-05, "loss": 2.2574, "step": 112472 }, { "epoch": 0.7, "learning_rate": 4.86633249346533e-05, "loss": 2.2507, "step": 112480 }, { "epoch": 0.7, "learning_rate": 4.8657276840069164e-05, "loss": 2.2243, "step": 112488 }, { "epoch": 0.7, "learning_rate": 4.86512290274664e-05, "loss": 2.2345, "step": 112496 }, { "epoch": 0.7, "learning_rate": 4.864518149699534e-05, "loss": 2.2474, "step": 112504 }, { "epoch": 0.7, "learning_rate": 4.863913424880636e-05, "loss": 2.2312, "step": 112512 }, { "epoch": 0.7, "learning_rate": 4.863308728304977e-05, "loss": 2.2416, "step": 112520 }, { "epoch": 0.7, "learning_rate": 4.8627040599875906e-05, "loss": 2.2512, "step": 112528 }, { "epoch": 0.7, "learning_rate": 4.862099419943509e-05, "loss": 2.2484, "step": 112536 }, { "epoch": 0.7, "learning_rate": 4.861494808187764e-05, "loss": 2.2377, "step": 112544 }, { "epoch": 0.7, "learning_rate": 4.860890224735384e-05, "loss": 2.2418, "step": 112552 }, { "epoch": 0.7, "learning_rate": 4.860285669601402e-05, "loss": 2.2425, "step": 112560 }, { "epoch": 0.7, "learning_rate": 4.859681142800848e-05, "loss": 2.2428, "step": 112568 }, { "epoch": 0.7, "learning_rate": 4.859076644348745e-05, "loss": 2.2458, "step": 112576 }, { "epoch": 0.7, "learning_rate": 4.8584721742601266e-05, "loss": 2.2401, "step": 112584 }, { "epoch": 0.7, "learning_rate": 4.857867732550019e-05, "loss": 2.2299, "step": 112592 }, { "epoch": 0.7, "learning_rate": 4.857263319233447e-05, "loss": 2.2259, "step": 112600 }, { "epoch": 0.7, "learning_rate": 4.8566589343254356e-05, "loss": 2.2388, "step": 112608 }, { "epoch": 0.7, "learning_rate": 4.856054577841012e-05, "loss": 2.2287, "step": 112616 }, { "epoch": 0.7, "learning_rate": 4.855450249795202e-05, "loss": 2.2298, "step": 112624 }, { "epoch": 0.7, "learning_rate": 4.8548459502030254e-05, "loss": 2.2305, "step": 112632 }, { "epoch": 0.7, "learning_rate": 4.854241679079506e-05, "loss": 2.2384, "step": 112640 }, { "epoch": 0.7, "learning_rate": 4.85363743643967e-05, "loss": 2.2395, "step": 112648 }, { "epoch": 0.7, "learning_rate": 4.853033222298534e-05, "loss": 2.2234, "step": 112656 }, { "epoch": 0.7, "learning_rate": 4.85242903667112e-05, "loss": 2.2448, "step": 112664 }, { "epoch": 0.7, "learning_rate": 4.8518248795724486e-05, "loss": 2.25, "step": 112672 }, { "epoch": 0.7, "learning_rate": 4.8512207510175424e-05, "loss": 2.2387, "step": 112680 }, { "epoch": 0.7, "learning_rate": 4.850616651021416e-05, "loss": 2.2671, "step": 112688 }, { "epoch": 0.7, "learning_rate": 4.850012579599087e-05, "loss": 2.2231, "step": 112696 }, { "epoch": 0.7, "learning_rate": 4.849408536765577e-05, "loss": 2.2384, "step": 112704 }, { "epoch": 0.7, "learning_rate": 4.8488045225358974e-05, "loss": 2.2421, "step": 112712 }, { "epoch": 0.7, "learning_rate": 4.848200536925067e-05, "loss": 2.2411, "step": 112720 }, { "epoch": 0.7, "learning_rate": 4.847596579948102e-05, "loss": 2.2222, "step": 112728 }, { "epoch": 0.7, "learning_rate": 4.846992651620014e-05, "loss": 2.2319, "step": 112736 }, { "epoch": 0.7, "learning_rate": 4.8463887519558185e-05, "loss": 2.2396, "step": 112744 }, { "epoch": 0.7, "learning_rate": 4.8457848809705276e-05, "loss": 2.2443, "step": 112752 }, { "epoch": 0.7, "learning_rate": 4.845181038679155e-05, "loss": 2.2278, "step": 112760 }, { "epoch": 0.7, "learning_rate": 4.84457722509671e-05, "loss": 2.2418, "step": 112768 }, { "epoch": 0.7, "learning_rate": 4.8439734402382056e-05, "loss": 2.2341, "step": 112776 }, { "epoch": 0.7, "learning_rate": 4.843369684118652e-05, "loss": 2.2359, "step": 112784 }, { "epoch": 0.7, "learning_rate": 4.842765956753056e-05, "loss": 2.2362, "step": 112792 }, { "epoch": 0.7, "learning_rate": 4.842162258156429e-05, "loss": 2.2475, "step": 112800 }, { "epoch": 0.71, "learning_rate": 4.8415585883437797e-05, "loss": 2.2196, "step": 112808 }, { "epoch": 0.71, "learning_rate": 4.840954947330112e-05, "loss": 2.2389, "step": 112816 }, { "epoch": 0.71, "learning_rate": 4.8403513351304334e-05, "loss": 2.2313, "step": 112824 }, { "epoch": 0.71, "learning_rate": 4.839747751759752e-05, "loss": 2.2369, "step": 112832 }, { "epoch": 0.71, "learning_rate": 4.8391441972330734e-05, "loss": 2.2392, "step": 112840 }, { "epoch": 0.71, "learning_rate": 4.8385406715653986e-05, "loss": 2.2433, "step": 112848 }, { "epoch": 0.71, "learning_rate": 4.837937174771732e-05, "loss": 2.2369, "step": 112856 }, { "epoch": 0.71, "learning_rate": 4.83733370686708e-05, "loss": 2.2353, "step": 112864 }, { "epoch": 0.71, "learning_rate": 4.8367302678664406e-05, "loss": 2.2451, "step": 112872 }, { "epoch": 0.71, "learning_rate": 4.836126857784818e-05, "loss": 2.2288, "step": 112880 }, { "epoch": 0.71, "learning_rate": 4.8355234766372114e-05, "loss": 2.2415, "step": 112888 }, { "epoch": 0.71, "learning_rate": 4.834920124438624e-05, "loss": 2.2288, "step": 112896 }, { "epoch": 0.71, "learning_rate": 4.8343168012040506e-05, "loss": 2.2438, "step": 112904 }, { "epoch": 0.71, "learning_rate": 4.8337135069484936e-05, "loss": 2.2432, "step": 112912 }, { "epoch": 0.71, "learning_rate": 4.8331102416869495e-05, "loss": 2.2452, "step": 112920 }, { "epoch": 0.71, "learning_rate": 4.832507005434416e-05, "loss": 2.2388, "step": 112928 }, { "epoch": 0.71, "learning_rate": 4.831903798205888e-05, "loss": 2.242, "step": 112936 }, { "epoch": 0.71, "learning_rate": 4.831300620016364e-05, "loss": 2.2266, "step": 112944 }, { "epoch": 0.71, "learning_rate": 4.830697470880837e-05, "loss": 2.2507, "step": 112952 }, { "epoch": 0.71, "learning_rate": 4.830094350814303e-05, "loss": 2.2451, "step": 112960 }, { "epoch": 0.71, "learning_rate": 4.8294912598317535e-05, "loss": 2.2442, "step": 112968 }, { "epoch": 0.71, "learning_rate": 4.8288881979481835e-05, "loss": 2.2541, "step": 112976 }, { "epoch": 0.71, "learning_rate": 4.828285165178583e-05, "loss": 2.2463, "step": 112984 }, { "epoch": 0.71, "learning_rate": 4.827682161537946e-05, "loss": 2.2374, "step": 112992 }, { "epoch": 0.71, "learning_rate": 4.8270791870412636e-05, "loss": 2.2455, "step": 113000 }, { "epoch": 0.71, "learning_rate": 4.826476241703521e-05, "loss": 2.2429, "step": 113008 }, { "epoch": 0.71, "learning_rate": 4.825873325539711e-05, "loss": 2.2604, "step": 113016 }, { "epoch": 0.71, "learning_rate": 4.825270438564823e-05, "loss": 2.2603, "step": 113024 }, { "epoch": 0.71, "learning_rate": 4.824667580793845e-05, "loss": 2.243, "step": 113032 }, { "epoch": 0.71, "learning_rate": 4.8240647522417615e-05, "loss": 2.2571, "step": 113040 }, { "epoch": 0.71, "learning_rate": 4.823461952923558e-05, "loss": 2.2544, "step": 113048 }, { "epoch": 0.71, "learning_rate": 4.822859182854227e-05, "loss": 2.2413, "step": 113056 }, { "epoch": 0.71, "learning_rate": 4.822256442048745e-05, "loss": 2.24, "step": 113064 }, { "epoch": 0.71, "learning_rate": 4.8216537305221014e-05, "loss": 2.2469, "step": 113072 }, { "epoch": 0.71, "learning_rate": 4.821051048289278e-05, "loss": 2.2407, "step": 113080 }, { "epoch": 0.71, "learning_rate": 4.820448395365258e-05, "loss": 2.2384, "step": 113088 }, { "epoch": 0.71, "learning_rate": 4.819845771765023e-05, "loss": 2.2325, "step": 113096 }, { "epoch": 0.71, "learning_rate": 4.819243177503555e-05, "loss": 2.2537, "step": 113104 }, { "epoch": 0.71, "learning_rate": 4.818640612595834e-05, "loss": 2.2567, "step": 113112 }, { "epoch": 0.71, "learning_rate": 4.818038077056839e-05, "loss": 2.2483, "step": 113120 }, { "epoch": 0.71, "learning_rate": 4.817435570901551e-05, "loss": 2.2417, "step": 113128 }, { "epoch": 0.71, "learning_rate": 4.816833094144947e-05, "loss": 2.2557, "step": 113136 }, { "epoch": 0.71, "learning_rate": 4.816230646802005e-05, "loss": 2.2427, "step": 113144 }, { "epoch": 0.71, "learning_rate": 4.815628228887702e-05, "loss": 2.2447, "step": 113152 }, { "epoch": 0.71, "learning_rate": 4.8150258404170143e-05, "loss": 2.24, "step": 113160 }, { "epoch": 0.71, "learning_rate": 4.814423481404917e-05, "loss": 2.2396, "step": 113168 }, { "epoch": 0.71, "learning_rate": 4.813821151866384e-05, "loss": 2.2423, "step": 113176 }, { "epoch": 0.71, "learning_rate": 4.8132188518163915e-05, "loss": 2.261, "step": 113184 }, { "epoch": 0.71, "learning_rate": 4.812616581269912e-05, "loss": 2.2422, "step": 113192 }, { "epoch": 0.71, "learning_rate": 4.8120143402419164e-05, "loss": 2.2409, "step": 113200 }, { "epoch": 0.71, "learning_rate": 4.811412128747377e-05, "loss": 2.2504, "step": 113208 }, { "epoch": 0.71, "learning_rate": 4.810809946801269e-05, "loss": 2.2439, "step": 113216 }, { "epoch": 0.71, "learning_rate": 4.810207794418555e-05, "loss": 2.2439, "step": 113224 }, { "epoch": 0.71, "learning_rate": 4.80960567161421e-05, "loss": 2.2276, "step": 113232 }, { "epoch": 0.71, "learning_rate": 4.809003578403202e-05, "loss": 2.2581, "step": 113240 }, { "epoch": 0.71, "learning_rate": 4.8084015148005e-05, "loss": 2.2532, "step": 113248 }, { "epoch": 0.71, "learning_rate": 4.8077994808210676e-05, "loss": 2.2526, "step": 113256 }, { "epoch": 0.71, "learning_rate": 4.807197476479873e-05, "loss": 2.2446, "step": 113264 }, { "epoch": 0.71, "learning_rate": 4.806595501791886e-05, "loss": 2.2432, "step": 113272 }, { "epoch": 0.71, "learning_rate": 4.805993556772068e-05, "loss": 2.2386, "step": 113280 }, { "epoch": 0.71, "learning_rate": 4.8053916414353835e-05, "loss": 2.2519, "step": 113288 }, { "epoch": 0.71, "learning_rate": 4.8047897557967975e-05, "loss": 2.2389, "step": 113296 }, { "epoch": 0.71, "learning_rate": 4.804187899871271e-05, "loss": 2.243, "step": 113304 }, { "epoch": 0.71, "learning_rate": 4.803586073673768e-05, "loss": 2.2405, "step": 113312 }, { "epoch": 0.71, "learning_rate": 4.802984277219249e-05, "loss": 2.2396, "step": 113320 }, { "epoch": 0.71, "learning_rate": 4.802382510522677e-05, "loss": 2.24, "step": 113328 }, { "epoch": 0.71, "learning_rate": 4.8017807735990084e-05, "loss": 2.2409, "step": 113336 }, { "epoch": 0.71, "learning_rate": 4.8011790664632045e-05, "loss": 2.2456, "step": 113344 }, { "epoch": 0.71, "learning_rate": 4.800577389130224e-05, "loss": 2.2286, "step": 113352 }, { "epoch": 0.71, "learning_rate": 4.799975741615024e-05, "loss": 2.2408, "step": 113360 }, { "epoch": 0.71, "learning_rate": 4.7993741239325615e-05, "loss": 2.2578, "step": 113368 }, { "epoch": 0.71, "learning_rate": 4.7987725360977934e-05, "loss": 2.2403, "step": 113376 }, { "epoch": 0.71, "learning_rate": 4.7981709781256746e-05, "loss": 2.2306, "step": 113384 }, { "epoch": 0.71, "learning_rate": 4.79756945003116e-05, "loss": 2.2439, "step": 113392 }, { "epoch": 0.71, "learning_rate": 4.796967951829203e-05, "loss": 2.2408, "step": 113400 }, { "epoch": 0.71, "learning_rate": 4.79636648353476e-05, "loss": 2.2326, "step": 113408 }, { "epoch": 0.71, "learning_rate": 4.795765045162779e-05, "loss": 2.2384, "step": 113416 }, { "epoch": 0.71, "learning_rate": 4.795163636728215e-05, "loss": 2.2394, "step": 113424 }, { "epoch": 0.71, "learning_rate": 4.794562258246019e-05, "loss": 2.2455, "step": 113432 }, { "epoch": 0.71, "learning_rate": 4.7939609097311396e-05, "loss": 2.238, "step": 113440 }, { "epoch": 0.71, "learning_rate": 4.793359591198526e-05, "loss": 2.2399, "step": 113448 }, { "epoch": 0.71, "learning_rate": 4.79275830266313e-05, "loss": 2.2298, "step": 113456 }, { "epoch": 0.71, "learning_rate": 4.792157044139899e-05, "loss": 2.2356, "step": 113464 }, { "epoch": 0.71, "learning_rate": 4.791555815643778e-05, "loss": 2.2498, "step": 113472 }, { "epoch": 0.71, "learning_rate": 4.7909546171897136e-05, "loss": 2.2515, "step": 113480 }, { "epoch": 0.71, "learning_rate": 4.790353448792655e-05, "loss": 2.2434, "step": 113488 }, { "epoch": 0.71, "learning_rate": 4.7897523104675454e-05, "loss": 2.2228, "step": 113496 }, { "epoch": 0.71, "learning_rate": 4.7891512022293284e-05, "loss": 2.2347, "step": 113504 }, { "epoch": 0.71, "learning_rate": 4.78855012409295e-05, "loss": 2.236, "step": 113512 }, { "epoch": 0.71, "learning_rate": 4.787949076073349e-05, "loss": 2.2362, "step": 113520 }, { "epoch": 0.71, "learning_rate": 4.787348058185471e-05, "loss": 2.2405, "step": 113528 }, { "epoch": 0.71, "learning_rate": 4.786747070444256e-05, "loss": 2.2406, "step": 113536 }, { "epoch": 0.71, "learning_rate": 4.7861461128646465e-05, "loss": 2.2278, "step": 113544 }, { "epoch": 0.71, "learning_rate": 4.785545185461579e-05, "loss": 2.2489, "step": 113552 }, { "epoch": 0.71, "learning_rate": 4.784944288249995e-05, "loss": 2.2461, "step": 113560 }, { "epoch": 0.71, "learning_rate": 4.784343421244833e-05, "loss": 2.2459, "step": 113568 }, { "epoch": 0.71, "learning_rate": 4.783742584461028e-05, "loss": 2.2366, "step": 113576 }, { "epoch": 0.71, "learning_rate": 4.7831417779135204e-05, "loss": 2.2375, "step": 113584 }, { "epoch": 0.71, "learning_rate": 4.7825410016172446e-05, "loss": 2.2315, "step": 113592 }, { "epoch": 0.71, "learning_rate": 4.781940255587136e-05, "loss": 2.2379, "step": 113600 }, { "epoch": 0.71, "learning_rate": 4.78133953983813e-05, "loss": 2.2495, "step": 113608 }, { "epoch": 0.71, "learning_rate": 4.7807388543851584e-05, "loss": 2.2467, "step": 113616 }, { "epoch": 0.71, "learning_rate": 4.780138199243158e-05, "loss": 2.2502, "step": 113624 }, { "epoch": 0.71, "learning_rate": 4.779537574427056e-05, "loss": 2.2521, "step": 113632 }, { "epoch": 0.71, "learning_rate": 4.778936979951788e-05, "loss": 2.2577, "step": 113640 }, { "epoch": 0.71, "learning_rate": 4.7783364158322854e-05, "loss": 2.2394, "step": 113648 }, { "epoch": 0.71, "learning_rate": 4.777735882083474e-05, "loss": 2.2323, "step": 113656 }, { "epoch": 0.71, "learning_rate": 4.7771353787202856e-05, "loss": 2.2442, "step": 113664 }, { "epoch": 0.71, "learning_rate": 4.77653490575765e-05, "loss": 2.2448, "step": 113672 }, { "epoch": 0.71, "learning_rate": 4.7759344632104946e-05, "loss": 2.2328, "step": 113680 }, { "epoch": 0.71, "learning_rate": 4.775334051093745e-05, "loss": 2.2369, "step": 113688 }, { "epoch": 0.71, "learning_rate": 4.774733669422327e-05, "loss": 2.2421, "step": 113696 }, { "epoch": 0.71, "learning_rate": 4.7741333182111704e-05, "loss": 2.2438, "step": 113704 }, { "epoch": 0.71, "learning_rate": 4.7735329974751946e-05, "loss": 2.2367, "step": 113712 }, { "epoch": 0.71, "learning_rate": 4.772932707229327e-05, "loss": 2.236, "step": 113720 }, { "epoch": 0.71, "learning_rate": 4.77233244748849e-05, "loss": 2.2515, "step": 113728 }, { "epoch": 0.71, "learning_rate": 4.7717322182676063e-05, "loss": 2.2391, "step": 113736 }, { "epoch": 0.71, "learning_rate": 4.7711320195815965e-05, "loss": 2.237, "step": 113744 }, { "epoch": 0.71, "learning_rate": 4.770531851445383e-05, "loss": 2.2351, "step": 113752 }, { "epoch": 0.71, "learning_rate": 4.7699317138738866e-05, "loss": 2.2481, "step": 113760 }, { "epoch": 0.71, "learning_rate": 4.7693316068820245e-05, "loss": 2.2524, "step": 113768 }, { "epoch": 0.71, "learning_rate": 4.7687315304847166e-05, "loss": 2.2369, "step": 113776 }, { "epoch": 0.71, "learning_rate": 4.768131484696883e-05, "loss": 2.2417, "step": 113784 }, { "epoch": 0.71, "learning_rate": 4.767531469533437e-05, "loss": 2.2345, "step": 113792 }, { "epoch": 0.71, "learning_rate": 4.7669314850092965e-05, "loss": 2.2403, "step": 113800 }, { "epoch": 0.71, "learning_rate": 4.766331531139378e-05, "loss": 2.2415, "step": 113808 }, { "epoch": 0.71, "learning_rate": 4.765731607938598e-05, "loss": 2.2399, "step": 113816 }, { "epoch": 0.71, "learning_rate": 4.7651317154218674e-05, "loss": 2.2476, "step": 113824 }, { "epoch": 0.71, "learning_rate": 4.7645318536041005e-05, "loss": 2.2403, "step": 113832 }, { "epoch": 0.71, "learning_rate": 4.763932022500212e-05, "loss": 2.2342, "step": 113840 }, { "epoch": 0.71, "learning_rate": 4.7633322221251095e-05, "loss": 2.2309, "step": 113848 }, { "epoch": 0.71, "learning_rate": 4.762732452493708e-05, "loss": 2.252, "step": 113856 }, { "epoch": 0.71, "learning_rate": 4.762132713620918e-05, "loss": 2.2267, "step": 113864 }, { "epoch": 0.71, "learning_rate": 4.761533005521646e-05, "loss": 2.2428, "step": 113872 }, { "epoch": 0.71, "learning_rate": 4.760933328210802e-05, "loss": 2.2415, "step": 113880 }, { "epoch": 0.71, "learning_rate": 4.760333681703294e-05, "loss": 2.2086, "step": 113888 }, { "epoch": 0.71, "learning_rate": 4.759734066014032e-05, "loss": 2.2345, "step": 113896 }, { "epoch": 0.71, "learning_rate": 4.759134481157919e-05, "loss": 2.2359, "step": 113904 }, { "epoch": 0.71, "learning_rate": 4.7585349271498624e-05, "loss": 2.2503, "step": 113912 }, { "epoch": 0.71, "learning_rate": 4.757935404004767e-05, "loss": 2.2436, "step": 113920 }, { "epoch": 0.71, "learning_rate": 4.7573359117375363e-05, "loss": 2.2386, "step": 113928 }, { "epoch": 0.71, "learning_rate": 4.7567364503630736e-05, "loss": 2.2503, "step": 113936 }, { "epoch": 0.71, "learning_rate": 4.756137019896283e-05, "loss": 2.2478, "step": 113944 }, { "epoch": 0.71, "learning_rate": 4.7555376203520655e-05, "loss": 2.2259, "step": 113952 }, { "epoch": 0.71, "learning_rate": 4.754938251745323e-05, "loss": 2.2471, "step": 113960 }, { "epoch": 0.71, "learning_rate": 4.754338914090955e-05, "loss": 2.2241, "step": 113968 }, { "epoch": 0.71, "learning_rate": 4.753739607403861e-05, "loss": 2.242, "step": 113976 }, { "epoch": 0.71, "learning_rate": 4.75314033169894e-05, "loss": 2.2452, "step": 113984 }, { "epoch": 0.71, "learning_rate": 4.7525410869910905e-05, "loss": 2.2317, "step": 113992 }, { "epoch": 0.71, "learning_rate": 4.751941873295209e-05, "loss": 2.2265, "step": 114000 }, { "epoch": 0.71, "learning_rate": 4.751342690626193e-05, "loss": 2.2218, "step": 114008 }, { "epoch": 0.71, "learning_rate": 4.7507435389989386e-05, "loss": 2.2357, "step": 114016 }, { "epoch": 0.71, "learning_rate": 4.750144418428339e-05, "loss": 2.2292, "step": 114024 }, { "epoch": 0.71, "learning_rate": 4.74954532892929e-05, "loss": 2.2385, "step": 114032 }, { "epoch": 0.71, "learning_rate": 4.748946270516684e-05, "loss": 2.2337, "step": 114040 }, { "epoch": 0.71, "learning_rate": 4.7483472432054136e-05, "loss": 2.2568, "step": 114048 }, { "epoch": 0.71, "learning_rate": 4.747748247010374e-05, "loss": 2.2402, "step": 114056 }, { "epoch": 0.71, "learning_rate": 4.7471492819464504e-05, "loss": 2.2497, "step": 114064 }, { "epoch": 0.71, "learning_rate": 4.7465503480285363e-05, "loss": 2.2425, "step": 114072 }, { "epoch": 0.71, "learning_rate": 4.745951445271522e-05, "loss": 2.2479, "step": 114080 }, { "epoch": 0.71, "learning_rate": 4.745352573690296e-05, "loss": 2.2365, "step": 114088 }, { "epoch": 0.71, "learning_rate": 4.744753733299745e-05, "loss": 2.2326, "step": 114096 }, { "epoch": 0.71, "learning_rate": 4.7441549241147567e-05, "loss": 2.2425, "step": 114104 }, { "epoch": 0.71, "learning_rate": 4.743556146150219e-05, "loss": 2.2255, "step": 114112 }, { "epoch": 0.71, "learning_rate": 4.7429573994210163e-05, "loss": 2.2398, "step": 114120 }, { "epoch": 0.71, "learning_rate": 4.742358683942032e-05, "loss": 2.2389, "step": 114128 }, { "epoch": 0.71, "learning_rate": 4.741759999728155e-05, "loss": 2.2393, "step": 114136 }, { "epoch": 0.71, "learning_rate": 4.741161346794263e-05, "loss": 2.2417, "step": 114144 }, { "epoch": 0.71, "learning_rate": 4.740562725155242e-05, "loss": 2.2477, "step": 114152 }, { "epoch": 0.71, "learning_rate": 4.739964134825973e-05, "loss": 2.2419, "step": 114160 }, { "epoch": 0.71, "learning_rate": 4.7393655758213374e-05, "loss": 2.2349, "step": 114168 }, { "epoch": 0.71, "learning_rate": 4.738767048156214e-05, "loss": 2.2466, "step": 114176 }, { "epoch": 0.71, "learning_rate": 4.738168551845483e-05, "loss": 2.2424, "step": 114184 }, { "epoch": 0.71, "learning_rate": 4.7375700869040253e-05, "loss": 2.2373, "step": 114192 }, { "epoch": 0.71, "learning_rate": 4.7369716533467156e-05, "loss": 2.2433, "step": 114200 }, { "epoch": 0.71, "learning_rate": 4.736373251188432e-05, "loss": 2.2269, "step": 114208 }, { "epoch": 0.71, "learning_rate": 4.7357748804440526e-05, "loss": 2.2635, "step": 114216 }, { "epoch": 0.71, "learning_rate": 4.73517654112845e-05, "loss": 2.2373, "step": 114224 }, { "epoch": 0.71, "learning_rate": 4.734578233256501e-05, "loss": 2.2195, "step": 114232 }, { "epoch": 0.71, "learning_rate": 4.733979956843079e-05, "loss": 2.2453, "step": 114240 }, { "epoch": 0.71, "learning_rate": 4.733381711903058e-05, "loss": 2.2549, "step": 114248 }, { "epoch": 0.71, "learning_rate": 4.732783498451309e-05, "loss": 2.2452, "step": 114256 }, { "epoch": 0.71, "learning_rate": 4.732185316502704e-05, "loss": 2.2322, "step": 114264 }, { "epoch": 0.71, "learning_rate": 4.731587166072116e-05, "loss": 2.2494, "step": 114272 }, { "epoch": 0.71, "learning_rate": 4.730989047174412e-05, "loss": 2.2413, "step": 114280 }, { "epoch": 0.71, "learning_rate": 4.730390959824462e-05, "loss": 2.2258, "step": 114288 }, { "epoch": 0.71, "learning_rate": 4.729792904037136e-05, "loss": 2.2523, "step": 114296 }, { "epoch": 0.71, "learning_rate": 4.7291948798273026e-05, "loss": 2.2405, "step": 114304 }, { "epoch": 0.71, "learning_rate": 4.7285968872098245e-05, "loss": 2.2356, "step": 114312 }, { "epoch": 0.71, "learning_rate": 4.727998926199571e-05, "loss": 2.2263, "step": 114320 }, { "epoch": 0.71, "learning_rate": 4.7274009968114084e-05, "loss": 2.2254, "step": 114328 }, { "epoch": 0.71, "learning_rate": 4.7268030990601993e-05, "loss": 2.233, "step": 114336 }, { "epoch": 0.71, "learning_rate": 4.726205232960807e-05, "loss": 2.2291, "step": 114344 }, { "epoch": 0.71, "learning_rate": 4.7256073985280965e-05, "loss": 2.22, "step": 114352 }, { "epoch": 0.71, "learning_rate": 4.725009595776928e-05, "loss": 2.245, "step": 114360 }, { "epoch": 0.71, "learning_rate": 4.724411824722164e-05, "loss": 2.2364, "step": 114368 }, { "epoch": 0.71, "learning_rate": 4.723814085378665e-05, "loss": 2.2261, "step": 114376 }, { "epoch": 0.71, "learning_rate": 4.723216377761292e-05, "loss": 2.2259, "step": 114384 }, { "epoch": 0.71, "learning_rate": 4.7226187018849034e-05, "loss": 2.2428, "step": 114392 }, { "epoch": 0.71, "learning_rate": 4.7220210577643564e-05, "loss": 2.212, "step": 114400 }, { "epoch": 0.72, "learning_rate": 4.72142344541451e-05, "loss": 2.2399, "step": 114408 }, { "epoch": 0.72, "learning_rate": 4.72082586485022e-05, "loss": 2.2401, "step": 114416 }, { "epoch": 0.72, "learning_rate": 4.7202283160863416e-05, "loss": 2.251, "step": 114424 }, { "epoch": 0.72, "learning_rate": 4.719630799137731e-05, "loss": 2.2148, "step": 114432 }, { "epoch": 0.72, "learning_rate": 4.7190333140192435e-05, "loss": 2.2426, "step": 114440 }, { "epoch": 0.72, "learning_rate": 4.718435860745731e-05, "loss": 2.2385, "step": 114448 }, { "epoch": 0.72, "learning_rate": 4.7178384393320466e-05, "loss": 2.2372, "step": 114456 }, { "epoch": 0.72, "learning_rate": 4.7172410497930436e-05, "loss": 2.2225, "step": 114464 }, { "epoch": 0.72, "learning_rate": 4.71664369214357e-05, "loss": 2.2351, "step": 114472 }, { "epoch": 0.72, "learning_rate": 4.7160463663984786e-05, "loss": 2.2445, "step": 114480 }, { "epoch": 0.72, "learning_rate": 4.715449072572621e-05, "loss": 2.2361, "step": 114488 }, { "epoch": 0.72, "learning_rate": 4.714851810680841e-05, "loss": 2.258, "step": 114496 }, { "epoch": 0.72, "learning_rate": 4.714254580737989e-05, "loss": 2.2394, "step": 114504 }, { "epoch": 0.72, "learning_rate": 4.713657382758913e-05, "loss": 2.2387, "step": 114512 }, { "epoch": 0.72, "learning_rate": 4.7130602167584606e-05, "loss": 2.225, "step": 114520 }, { "epoch": 0.72, "learning_rate": 4.7124630827514735e-05, "loss": 2.2393, "step": 114528 }, { "epoch": 0.72, "learning_rate": 4.711865980752798e-05, "loss": 2.2542, "step": 114536 }, { "epoch": 0.72, "learning_rate": 4.711268910777282e-05, "loss": 2.2391, "step": 114544 }, { "epoch": 0.72, "learning_rate": 4.7106718728397625e-05, "loss": 2.2211, "step": 114552 }, { "epoch": 0.72, "learning_rate": 4.710074866955085e-05, "loss": 2.2296, "step": 114560 }, { "epoch": 0.72, "learning_rate": 4.709477893138094e-05, "loss": 2.2308, "step": 114568 }, { "epoch": 0.72, "learning_rate": 4.708880951403624e-05, "loss": 2.2336, "step": 114576 }, { "epoch": 0.72, "learning_rate": 4.7082840417665196e-05, "loss": 2.2311, "step": 114584 }, { "epoch": 0.72, "learning_rate": 4.7076871642416185e-05, "loss": 2.2513, "step": 114592 }, { "epoch": 0.72, "learning_rate": 4.707090318843761e-05, "loss": 2.2343, "step": 114600 }, { "epoch": 0.72, "learning_rate": 4.7064935055877815e-05, "loss": 2.236, "step": 114608 }, { "epoch": 0.72, "learning_rate": 4.705896724488519e-05, "loss": 2.2324, "step": 114616 }, { "epoch": 0.72, "learning_rate": 4.7052999755608096e-05, "loss": 2.2256, "step": 114624 }, { "epoch": 0.72, "learning_rate": 4.704703258819487e-05, "loss": 2.2282, "step": 114632 }, { "epoch": 0.72, "learning_rate": 4.704106574279388e-05, "loss": 2.2382, "step": 114640 }, { "epoch": 0.72, "learning_rate": 4.7035099219553444e-05, "loss": 2.2283, "step": 114648 }, { "epoch": 0.72, "learning_rate": 4.7029133018621894e-05, "loss": 2.2426, "step": 114656 }, { "epoch": 0.72, "learning_rate": 4.702316714014756e-05, "loss": 2.2426, "step": 114664 }, { "epoch": 0.72, "learning_rate": 4.7017201584278737e-05, "loss": 2.2184, "step": 114672 }, { "epoch": 0.72, "learning_rate": 4.701123635116376e-05, "loss": 2.226, "step": 114680 }, { "epoch": 0.72, "learning_rate": 4.7005271440950874e-05, "loss": 2.228, "step": 114688 }, { "epoch": 0.72, "learning_rate": 4.699930685378841e-05, "loss": 2.242, "step": 114696 }, { "epoch": 0.72, "learning_rate": 4.6993342589824655e-05, "loss": 2.2385, "step": 114704 }, { "epoch": 0.72, "learning_rate": 4.698737864920784e-05, "loss": 2.2388, "step": 114712 }, { "epoch": 0.72, "learning_rate": 4.698141503208625e-05, "loss": 2.2434, "step": 114720 }, { "epoch": 0.72, "learning_rate": 4.697545173860815e-05, "loss": 2.2279, "step": 114728 }, { "epoch": 0.72, "learning_rate": 4.69694887689218e-05, "loss": 2.249, "step": 114736 }, { "epoch": 0.72, "learning_rate": 4.696352612317539e-05, "loss": 2.2379, "step": 114744 }, { "epoch": 0.72, "learning_rate": 4.69575638015172e-05, "loss": 2.2523, "step": 114752 }, { "epoch": 0.72, "learning_rate": 4.695160180409544e-05, "loss": 2.2523, "step": 114760 }, { "epoch": 0.72, "learning_rate": 4.694564013105831e-05, "loss": 2.2487, "step": 114768 }, { "epoch": 0.72, "learning_rate": 4.693967878255404e-05, "loss": 2.2426, "step": 114776 }, { "epoch": 0.72, "learning_rate": 4.6933717758730814e-05, "loss": 2.2566, "step": 114784 }, { "epoch": 0.72, "learning_rate": 4.692775705973684e-05, "loss": 2.2527, "step": 114792 }, { "epoch": 0.72, "learning_rate": 4.692179668572029e-05, "loss": 2.2386, "step": 114800 }, { "epoch": 0.72, "learning_rate": 4.6915836636829335e-05, "loss": 2.2596, "step": 114808 }, { "epoch": 0.72, "learning_rate": 4.690987691321216e-05, "loss": 2.2296, "step": 114816 }, { "epoch": 0.72, "learning_rate": 4.6903917515016906e-05, "loss": 2.2402, "step": 114824 }, { "epoch": 0.72, "learning_rate": 4.689795844239173e-05, "loss": 2.2498, "step": 114832 }, { "epoch": 0.72, "learning_rate": 4.689199969548479e-05, "loss": 2.2464, "step": 114840 }, { "epoch": 0.72, "learning_rate": 4.6886041274444194e-05, "loss": 2.2441, "step": 114848 }, { "epoch": 0.72, "learning_rate": 4.6880083179418084e-05, "loss": 2.2388, "step": 114856 }, { "epoch": 0.72, "learning_rate": 4.687412541055458e-05, "loss": 2.2309, "step": 114864 }, { "epoch": 0.72, "learning_rate": 4.68681679680018e-05, "loss": 2.2473, "step": 114872 }, { "epoch": 0.72, "learning_rate": 4.6862210851907826e-05, "loss": 2.2492, "step": 114880 }, { "epoch": 0.72, "learning_rate": 4.6856254062420766e-05, "loss": 2.2413, "step": 114888 }, { "epoch": 0.72, "learning_rate": 4.685029759968873e-05, "loss": 2.2338, "step": 114896 }, { "epoch": 0.72, "learning_rate": 4.684434146385973e-05, "loss": 2.255, "step": 114904 }, { "epoch": 0.72, "learning_rate": 4.683838565508189e-05, "loss": 2.2429, "step": 114912 }, { "epoch": 0.72, "learning_rate": 4.6832430173503286e-05, "loss": 2.2564, "step": 114920 }, { "epoch": 0.72, "learning_rate": 4.682647501927192e-05, "loss": 2.2434, "step": 114928 }, { "epoch": 0.72, "learning_rate": 4.6820520192535866e-05, "loss": 2.264, "step": 114936 }, { "epoch": 0.72, "learning_rate": 4.6814565693443155e-05, "loss": 2.2385, "step": 114944 }, { "epoch": 0.72, "learning_rate": 4.6808611522141833e-05, "loss": 2.2498, "step": 114952 }, { "epoch": 0.72, "learning_rate": 4.6802657678779895e-05, "loss": 2.2462, "step": 114960 }, { "epoch": 0.72, "learning_rate": 4.6796704163505375e-05, "loss": 2.245, "step": 114968 }, { "epoch": 0.72, "learning_rate": 4.679075097646627e-05, "loss": 2.2473, "step": 114976 }, { "epoch": 0.72, "learning_rate": 4.678479811781058e-05, "loss": 2.2413, "step": 114984 }, { "epoch": 0.72, "learning_rate": 4.677884558768629e-05, "loss": 2.2377, "step": 114992 }, { "epoch": 0.72, "learning_rate": 4.677289338624138e-05, "loss": 2.2397, "step": 115000 }, { "epoch": 0.72, "learning_rate": 4.676694151362383e-05, "loss": 2.2394, "step": 115008 }, { "epoch": 0.72, "learning_rate": 4.676098996998159e-05, "loss": 2.2238, "step": 115016 }, { "epoch": 0.72, "learning_rate": 4.675503875546263e-05, "loss": 2.2623, "step": 115024 }, { "epoch": 0.72, "learning_rate": 4.67490878702149e-05, "loss": 2.2383, "step": 115032 }, { "epoch": 0.72, "learning_rate": 4.674313731438631e-05, "loss": 2.2449, "step": 115040 }, { "epoch": 0.72, "learning_rate": 4.673718708812483e-05, "loss": 2.2303, "step": 115048 }, { "epoch": 0.72, "learning_rate": 4.673123719157837e-05, "loss": 2.2485, "step": 115056 }, { "epoch": 0.72, "learning_rate": 4.672528762489483e-05, "loss": 2.231, "step": 115064 }, { "epoch": 0.72, "learning_rate": 4.671933838822214e-05, "loss": 2.248, "step": 115072 }, { "epoch": 0.72, "learning_rate": 4.671338948170818e-05, "loss": 2.2343, "step": 115080 }, { "epoch": 0.72, "learning_rate": 4.6707440905500856e-05, "loss": 2.2366, "step": 115088 }, { "epoch": 0.72, "learning_rate": 4.670149265974804e-05, "loss": 2.244, "step": 115096 }, { "epoch": 0.72, "learning_rate": 4.66955447445976e-05, "loss": 2.2477, "step": 115104 }, { "epoch": 0.72, "learning_rate": 4.668959716019743e-05, "loss": 2.2447, "step": 115112 }, { "epoch": 0.72, "learning_rate": 4.668364990669536e-05, "loss": 2.2318, "step": 115120 }, { "epoch": 0.72, "learning_rate": 4.667770298423923e-05, "loss": 2.2521, "step": 115128 }, { "epoch": 0.72, "learning_rate": 4.6671756392976906e-05, "loss": 2.2321, "step": 115136 }, { "epoch": 0.72, "learning_rate": 4.666581013305623e-05, "loss": 2.2471, "step": 115144 }, { "epoch": 0.72, "learning_rate": 4.6659864204625005e-05, "loss": 2.2533, "step": 115152 }, { "epoch": 0.72, "learning_rate": 4.6653918607831026e-05, "loss": 2.2535, "step": 115160 }, { "epoch": 0.72, "learning_rate": 4.664797334282216e-05, "loss": 2.2333, "step": 115168 }, { "epoch": 0.72, "learning_rate": 4.6642028409746166e-05, "loss": 2.2221, "step": 115176 }, { "epoch": 0.72, "learning_rate": 4.663608380875084e-05, "loss": 2.224, "step": 115184 }, { "epoch": 0.72, "learning_rate": 4.663013953998398e-05, "loss": 2.2576, "step": 115192 }, { "epoch": 0.72, "learning_rate": 4.662419560359333e-05, "loss": 2.2256, "step": 115200 }, { "epoch": 0.72, "learning_rate": 4.661825199972669e-05, "loss": 2.2493, "step": 115208 }, { "epoch": 0.72, "learning_rate": 4.6612308728531814e-05, "loss": 2.2352, "step": 115216 }, { "epoch": 0.72, "learning_rate": 4.660636579015644e-05, "loss": 2.2155, "step": 115224 }, { "epoch": 0.72, "learning_rate": 4.660042318474831e-05, "loss": 2.246, "step": 115232 }, { "epoch": 0.72, "learning_rate": 4.6594480912455164e-05, "loss": 2.2371, "step": 115240 }, { "epoch": 0.72, "learning_rate": 4.658853897342473e-05, "loss": 2.2372, "step": 115248 }, { "epoch": 0.72, "learning_rate": 4.658259736780473e-05, "loss": 2.2402, "step": 115256 }, { "epoch": 0.72, "learning_rate": 4.657665609574284e-05, "loss": 2.234, "step": 115264 }, { "epoch": 0.72, "learning_rate": 4.6570715157386825e-05, "loss": 2.2398, "step": 115272 }, { "epoch": 0.72, "learning_rate": 4.6564774552884304e-05, "loss": 2.2293, "step": 115280 }, { "epoch": 0.72, "learning_rate": 4.6558834282382995e-05, "loss": 2.2436, "step": 115288 }, { "epoch": 0.72, "learning_rate": 4.655289434603059e-05, "loss": 2.2407, "step": 115296 }, { "epoch": 0.72, "learning_rate": 4.654695474397475e-05, "loss": 2.2437, "step": 115304 }, { "epoch": 0.72, "learning_rate": 4.654101547636309e-05, "loss": 2.2473, "step": 115312 }, { "epoch": 0.72, "learning_rate": 4.653507654334331e-05, "loss": 2.2383, "step": 115320 }, { "epoch": 0.72, "learning_rate": 4.652913794506306e-05, "loss": 2.2481, "step": 115328 }, { "epoch": 0.72, "learning_rate": 4.652319968166993e-05, "loss": 2.2422, "step": 115336 }, { "epoch": 0.72, "learning_rate": 4.6517261753311566e-05, "loss": 2.2281, "step": 115344 }, { "epoch": 0.72, "learning_rate": 4.6511324160135586e-05, "loss": 2.2434, "step": 115352 }, { "epoch": 0.72, "learning_rate": 4.650538690228963e-05, "loss": 2.2348, "step": 115360 }, { "epoch": 0.72, "learning_rate": 4.649944997992124e-05, "loss": 2.2511, "step": 115368 }, { "epoch": 0.72, "learning_rate": 4.649351339317804e-05, "loss": 2.2249, "step": 115376 }, { "epoch": 0.72, "learning_rate": 4.6487577142207625e-05, "loss": 2.2387, "step": 115384 }, { "epoch": 0.72, "learning_rate": 4.648164122715755e-05, "loss": 2.2337, "step": 115392 }, { "epoch": 0.72, "learning_rate": 4.647570564817539e-05, "loss": 2.2208, "step": 115400 }, { "epoch": 0.72, "learning_rate": 4.6469770405408717e-05, "loss": 2.2271, "step": 115408 }, { "epoch": 0.72, "learning_rate": 4.646383549900506e-05, "loss": 2.2417, "step": 115416 }, { "epoch": 0.72, "learning_rate": 4.6457900929111966e-05, "loss": 2.2377, "step": 115424 }, { "epoch": 0.72, "learning_rate": 4.645196669587698e-05, "loss": 2.2313, "step": 115432 }, { "epoch": 0.72, "learning_rate": 4.644603279944763e-05, "loss": 2.2368, "step": 115440 }, { "epoch": 0.72, "learning_rate": 4.6440099239971414e-05, "loss": 2.2311, "step": 115448 }, { "epoch": 0.72, "learning_rate": 4.6434166017595846e-05, "loss": 2.2242, "step": 115456 }, { "epoch": 0.72, "learning_rate": 4.642823313246845e-05, "loss": 2.2385, "step": 115464 }, { "epoch": 0.72, "learning_rate": 4.64223005847367e-05, "loss": 2.2396, "step": 115472 }, { "epoch": 0.72, "learning_rate": 4.6416368374548067e-05, "loss": 2.2351, "step": 115480 }, { "epoch": 0.72, "learning_rate": 4.6410436502050045e-05, "loss": 2.2385, "step": 115488 }, { "epoch": 0.72, "learning_rate": 4.6404504967390105e-05, "loss": 2.2424, "step": 115496 }, { "epoch": 0.72, "learning_rate": 4.6398573770715685e-05, "loss": 2.2293, "step": 115504 }, { "epoch": 0.72, "learning_rate": 4.6392642912174255e-05, "loss": 2.2474, "step": 115512 }, { "epoch": 0.72, "learning_rate": 4.638671239191326e-05, "loss": 2.224, "step": 115520 }, { "epoch": 0.72, "learning_rate": 4.63807822100801e-05, "loss": 2.2476, "step": 115528 }, { "epoch": 0.72, "learning_rate": 4.6374852366822225e-05, "loss": 2.2377, "step": 115536 }, { "epoch": 0.72, "learning_rate": 4.636892286228707e-05, "loss": 2.23, "step": 115544 }, { "epoch": 0.72, "learning_rate": 4.6362993696622004e-05, "loss": 2.2375, "step": 115552 }, { "epoch": 0.72, "learning_rate": 4.635706486997444e-05, "loss": 2.2361, "step": 115560 }, { "epoch": 0.72, "learning_rate": 4.635113638249178e-05, "loss": 2.2554, "step": 115568 }, { "epoch": 0.72, "learning_rate": 4.634520823432142e-05, "loss": 2.2343, "step": 115576 }, { "epoch": 0.72, "learning_rate": 4.6339280425610695e-05, "loss": 2.2479, "step": 115584 }, { "epoch": 0.72, "learning_rate": 4.633335295650699e-05, "loss": 2.2272, "step": 115592 }, { "epoch": 0.72, "learning_rate": 4.632742582715768e-05, "loss": 2.2412, "step": 115600 }, { "epoch": 0.72, "learning_rate": 4.632149903771008e-05, "loss": 2.2362, "step": 115608 }, { "epoch": 0.72, "learning_rate": 4.631557258831155e-05, "loss": 2.2404, "step": 115616 }, { "epoch": 0.72, "learning_rate": 4.6309646479109435e-05, "loss": 2.2353, "step": 115624 }, { "epoch": 0.72, "learning_rate": 4.630372071025103e-05, "loss": 2.2554, "step": 115632 }, { "epoch": 0.72, "learning_rate": 4.629779528188367e-05, "loss": 2.253, "step": 115640 }, { "epoch": 0.72, "learning_rate": 4.629187019415465e-05, "loss": 2.2513, "step": 115648 }, { "epoch": 0.72, "learning_rate": 4.628594544721129e-05, "loss": 2.2603, "step": 115656 }, { "epoch": 0.72, "learning_rate": 4.628002104120086e-05, "loss": 2.2522, "step": 115664 }, { "epoch": 0.72, "learning_rate": 4.627409697627064e-05, "loss": 2.2561, "step": 115672 }, { "epoch": 0.72, "learning_rate": 4.6268173252567916e-05, "loss": 2.2431, "step": 115680 }, { "epoch": 0.72, "learning_rate": 4.626224987023994e-05, "loss": 2.2368, "step": 115688 }, { "epoch": 0.72, "learning_rate": 4.625632682943397e-05, "loss": 2.2512, "step": 115696 }, { "epoch": 0.72, "learning_rate": 4.625040413029727e-05, "loss": 2.2313, "step": 115704 }, { "epoch": 0.72, "learning_rate": 4.624448177297706e-05, "loss": 2.2323, "step": 115712 }, { "epoch": 0.72, "learning_rate": 4.623855975762057e-05, "loss": 2.2252, "step": 115720 }, { "epoch": 0.72, "learning_rate": 4.623263808437503e-05, "loss": 2.2328, "step": 115728 }, { "epoch": 0.72, "learning_rate": 4.6226716753387674e-05, "loss": 2.2331, "step": 115736 }, { "epoch": 0.72, "learning_rate": 4.6220795764805655e-05, "loss": 2.2412, "step": 115744 }, { "epoch": 0.72, "learning_rate": 4.621487511877621e-05, "loss": 2.2285, "step": 115752 }, { "epoch": 0.72, "learning_rate": 4.6208954815446525e-05, "loss": 2.2295, "step": 115760 }, { "epoch": 0.72, "learning_rate": 4.620303485496376e-05, "loss": 2.2342, "step": 115768 }, { "epoch": 0.72, "learning_rate": 4.61971152374751e-05, "loss": 2.2343, "step": 115776 }, { "epoch": 0.72, "learning_rate": 4.619119596312769e-05, "loss": 2.2371, "step": 115784 }, { "epoch": 0.72, "learning_rate": 4.618527703206872e-05, "loss": 2.2343, "step": 115792 }, { "epoch": 0.72, "learning_rate": 4.61793584444453e-05, "loss": 2.2329, "step": 115800 }, { "epoch": 0.72, "learning_rate": 4.617344020040459e-05, "loss": 2.2432, "step": 115808 }, { "epoch": 0.72, "learning_rate": 4.61675223000937e-05, "loss": 2.242, "step": 115816 }, { "epoch": 0.72, "learning_rate": 4.616160474365976e-05, "loss": 2.2469, "step": 115824 }, { "epoch": 0.72, "learning_rate": 4.6155687531249876e-05, "loss": 2.239, "step": 115832 }, { "epoch": 0.72, "learning_rate": 4.614977066301115e-05, "loss": 2.249, "step": 115840 }, { "epoch": 0.72, "learning_rate": 4.614385413909069e-05, "loss": 2.2216, "step": 115848 }, { "epoch": 0.72, "learning_rate": 4.613793795963556e-05, "loss": 2.2504, "step": 115856 }, { "epoch": 0.72, "learning_rate": 4.6132022124792854e-05, "loss": 2.2372, "step": 115864 }, { "epoch": 0.72, "learning_rate": 4.612610663470964e-05, "loss": 2.2255, "step": 115872 }, { "epoch": 0.72, "learning_rate": 4.6120191489532956e-05, "loss": 2.2458, "step": 115880 }, { "epoch": 0.72, "learning_rate": 4.6114276689409875e-05, "loss": 2.2428, "step": 115888 }, { "epoch": 0.72, "learning_rate": 4.610836223448745e-05, "loss": 2.2348, "step": 115896 }, { "epoch": 0.72, "learning_rate": 4.610244812491267e-05, "loss": 2.2419, "step": 115904 }, { "epoch": 0.72, "learning_rate": 4.609653436083261e-05, "loss": 2.2465, "step": 115912 }, { "epoch": 0.72, "learning_rate": 4.6090620942394244e-05, "loss": 2.2398, "step": 115920 }, { "epoch": 0.72, "learning_rate": 4.6084707869744627e-05, "loss": 2.2396, "step": 115928 }, { "epoch": 0.72, "learning_rate": 4.6078795143030725e-05, "loss": 2.2322, "step": 115936 }, { "epoch": 0.72, "learning_rate": 4.607288276239953e-05, "loss": 2.2419, "step": 115944 }, { "epoch": 0.72, "learning_rate": 4.606697072799805e-05, "loss": 2.2451, "step": 115952 }, { "epoch": 0.72, "learning_rate": 4.606105903997322e-05, "loss": 2.2184, "step": 115960 }, { "epoch": 0.72, "learning_rate": 4.605514769847203e-05, "loss": 2.2335, "step": 115968 }, { "epoch": 0.72, "learning_rate": 4.6049236703641455e-05, "loss": 2.2405, "step": 115976 }, { "epoch": 0.72, "learning_rate": 4.60433260556284e-05, "loss": 2.2346, "step": 115984 }, { "epoch": 0.72, "learning_rate": 4.6037415754579825e-05, "loss": 2.2329, "step": 115992 }, { "epoch": 0.72, "learning_rate": 4.603150580064265e-05, "loss": 2.2337, "step": 116000 }, { "epoch": 0.73, "learning_rate": 4.602559619396384e-05, "loss": 2.2297, "step": 116008 }, { "epoch": 0.73, "learning_rate": 4.601968693469026e-05, "loss": 2.2421, "step": 116016 }, { "epoch": 0.73, "learning_rate": 4.6013778022968826e-05, "loss": 2.2388, "step": 116024 }, { "epoch": 0.73, "learning_rate": 4.6007869458946444e-05, "loss": 2.2347, "step": 116032 }, { "epoch": 0.73, "learning_rate": 4.6001961242769994e-05, "loss": 2.2343, "step": 116040 }, { "epoch": 0.73, "learning_rate": 4.5996053374586365e-05, "loss": 2.2303, "step": 116048 }, { "epoch": 0.73, "learning_rate": 4.599014585454241e-05, "loss": 2.2532, "step": 116056 }, { "epoch": 0.73, "learning_rate": 4.5984238682785015e-05, "loss": 2.2308, "step": 116064 }, { "epoch": 0.73, "learning_rate": 4.5978331859461006e-05, "loss": 2.2383, "step": 116072 }, { "epoch": 0.73, "learning_rate": 4.5972425384717244e-05, "loss": 2.2317, "step": 116080 }, { "epoch": 0.73, "learning_rate": 4.596651925870057e-05, "loss": 2.2218, "step": 116088 }, { "epoch": 0.73, "learning_rate": 4.596061348155779e-05, "loss": 2.2267, "step": 116096 }, { "epoch": 0.73, "learning_rate": 4.5954708053435735e-05, "loss": 2.2246, "step": 116104 }, { "epoch": 0.73, "learning_rate": 4.5948802974481226e-05, "loss": 2.2299, "step": 116112 }, { "epoch": 0.73, "learning_rate": 4.594289824484104e-05, "loss": 2.2342, "step": 116120 }, { "epoch": 0.73, "learning_rate": 4.593699386466198e-05, "loss": 2.2386, "step": 116128 }, { "epoch": 0.73, "learning_rate": 4.593108983409082e-05, "loss": 2.2351, "step": 116136 }, { "epoch": 0.73, "learning_rate": 4.592518615327438e-05, "loss": 2.2324, "step": 116144 }, { "epoch": 0.73, "learning_rate": 4.5919282822359355e-05, "loss": 2.2291, "step": 116152 }, { "epoch": 0.73, "learning_rate": 4.5913379841492555e-05, "loss": 2.2338, "step": 116160 }, { "epoch": 0.73, "learning_rate": 4.5907477210820725e-05, "loss": 2.2151, "step": 116168 }, { "epoch": 0.73, "learning_rate": 4.590157493049058e-05, "loss": 2.2396, "step": 116176 }, { "epoch": 0.73, "learning_rate": 4.5895673000648856e-05, "loss": 2.2272, "step": 116184 }, { "epoch": 0.73, "learning_rate": 4.588977142144228e-05, "loss": 2.2443, "step": 116192 }, { "epoch": 0.73, "learning_rate": 4.58838701930176e-05, "loss": 2.2364, "step": 116200 }, { "epoch": 0.73, "learning_rate": 4.5877969315521466e-05, "loss": 2.2381, "step": 116208 }, { "epoch": 0.73, "learning_rate": 4.587206878910059e-05, "loss": 2.2393, "step": 116216 }, { "epoch": 0.73, "learning_rate": 4.58661686139017e-05, "loss": 2.2331, "step": 116224 }, { "epoch": 0.73, "learning_rate": 4.586026879007142e-05, "loss": 2.2267, "step": 116232 }, { "epoch": 0.73, "learning_rate": 4.5854369317756456e-05, "loss": 2.238, "step": 116240 }, { "epoch": 0.73, "learning_rate": 4.584847019710345e-05, "loss": 2.2483, "step": 116248 }, { "epoch": 0.73, "learning_rate": 4.584257142825907e-05, "loss": 2.2518, "step": 116256 }, { "epoch": 0.73, "learning_rate": 4.5836673011369954e-05, "loss": 2.2556, "step": 116264 }, { "epoch": 0.73, "learning_rate": 4.583077494658272e-05, "loss": 2.2425, "step": 116272 }, { "epoch": 0.73, "learning_rate": 4.5824877234044025e-05, "loss": 2.2345, "step": 116280 }, { "epoch": 0.73, "learning_rate": 4.581897987390047e-05, "loss": 2.2476, "step": 116288 }, { "epoch": 0.73, "learning_rate": 4.5813082866298665e-05, "loss": 2.2513, "step": 116296 }, { "epoch": 0.73, "learning_rate": 4.580718621138522e-05, "loss": 2.2349, "step": 116304 }, { "epoch": 0.73, "learning_rate": 4.58012899093067e-05, "loss": 2.2432, "step": 116312 }, { "epoch": 0.73, "learning_rate": 4.579539396020973e-05, "loss": 2.2435, "step": 116320 }, { "epoch": 0.73, "learning_rate": 4.578949836424085e-05, "loss": 2.2473, "step": 116328 }, { "epoch": 0.73, "learning_rate": 4.578360312154663e-05, "loss": 2.247, "step": 116336 }, { "epoch": 0.73, "learning_rate": 4.577770823227363e-05, "loss": 2.2435, "step": 116344 }, { "epoch": 0.73, "learning_rate": 4.5771813696568396e-05, "loss": 2.2145, "step": 116352 }, { "epoch": 0.73, "learning_rate": 4.576591951457749e-05, "loss": 2.2237, "step": 116360 }, { "epoch": 0.73, "learning_rate": 4.57600256864474e-05, "loss": 2.2432, "step": 116368 }, { "epoch": 0.73, "learning_rate": 4.575413221232467e-05, "loss": 2.2253, "step": 116376 }, { "epoch": 0.73, "learning_rate": 4.574823909235583e-05, "loss": 2.2582, "step": 116384 }, { "epoch": 0.73, "learning_rate": 4.574234632668735e-05, "loss": 2.2318, "step": 116392 }, { "epoch": 0.73, "learning_rate": 4.573645391546573e-05, "loss": 2.2386, "step": 116400 }, { "epoch": 0.73, "learning_rate": 4.573056185883748e-05, "loss": 2.2549, "step": 116408 }, { "epoch": 0.73, "learning_rate": 4.572467015694908e-05, "loss": 2.2314, "step": 116416 }, { "epoch": 0.73, "learning_rate": 4.571877880994696e-05, "loss": 2.2351, "step": 116424 }, { "epoch": 0.73, "learning_rate": 4.5712887817977595e-05, "loss": 2.2417, "step": 116432 }, { "epoch": 0.73, "learning_rate": 4.570699718118747e-05, "loss": 2.2439, "step": 116440 }, { "epoch": 0.73, "learning_rate": 4.5701106899722976e-05, "loss": 2.2313, "step": 116448 }, { "epoch": 0.73, "learning_rate": 4.569521697373056e-05, "loss": 2.2459, "step": 116456 }, { "epoch": 0.73, "learning_rate": 4.568932740335668e-05, "loss": 2.2644, "step": 116464 }, { "epoch": 0.73, "learning_rate": 4.568343818874772e-05, "loss": 2.2448, "step": 116472 }, { "epoch": 0.73, "learning_rate": 4.567754933005008e-05, "loss": 2.2374, "step": 116480 }, { "epoch": 0.73, "learning_rate": 4.567166082741017e-05, "loss": 2.2318, "step": 116488 }, { "epoch": 0.73, "learning_rate": 4.5665772680974404e-05, "loss": 2.2532, "step": 116496 }, { "epoch": 0.73, "learning_rate": 4.565988489088912e-05, "loss": 2.2368, "step": 116504 }, { "epoch": 0.73, "learning_rate": 4.56539974573007e-05, "loss": 2.2328, "step": 116512 }, { "epoch": 0.73, "learning_rate": 4.5648110380355525e-05, "loss": 2.2426, "step": 116520 }, { "epoch": 0.73, "learning_rate": 4.564222366019993e-05, "loss": 2.2528, "step": 116528 }, { "epoch": 0.73, "learning_rate": 4.563633729698027e-05, "loss": 2.2354, "step": 116536 }, { "epoch": 0.73, "learning_rate": 4.5630451290842866e-05, "loss": 2.24, "step": 116544 }, { "epoch": 0.73, "learning_rate": 4.562456564193407e-05, "loss": 2.2415, "step": 116552 }, { "epoch": 0.73, "learning_rate": 4.561868035040018e-05, "loss": 2.2497, "step": 116560 }, { "epoch": 0.73, "learning_rate": 4.5612795416387496e-05, "loss": 2.2498, "step": 116568 }, { "epoch": 0.73, "learning_rate": 4.560691084004236e-05, "loss": 2.2364, "step": 116576 }, { "epoch": 0.73, "learning_rate": 4.560102662151101e-05, "loss": 2.2475, "step": 116584 }, { "epoch": 0.73, "learning_rate": 4.559514276093977e-05, "loss": 2.2394, "step": 116592 }, { "epoch": 0.73, "learning_rate": 4.5589259258474904e-05, "loss": 2.238, "step": 116600 }, { "epoch": 0.73, "learning_rate": 4.5583376114262646e-05, "loss": 2.249, "step": 116608 }, { "epoch": 0.73, "learning_rate": 4.5577493328449286e-05, "loss": 2.2634, "step": 116616 }, { "epoch": 0.73, "learning_rate": 4.557161090118105e-05, "loss": 2.2547, "step": 116624 }, { "epoch": 0.73, "learning_rate": 4.556572883260421e-05, "loss": 2.2533, "step": 116632 }, { "epoch": 0.73, "learning_rate": 4.5559847122864954e-05, "loss": 2.2438, "step": 116640 }, { "epoch": 0.73, "learning_rate": 4.555396577210951e-05, "loss": 2.2466, "step": 116648 }, { "epoch": 0.73, "learning_rate": 4.5548084780484125e-05, "loss": 2.2372, "step": 116656 }, { "epoch": 0.73, "learning_rate": 4.5542204148134946e-05, "loss": 2.2383, "step": 116664 }, { "epoch": 0.73, "learning_rate": 4.553632387520821e-05, "loss": 2.2331, "step": 116672 }, { "epoch": 0.73, "learning_rate": 4.553044396185008e-05, "loss": 2.2359, "step": 116680 }, { "epoch": 0.73, "learning_rate": 4.5524564408206735e-05, "loss": 2.2511, "step": 116688 }, { "epoch": 0.73, "learning_rate": 4.551868521442435e-05, "loss": 2.2359, "step": 116696 }, { "epoch": 0.73, "learning_rate": 4.551280638064906e-05, "loss": 2.2325, "step": 116704 }, { "epoch": 0.73, "learning_rate": 4.5506927907027054e-05, "loss": 2.2398, "step": 116712 }, { "epoch": 0.73, "learning_rate": 4.550104979370443e-05, "loss": 2.2333, "step": 116720 }, { "epoch": 0.73, "learning_rate": 4.5495172040827335e-05, "loss": 2.2314, "step": 116728 }, { "epoch": 0.73, "learning_rate": 4.54892946485419e-05, "loss": 2.2615, "step": 116736 }, { "epoch": 0.73, "learning_rate": 4.5483417616994214e-05, "loss": 2.23, "step": 116744 }, { "epoch": 0.73, "learning_rate": 4.547754094633039e-05, "loss": 2.229, "step": 116752 }, { "epoch": 0.73, "learning_rate": 4.547166463669654e-05, "loss": 2.2399, "step": 116760 }, { "epoch": 0.73, "learning_rate": 4.546578868823874e-05, "loss": 2.2347, "step": 116768 }, { "epoch": 0.73, "learning_rate": 4.5459913101103056e-05, "loss": 2.2515, "step": 116776 }, { "epoch": 0.73, "learning_rate": 4.5454037875435565e-05, "loss": 2.2511, "step": 116784 }, { "epoch": 0.73, "learning_rate": 4.544816301138234e-05, "loss": 2.2248, "step": 116792 }, { "epoch": 0.73, "learning_rate": 4.5442288509089404e-05, "loss": 2.2568, "step": 116800 }, { "epoch": 0.73, "learning_rate": 4.543641436870279e-05, "loss": 2.2473, "step": 116808 }, { "epoch": 0.73, "learning_rate": 4.543054059036858e-05, "loss": 2.2513, "step": 116816 }, { "epoch": 0.73, "learning_rate": 4.542466717423275e-05, "loss": 2.2269, "step": 116824 }, { "epoch": 0.73, "learning_rate": 4.541879412044133e-05, "loss": 2.2413, "step": 116832 }, { "epoch": 0.73, "learning_rate": 4.5412921429140316e-05, "loss": 2.2369, "step": 116840 }, { "epoch": 0.73, "learning_rate": 4.5407049100475734e-05, "loss": 2.241, "step": 116848 }, { "epoch": 0.73, "learning_rate": 4.5401177134593534e-05, "loss": 2.2367, "step": 116856 }, { "epoch": 0.73, "learning_rate": 4.539530553163971e-05, "loss": 2.2443, "step": 116864 }, { "epoch": 0.73, "learning_rate": 4.538943429176023e-05, "loss": 2.2411, "step": 116872 }, { "epoch": 0.73, "learning_rate": 4.538356341510105e-05, "loss": 2.2471, "step": 116880 }, { "epoch": 0.73, "learning_rate": 4.5377692901808124e-05, "loss": 2.2403, "step": 116888 }, { "epoch": 0.73, "learning_rate": 4.5371822752027386e-05, "loss": 2.2458, "step": 116896 }, { "epoch": 0.73, "learning_rate": 4.536595296590479e-05, "loss": 2.2467, "step": 116904 }, { "epoch": 0.73, "learning_rate": 4.536008354358623e-05, "loss": 2.2357, "step": 116912 }, { "epoch": 0.73, "learning_rate": 4.535421448521765e-05, "loss": 2.2235, "step": 116920 }, { "epoch": 0.73, "learning_rate": 4.5348345790944943e-05, "loss": 2.2341, "step": 116928 }, { "epoch": 0.73, "learning_rate": 4.5342477460913993e-05, "loss": 2.2363, "step": 116936 }, { "epoch": 0.73, "learning_rate": 4.53366094952707e-05, "loss": 2.2351, "step": 116944 }, { "epoch": 0.73, "learning_rate": 4.533074189416095e-05, "loss": 2.233, "step": 116952 }, { "epoch": 0.73, "learning_rate": 4.532487465773059e-05, "loss": 2.2363, "step": 116960 }, { "epoch": 0.73, "learning_rate": 4.531900778612549e-05, "loss": 2.2487, "step": 116968 }, { "epoch": 0.73, "learning_rate": 4.531314127949151e-05, "loss": 2.2471, "step": 116976 }, { "epoch": 0.73, "learning_rate": 4.5307275137974495e-05, "loss": 2.2231, "step": 116984 }, { "epoch": 0.73, "learning_rate": 4.530140936172025e-05, "loss": 2.2541, "step": 116992 }, { "epoch": 0.73, "learning_rate": 4.5295543950874624e-05, "loss": 2.2606, "step": 117000 }, { "epoch": 0.73, "learning_rate": 4.528967890558344e-05, "loss": 2.2468, "step": 117008 }, { "epoch": 0.73, "learning_rate": 4.5283814225992476e-05, "loss": 2.2322, "step": 117016 }, { "epoch": 0.73, "learning_rate": 4.527794991224753e-05, "loss": 2.2367, "step": 117024 }, { "epoch": 0.73, "learning_rate": 4.527208596449442e-05, "loss": 2.2355, "step": 117032 }, { "epoch": 0.73, "learning_rate": 4.52662223828789e-05, "loss": 2.2452, "step": 117040 }, { "epoch": 0.73, "learning_rate": 4.526035916754674e-05, "loss": 2.2294, "step": 117048 }, { "epoch": 0.73, "learning_rate": 4.52544963186437e-05, "loss": 2.2341, "step": 117056 }, { "epoch": 0.73, "learning_rate": 4.524863383631556e-05, "loss": 2.2247, "step": 117064 }, { "epoch": 0.73, "learning_rate": 4.524277172070801e-05, "loss": 2.2409, "step": 117072 }, { "epoch": 0.73, "learning_rate": 4.523690997196682e-05, "loss": 2.2172, "step": 117080 }, { "epoch": 0.73, "learning_rate": 4.523104859023772e-05, "loss": 2.2171, "step": 117088 }, { "epoch": 0.73, "learning_rate": 4.5225187575666386e-05, "loss": 2.2251, "step": 117096 }, { "epoch": 0.73, "learning_rate": 4.521932692839856e-05, "loss": 2.2337, "step": 117104 }, { "epoch": 0.73, "learning_rate": 4.5213466648579915e-05, "loss": 2.2384, "step": 117112 }, { "epoch": 0.73, "learning_rate": 4.520760673635616e-05, "loss": 2.2311, "step": 117120 }, { "epoch": 0.73, "learning_rate": 4.520174719187296e-05, "loss": 2.2299, "step": 117128 }, { "epoch": 0.73, "learning_rate": 4.5195888015275974e-05, "loss": 2.2392, "step": 117136 }, { "epoch": 0.73, "learning_rate": 4.519002920671089e-05, "loss": 2.2331, "step": 117144 }, { "epoch": 0.73, "learning_rate": 4.518417076632332e-05, "loss": 2.2414, "step": 117152 }, { "epoch": 0.73, "learning_rate": 4.517831269425894e-05, "loss": 2.2433, "step": 117160 }, { "epoch": 0.73, "learning_rate": 4.5172454990663385e-05, "loss": 2.2398, "step": 117168 }, { "epoch": 0.73, "learning_rate": 4.516659765568223e-05, "loss": 2.2221, "step": 117176 }, { "epoch": 0.73, "learning_rate": 4.516074068946114e-05, "loss": 2.2423, "step": 117184 }, { "epoch": 0.73, "learning_rate": 4.5154884092145685e-05, "loss": 2.2226, "step": 117192 }, { "epoch": 0.73, "learning_rate": 4.514902786388151e-05, "loss": 2.2513, "step": 117200 }, { "epoch": 0.73, "learning_rate": 4.514317200481414e-05, "loss": 2.2447, "step": 117208 }, { "epoch": 0.73, "learning_rate": 4.513731651508918e-05, "loss": 2.2311, "step": 117216 }, { "epoch": 0.73, "learning_rate": 4.513146139485223e-05, "loss": 2.2216, "step": 117224 }, { "epoch": 0.73, "learning_rate": 4.512560664424879e-05, "loss": 2.2415, "step": 117232 }, { "epoch": 0.73, "learning_rate": 4.511975226342444e-05, "loss": 2.2339, "step": 117240 }, { "epoch": 0.73, "learning_rate": 4.5113898252524716e-05, "loss": 2.2387, "step": 117248 }, { "epoch": 0.73, "learning_rate": 4.510804461169518e-05, "loss": 2.2342, "step": 117256 }, { "epoch": 0.73, "learning_rate": 4.5102191341081295e-05, "loss": 2.2349, "step": 117264 }, { "epoch": 0.73, "learning_rate": 4.50963384408286e-05, "loss": 2.2507, "step": 117272 }, { "epoch": 0.73, "learning_rate": 4.509048591108263e-05, "loss": 2.2339, "step": 117280 }, { "epoch": 0.73, "learning_rate": 4.508463375198884e-05, "loss": 2.228, "step": 117288 }, { "epoch": 0.73, "learning_rate": 4.507878196369273e-05, "loss": 2.2358, "step": 117296 }, { "epoch": 0.73, "learning_rate": 4.507293054633978e-05, "loss": 2.2401, "step": 117304 }, { "epoch": 0.73, "learning_rate": 4.5067079500075435e-05, "loss": 2.2246, "step": 117312 }, { "epoch": 0.73, "learning_rate": 4.5061228825045176e-05, "loss": 2.2411, "step": 117320 }, { "epoch": 0.73, "learning_rate": 4.5055378521394446e-05, "loss": 2.2552, "step": 117328 }, { "epoch": 0.73, "learning_rate": 4.504952858926869e-05, "loss": 2.2335, "step": 117336 }, { "epoch": 0.73, "learning_rate": 4.504367902881332e-05, "loss": 2.2403, "step": 117344 }, { "epoch": 0.73, "learning_rate": 4.503782984017377e-05, "loss": 2.2216, "step": 117352 }, { "epoch": 0.73, "learning_rate": 4.503198102349546e-05, "loss": 2.2261, "step": 117360 }, { "epoch": 0.73, "learning_rate": 4.502613257892377e-05, "loss": 2.2364, "step": 117368 }, { "epoch": 0.73, "learning_rate": 4.50202845066041e-05, "loss": 2.2359, "step": 117376 }, { "epoch": 0.73, "learning_rate": 4.501443680668185e-05, "loss": 2.2423, "step": 117384 }, { "epoch": 0.73, "learning_rate": 4.500858947930238e-05, "loss": 2.2465, "step": 117392 }, { "epoch": 0.73, "learning_rate": 4.500274252461105e-05, "loss": 2.2302, "step": 117400 }, { "epoch": 0.73, "learning_rate": 4.499689594275322e-05, "loss": 2.2308, "step": 117408 }, { "epoch": 0.73, "learning_rate": 4.499104973387426e-05, "loss": 2.2183, "step": 117416 }, { "epoch": 0.73, "learning_rate": 4.498520389811947e-05, "loss": 2.2202, "step": 117424 }, { "epoch": 0.73, "learning_rate": 4.497935843563419e-05, "loss": 2.2311, "step": 117432 }, { "epoch": 0.73, "learning_rate": 4.4973513346563776e-05, "loss": 2.2485, "step": 117440 }, { "epoch": 0.73, "learning_rate": 4.496766863105348e-05, "loss": 2.2447, "step": 117448 }, { "epoch": 0.73, "learning_rate": 4.4961824289248625e-05, "loss": 2.2244, "step": 117456 }, { "epoch": 0.73, "learning_rate": 4.495598032129451e-05, "loss": 2.2429, "step": 117464 }, { "epoch": 0.73, "learning_rate": 4.495013672733643e-05, "loss": 2.2393, "step": 117472 }, { "epoch": 0.73, "learning_rate": 4.494429350751963e-05, "loss": 2.2417, "step": 117480 }, { "epoch": 0.73, "learning_rate": 4.493845066198937e-05, "loss": 2.2525, "step": 117488 }, { "epoch": 0.73, "learning_rate": 4.4932608190890936e-05, "loss": 2.2457, "step": 117496 }, { "epoch": 0.73, "learning_rate": 4.4926766094369545e-05, "loss": 2.2392, "step": 117504 }, { "epoch": 0.73, "learning_rate": 4.492092437257043e-05, "loss": 2.2451, "step": 117512 }, { "epoch": 0.73, "learning_rate": 4.491508302563884e-05, "loss": 2.2312, "step": 117520 }, { "epoch": 0.73, "learning_rate": 4.490924205371997e-05, "loss": 2.2394, "step": 117528 }, { "epoch": 0.73, "learning_rate": 4.490340145695904e-05, "loss": 2.2487, "step": 117536 }, { "epoch": 0.73, "learning_rate": 4.4897561235501236e-05, "loss": 2.2376, "step": 117544 }, { "epoch": 0.73, "learning_rate": 4.4891721389491756e-05, "loss": 2.257, "step": 117552 }, { "epoch": 0.73, "learning_rate": 4.488588191907578e-05, "loss": 2.2365, "step": 117560 }, { "epoch": 0.73, "learning_rate": 4.4880042824398484e-05, "loss": 2.2533, "step": 117568 }, { "epoch": 0.73, "learning_rate": 4.4874204105605014e-05, "loss": 2.2405, "step": 117576 }, { "epoch": 0.73, "learning_rate": 4.4868365762840525e-05, "loss": 2.2293, "step": 117584 }, { "epoch": 0.73, "learning_rate": 4.486252779625015e-05, "loss": 2.2355, "step": 117592 }, { "epoch": 0.73, "learning_rate": 4.4856690205979046e-05, "loss": 2.2406, "step": 117600 }, { "epoch": 0.74, "learning_rate": 4.4850852992172324e-05, "loss": 2.2366, "step": 117608 }, { "epoch": 0.74, "learning_rate": 4.484501615497509e-05, "loss": 2.2365, "step": 117616 }, { "epoch": 0.74, "learning_rate": 4.483917969453246e-05, "loss": 2.235, "step": 117624 }, { "epoch": 0.74, "learning_rate": 4.483334361098953e-05, "loss": 2.2584, "step": 117632 }, { "epoch": 0.74, "learning_rate": 4.482750790449136e-05, "loss": 2.2641, "step": 117640 }, { "epoch": 0.74, "learning_rate": 4.482167257518306e-05, "loss": 2.2448, "step": 117648 }, { "epoch": 0.74, "learning_rate": 4.481583762320969e-05, "loss": 2.2481, "step": 117656 }, { "epoch": 0.74, "learning_rate": 4.481000304871629e-05, "loss": 2.2441, "step": 117664 }, { "epoch": 0.74, "learning_rate": 4.480416885184791e-05, "loss": 2.2368, "step": 117672 }, { "epoch": 0.74, "learning_rate": 4.47983350327496e-05, "loss": 2.2277, "step": 117680 }, { "epoch": 0.74, "learning_rate": 4.47925015915664e-05, "loss": 2.2278, "step": 117688 }, { "epoch": 0.74, "learning_rate": 4.478666852844331e-05, "loss": 2.2266, "step": 117696 }, { "epoch": 0.74, "learning_rate": 4.478083584352534e-05, "loss": 2.2658, "step": 117704 }, { "epoch": 0.74, "learning_rate": 4.4775003536957515e-05, "loss": 2.2495, "step": 117712 }, { "epoch": 0.74, "learning_rate": 4.476917160888479e-05, "loss": 2.2432, "step": 117720 }, { "epoch": 0.74, "learning_rate": 4.4763340059452174e-05, "loss": 2.2433, "step": 117728 }, { "epoch": 0.74, "learning_rate": 4.4757508888804636e-05, "loss": 2.2519, "step": 117736 }, { "epoch": 0.74, "learning_rate": 4.475167809708715e-05, "loss": 2.2469, "step": 117744 }, { "epoch": 0.74, "learning_rate": 4.4745847684444644e-05, "loss": 2.2377, "step": 117752 }, { "epoch": 0.74, "learning_rate": 4.474001765102207e-05, "loss": 2.2402, "step": 117760 }, { "epoch": 0.74, "learning_rate": 4.4734187996964386e-05, "loss": 2.2456, "step": 117768 }, { "epoch": 0.74, "learning_rate": 4.4728358722416486e-05, "loss": 2.249, "step": 117776 }, { "epoch": 0.74, "learning_rate": 4.472252982752331e-05, "loss": 2.2385, "step": 117784 }, { "epoch": 0.74, "learning_rate": 4.471670131242976e-05, "loss": 2.252, "step": 117792 }, { "epoch": 0.74, "learning_rate": 4.4710873177280715e-05, "loss": 2.2401, "step": 117800 }, { "epoch": 0.74, "learning_rate": 4.4705045422221085e-05, "loss": 2.233, "step": 117808 }, { "epoch": 0.74, "learning_rate": 4.469921804739574e-05, "loss": 2.2531, "step": 117816 }, { "epoch": 0.74, "learning_rate": 4.469339105294957e-05, "loss": 2.2426, "step": 117824 }, { "epoch": 0.74, "learning_rate": 4.46875644390274e-05, "loss": 2.251, "step": 117832 }, { "epoch": 0.74, "learning_rate": 4.4681738205774085e-05, "loss": 2.2638, "step": 117840 }, { "epoch": 0.74, "learning_rate": 4.4675912353334505e-05, "loss": 2.2392, "step": 117848 }, { "epoch": 0.74, "learning_rate": 4.467008688185345e-05, "loss": 2.2333, "step": 117856 }, { "epoch": 0.74, "learning_rate": 4.4664261791475736e-05, "loss": 2.2625, "step": 117864 }, { "epoch": 0.74, "learning_rate": 4.4658437082346226e-05, "loss": 2.2235, "step": 117872 }, { "epoch": 0.74, "learning_rate": 4.465261275460967e-05, "loss": 2.2447, "step": 117880 }, { "epoch": 0.74, "learning_rate": 4.464678880841089e-05, "loss": 2.2401, "step": 117888 }, { "epoch": 0.74, "learning_rate": 4.464096524389465e-05, "loss": 2.2416, "step": 117896 }, { "epoch": 0.74, "learning_rate": 4.4635142061205764e-05, "loss": 2.2376, "step": 117904 }, { "epoch": 0.74, "learning_rate": 4.462931926048895e-05, "loss": 2.2377, "step": 117912 }, { "epoch": 0.74, "learning_rate": 4.4623496841889e-05, "loss": 2.2507, "step": 117920 }, { "epoch": 0.74, "learning_rate": 4.461767480555063e-05, "loss": 2.2312, "step": 117928 }, { "epoch": 0.74, "learning_rate": 4.4611853151618596e-05, "loss": 2.2395, "step": 117936 }, { "epoch": 0.74, "learning_rate": 4.4606031880237605e-05, "loss": 2.2458, "step": 117944 }, { "epoch": 0.74, "learning_rate": 4.46002109915524e-05, "loss": 2.2518, "step": 117952 }, { "epoch": 0.74, "learning_rate": 4.4594390485707686e-05, "loss": 2.2493, "step": 117960 }, { "epoch": 0.74, "learning_rate": 4.458857036284814e-05, "loss": 2.2306, "step": 117968 }, { "epoch": 0.74, "learning_rate": 4.4582750623118466e-05, "loss": 2.247, "step": 117976 }, { "epoch": 0.74, "learning_rate": 4.4576931266663354e-05, "loss": 2.2255, "step": 117984 }, { "epoch": 0.74, "learning_rate": 4.457111229362745e-05, "loss": 2.2352, "step": 117992 }, { "epoch": 0.74, "learning_rate": 4.456529370415542e-05, "loss": 2.2227, "step": 118000 }, { "epoch": 0.74, "learning_rate": 4.455947549839195e-05, "loss": 2.2492, "step": 118008 }, { "epoch": 0.74, "learning_rate": 4.4553657676481605e-05, "loss": 2.2379, "step": 118016 }, { "epoch": 0.74, "learning_rate": 4.454784023856909e-05, "loss": 2.2192, "step": 118024 }, { "epoch": 0.74, "learning_rate": 4.454202318479899e-05, "loss": 2.2482, "step": 118032 }, { "epoch": 0.74, "learning_rate": 4.453620651531595e-05, "loss": 2.2611, "step": 118040 }, { "epoch": 0.74, "learning_rate": 4.453039023026453e-05, "loss": 2.2324, "step": 118048 }, { "epoch": 0.74, "learning_rate": 4.452457432978934e-05, "loss": 2.2404, "step": 118056 }, { "epoch": 0.74, "learning_rate": 4.451875881403499e-05, "loss": 2.247, "step": 118064 }, { "epoch": 0.74, "learning_rate": 4.451294368314603e-05, "loss": 2.2509, "step": 118072 }, { "epoch": 0.74, "learning_rate": 4.4507128937267004e-05, "loss": 2.248, "step": 118080 }, { "epoch": 0.74, "learning_rate": 4.45013145765425e-05, "loss": 2.2484, "step": 118088 }, { "epoch": 0.74, "learning_rate": 4.449550060111707e-05, "loss": 2.2445, "step": 118096 }, { "epoch": 0.74, "learning_rate": 4.448968701113523e-05, "loss": 2.256, "step": 118104 }, { "epoch": 0.74, "learning_rate": 4.4483873806741496e-05, "loss": 2.2427, "step": 118112 }, { "epoch": 0.74, "learning_rate": 4.447806098808043e-05, "loss": 2.2343, "step": 118120 }, { "epoch": 0.74, "learning_rate": 4.447224855529648e-05, "loss": 2.2435, "step": 118128 }, { "epoch": 0.74, "learning_rate": 4.446643650853419e-05, "loss": 2.2505, "step": 118136 }, { "epoch": 0.74, "learning_rate": 4.4460624847938024e-05, "loss": 2.25, "step": 118144 }, { "epoch": 0.74, "learning_rate": 4.445481357365246e-05, "loss": 2.2341, "step": 118152 }, { "epoch": 0.74, "learning_rate": 4.4449002685821984e-05, "loss": 2.2433, "step": 118160 }, { "epoch": 0.74, "learning_rate": 4.4443192184591044e-05, "loss": 2.236, "step": 118168 }, { "epoch": 0.74, "learning_rate": 4.44373820701041e-05, "loss": 2.2642, "step": 118176 }, { "epoch": 0.74, "learning_rate": 4.4431572342505565e-05, "loss": 2.2467, "step": 118184 }, { "epoch": 0.74, "learning_rate": 4.4425763001939905e-05, "loss": 2.2243, "step": 118192 }, { "epoch": 0.74, "learning_rate": 4.441995404855152e-05, "loss": 2.2247, "step": 118200 }, { "epoch": 0.74, "learning_rate": 4.441414548248483e-05, "loss": 2.2446, "step": 118208 }, { "epoch": 0.74, "learning_rate": 4.440833730388422e-05, "loss": 2.2256, "step": 118216 }, { "epoch": 0.74, "learning_rate": 4.4402529512894116e-05, "loss": 2.2389, "step": 118224 }, { "epoch": 0.74, "learning_rate": 4.439672210965885e-05, "loss": 2.2474, "step": 118232 }, { "epoch": 0.74, "learning_rate": 4.439091509432283e-05, "loss": 2.2366, "step": 118240 }, { "epoch": 0.74, "learning_rate": 4.438510846703041e-05, "loss": 2.2333, "step": 118248 }, { "epoch": 0.74, "learning_rate": 4.437930222792597e-05, "loss": 2.2411, "step": 118256 }, { "epoch": 0.74, "learning_rate": 4.43734963771538e-05, "loss": 2.233, "step": 118264 }, { "epoch": 0.74, "learning_rate": 4.4367690914858275e-05, "loss": 2.2323, "step": 118272 }, { "epoch": 0.74, "learning_rate": 4.436188584118372e-05, "loss": 2.2353, "step": 118280 }, { "epoch": 0.74, "learning_rate": 4.435608115627442e-05, "loss": 2.2581, "step": 118288 }, { "epoch": 0.74, "learning_rate": 4.43502768602747e-05, "loss": 2.249, "step": 118296 }, { "epoch": 0.74, "learning_rate": 4.434447295332885e-05, "loss": 2.2316, "step": 118304 }, { "epoch": 0.74, "learning_rate": 4.433866943558118e-05, "loss": 2.2388, "step": 118312 }, { "epoch": 0.74, "learning_rate": 4.433286630717593e-05, "loss": 2.2267, "step": 118320 }, { "epoch": 0.74, "learning_rate": 4.432706356825738e-05, "loss": 2.2405, "step": 118328 }, { "epoch": 0.74, "learning_rate": 4.432126121896979e-05, "loss": 2.2485, "step": 118336 }, { "epoch": 0.74, "learning_rate": 4.431545925945741e-05, "loss": 2.2314, "step": 118344 }, { "epoch": 0.74, "learning_rate": 4.430965768986446e-05, "loss": 2.2203, "step": 118352 }, { "epoch": 0.74, "learning_rate": 4.43038565103352e-05, "loss": 2.2372, "step": 118360 }, { "epoch": 0.74, "learning_rate": 4.429805572101381e-05, "loss": 2.2396, "step": 118368 }, { "epoch": 0.74, "learning_rate": 4.429225532204452e-05, "loss": 2.2396, "step": 118376 }, { "epoch": 0.74, "learning_rate": 4.428645531357153e-05, "loss": 2.2355, "step": 118384 }, { "epoch": 0.74, "learning_rate": 4.428065569573903e-05, "loss": 2.2398, "step": 118392 }, { "epoch": 0.74, "learning_rate": 4.427485646869118e-05, "loss": 2.2485, "step": 118400 }, { "epoch": 0.74, "learning_rate": 4.426905763257216e-05, "loss": 2.2359, "step": 118408 }, { "epoch": 0.74, "learning_rate": 4.4263259187526143e-05, "loss": 2.2271, "step": 118416 }, { "epoch": 0.74, "learning_rate": 4.425746113369727e-05, "loss": 2.2311, "step": 118424 }, { "epoch": 0.74, "learning_rate": 4.425166347122967e-05, "loss": 2.2345, "step": 118432 }, { "epoch": 0.74, "learning_rate": 4.4245866200267486e-05, "loss": 2.2389, "step": 118440 }, { "epoch": 0.74, "learning_rate": 4.424006932095484e-05, "loss": 2.2264, "step": 118448 }, { "epoch": 0.74, "learning_rate": 4.423427283343583e-05, "loss": 2.2236, "step": 118456 }, { "epoch": 0.74, "learning_rate": 4.4228476737854574e-05, "loss": 2.2392, "step": 118464 }, { "epoch": 0.74, "learning_rate": 4.422268103435517e-05, "loss": 2.2486, "step": 118472 }, { "epoch": 0.74, "learning_rate": 4.4216885723081655e-05, "loss": 2.2449, "step": 118480 }, { "epoch": 0.74, "learning_rate": 4.421109080417815e-05, "loss": 2.2341, "step": 118488 }, { "epoch": 0.74, "learning_rate": 4.420529627778871e-05, "loss": 2.2335, "step": 118496 }, { "epoch": 0.74, "learning_rate": 4.4199502144057355e-05, "loss": 2.2234, "step": 118504 }, { "epoch": 0.74, "learning_rate": 4.419370840312815e-05, "loss": 2.2574, "step": 118512 }, { "epoch": 0.74, "learning_rate": 4.418791505514513e-05, "loss": 2.221, "step": 118520 }, { "epoch": 0.74, "learning_rate": 4.418212210025234e-05, "loss": 2.2505, "step": 118528 }, { "epoch": 0.74, "learning_rate": 4.417632953859374e-05, "loss": 2.2443, "step": 118536 }, { "epoch": 0.74, "learning_rate": 4.4170537370313366e-05, "loss": 2.237, "step": 118544 }, { "epoch": 0.74, "learning_rate": 4.4164745595555225e-05, "loss": 2.2271, "step": 118552 }, { "epoch": 0.74, "learning_rate": 4.4158954214463277e-05, "loss": 2.2384, "step": 118560 }, { "epoch": 0.74, "learning_rate": 4.41531632271815e-05, "loss": 2.2409, "step": 118568 }, { "epoch": 0.74, "learning_rate": 4.414737263385387e-05, "loss": 2.2408, "step": 118576 }, { "epoch": 0.74, "learning_rate": 4.414158243462433e-05, "loss": 2.2314, "step": 118584 }, { "epoch": 0.74, "learning_rate": 4.413579262963683e-05, "loss": 2.2336, "step": 118592 }, { "epoch": 0.74, "learning_rate": 4.41300032190353e-05, "loss": 2.2383, "step": 118600 }, { "epoch": 0.74, "learning_rate": 4.412421420296369e-05, "loss": 2.2481, "step": 118608 }, { "epoch": 0.74, "learning_rate": 4.411842558156588e-05, "loss": 2.2281, "step": 118616 }, { "epoch": 0.74, "learning_rate": 4.4112637354985785e-05, "loss": 2.2464, "step": 118624 }, { "epoch": 0.74, "learning_rate": 4.410684952336733e-05, "loss": 2.2392, "step": 118632 }, { "epoch": 0.74, "learning_rate": 4.410106208685436e-05, "loss": 2.2334, "step": 118640 }, { "epoch": 0.74, "learning_rate": 4.409527504559078e-05, "loss": 2.2248, "step": 118648 }, { "epoch": 0.74, "learning_rate": 4.4089488399720444e-05, "loss": 2.2376, "step": 118656 }, { "epoch": 0.74, "learning_rate": 4.4083702149387215e-05, "loss": 2.2288, "step": 118664 }, { "epoch": 0.74, "learning_rate": 4.407791629473493e-05, "loss": 2.2391, "step": 118672 }, { "epoch": 0.74, "learning_rate": 4.407213083590743e-05, "loss": 2.2342, "step": 118680 }, { "epoch": 0.74, "learning_rate": 4.406634577304856e-05, "loss": 2.2271, "step": 118688 }, { "epoch": 0.74, "learning_rate": 4.4060561106302116e-05, "loss": 2.2522, "step": 118696 }, { "epoch": 0.74, "learning_rate": 4.405477683581189e-05, "loss": 2.2226, "step": 118704 }, { "epoch": 0.74, "learning_rate": 4.404899296172173e-05, "loss": 2.2393, "step": 118712 }, { "epoch": 0.74, "learning_rate": 4.4043209484175386e-05, "loss": 2.2253, "step": 118720 }, { "epoch": 0.74, "learning_rate": 4.403742640331664e-05, "loss": 2.2342, "step": 118728 }, { "epoch": 0.74, "learning_rate": 4.403164371928925e-05, "loss": 2.2261, "step": 118736 }, { "epoch": 0.74, "learning_rate": 4.402586143223702e-05, "loss": 2.2224, "step": 118744 }, { "epoch": 0.74, "learning_rate": 4.402007954230365e-05, "loss": 2.2447, "step": 118752 }, { "epoch": 0.74, "learning_rate": 4.4014298049632896e-05, "loss": 2.2467, "step": 118760 }, { "epoch": 0.74, "learning_rate": 4.4008516954368496e-05, "loss": 2.2425, "step": 118768 }, { "epoch": 0.74, "learning_rate": 4.4002736256654144e-05, "loss": 2.2268, "step": 118776 }, { "epoch": 0.74, "learning_rate": 4.3996955956633565e-05, "loss": 2.2385, "step": 118784 }, { "epoch": 0.74, "learning_rate": 4.3991176054450464e-05, "loss": 2.2352, "step": 118792 }, { "epoch": 0.74, "learning_rate": 4.398539655024852e-05, "loss": 2.2399, "step": 118800 }, { "epoch": 0.74, "learning_rate": 4.3979617444171414e-05, "loss": 2.2274, "step": 118808 }, { "epoch": 0.74, "learning_rate": 4.397383873636281e-05, "loss": 2.2419, "step": 118816 }, { "epoch": 0.74, "learning_rate": 4.3968060426966385e-05, "loss": 2.2312, "step": 118824 }, { "epoch": 0.74, "learning_rate": 4.3962282516125765e-05, "loss": 2.2269, "step": 118832 }, { "epoch": 0.74, "learning_rate": 4.3956505003984604e-05, "loss": 2.2443, "step": 118840 }, { "epoch": 0.74, "learning_rate": 4.3950727890686545e-05, "loss": 2.2357, "step": 118848 }, { "epoch": 0.74, "learning_rate": 4.394495117637516e-05, "loss": 2.232, "step": 118856 }, { "epoch": 0.74, "learning_rate": 4.393917486119411e-05, "loss": 2.2361, "step": 118864 }, { "epoch": 0.74, "learning_rate": 4.393339894528697e-05, "loss": 2.2439, "step": 118872 }, { "epoch": 0.74, "learning_rate": 4.392762342879735e-05, "loss": 2.2398, "step": 118880 }, { "epoch": 0.74, "learning_rate": 4.392184831186879e-05, "loss": 2.2352, "step": 118888 }, { "epoch": 0.74, "learning_rate": 4.3916073594644895e-05, "loss": 2.2429, "step": 118896 }, { "epoch": 0.74, "learning_rate": 4.391029927726923e-05, "loss": 2.2409, "step": 118904 }, { "epoch": 0.74, "learning_rate": 4.390452535988532e-05, "loss": 2.2325, "step": 118912 }, { "epoch": 0.74, "learning_rate": 4.38987518426367e-05, "loss": 2.2411, "step": 118920 }, { "epoch": 0.74, "learning_rate": 4.389297872566694e-05, "loss": 2.2531, "step": 118928 }, { "epoch": 0.74, "learning_rate": 4.388720600911953e-05, "loss": 2.2405, "step": 118936 }, { "epoch": 0.74, "learning_rate": 4.388143369313798e-05, "loss": 2.2421, "step": 118944 }, { "epoch": 0.74, "learning_rate": 4.387566177786577e-05, "loss": 2.2462, "step": 118952 }, { "epoch": 0.74, "learning_rate": 4.386989026344647e-05, "loss": 2.2607, "step": 118960 }, { "epoch": 0.74, "learning_rate": 4.386411915002348e-05, "loss": 2.2363, "step": 118968 }, { "epoch": 0.74, "learning_rate": 4.3858348437740296e-05, "loss": 2.2367, "step": 118976 }, { "epoch": 0.74, "learning_rate": 4.385257812674039e-05, "loss": 2.2622, "step": 118984 }, { "epoch": 0.74, "learning_rate": 4.3846808217167196e-05, "loss": 2.2296, "step": 118992 }, { "epoch": 0.74, "learning_rate": 4.384103870916416e-05, "loss": 2.2415, "step": 119000 }, { "epoch": 0.74, "learning_rate": 4.3835269602874716e-05, "loss": 2.2218, "step": 119008 }, { "epoch": 0.74, "learning_rate": 4.38295008984423e-05, "loss": 2.2212, "step": 119016 }, { "epoch": 0.74, "learning_rate": 4.3823732596010294e-05, "loss": 2.2352, "step": 119024 }, { "epoch": 0.74, "learning_rate": 4.38179646957221e-05, "loss": 2.2451, "step": 119032 }, { "epoch": 0.74, "learning_rate": 4.381219719772114e-05, "loss": 2.2341, "step": 119040 }, { "epoch": 0.74, "learning_rate": 4.380643010215076e-05, "loss": 2.2446, "step": 119048 }, { "epoch": 0.74, "learning_rate": 4.380066340915434e-05, "loss": 2.2503, "step": 119056 }, { "epoch": 0.74, "learning_rate": 4.3794897118875275e-05, "loss": 2.2366, "step": 119064 }, { "epoch": 0.74, "learning_rate": 4.378913123145685e-05, "loss": 2.2427, "step": 119072 }, { "epoch": 0.74, "learning_rate": 4.378336574704245e-05, "loss": 2.2333, "step": 119080 }, { "epoch": 0.74, "learning_rate": 4.37776006657754e-05, "loss": 2.2441, "step": 119088 }, { "epoch": 0.74, "learning_rate": 4.377183598779903e-05, "loss": 2.2401, "step": 119096 }, { "epoch": 0.74, "learning_rate": 4.376607171325662e-05, "loss": 2.2468, "step": 119104 }, { "epoch": 0.74, "learning_rate": 4.3760307842291495e-05, "loss": 2.2295, "step": 119112 }, { "epoch": 0.74, "learning_rate": 4.3754544375046954e-05, "loss": 2.2089, "step": 119120 }, { "epoch": 0.74, "learning_rate": 4.3748781311666246e-05, "loss": 2.2498, "step": 119128 }, { "epoch": 0.74, "learning_rate": 4.374301865229265e-05, "loss": 2.2333, "step": 119136 }, { "epoch": 0.74, "learning_rate": 4.373725639706944e-05, "loss": 2.2448, "step": 119144 }, { "epoch": 0.74, "learning_rate": 4.3731494546139885e-05, "loss": 2.2472, "step": 119152 }, { "epoch": 0.74, "learning_rate": 4.3725733099647176e-05, "loss": 2.2299, "step": 119160 }, { "epoch": 0.74, "learning_rate": 4.371997205773457e-05, "loss": 2.2277, "step": 119168 }, { "epoch": 0.74, "learning_rate": 4.37142114205453e-05, "loss": 2.2376, "step": 119176 }, { "epoch": 0.74, "learning_rate": 4.370845118822254e-05, "loss": 2.2361, "step": 119184 }, { "epoch": 0.74, "learning_rate": 4.3702691360909524e-05, "loss": 2.2381, "step": 119192 }, { "epoch": 0.74, "learning_rate": 4.369693193874943e-05, "loss": 2.2589, "step": 119200 }, { "epoch": 0.75, "learning_rate": 4.3691172921885435e-05, "loss": 2.2403, "step": 119208 }, { "epoch": 0.75, "learning_rate": 4.368541431046071e-05, "loss": 2.2474, "step": 119216 }, { "epoch": 0.75, "learning_rate": 4.367965610461841e-05, "loss": 2.23, "step": 119224 }, { "epoch": 0.75, "learning_rate": 4.36738983045017e-05, "loss": 2.2291, "step": 119232 }, { "epoch": 0.75, "learning_rate": 4.366814091025371e-05, "loss": 2.2353, "step": 119240 }, { "epoch": 0.75, "learning_rate": 4.366238392201756e-05, "loss": 2.245, "step": 119248 }, { "epoch": 0.75, "learning_rate": 4.3656627339936384e-05, "loss": 2.2144, "step": 119256 }, { "epoch": 0.75, "learning_rate": 4.3650871164153284e-05, "loss": 2.2309, "step": 119264 }, { "epoch": 0.75, "learning_rate": 4.364511539481136e-05, "loss": 2.242, "step": 119272 }, { "epoch": 0.75, "learning_rate": 4.3639360032053724e-05, "loss": 2.2557, "step": 119280 }, { "epoch": 0.75, "learning_rate": 4.3633605076023405e-05, "loss": 2.2385, "step": 119288 }, { "epoch": 0.75, "learning_rate": 4.3627850526863505e-05, "loss": 2.225, "step": 119296 }, { "epoch": 0.75, "learning_rate": 4.362209638471708e-05, "loss": 2.2499, "step": 119304 }, { "epoch": 0.75, "learning_rate": 4.361634264972719e-05, "loss": 2.2424, "step": 119312 }, { "epoch": 0.75, "learning_rate": 4.3610589322036846e-05, "loss": 2.2473, "step": 119320 }, { "epoch": 0.75, "learning_rate": 4.360483640178909e-05, "loss": 2.2518, "step": 119328 }, { "epoch": 0.75, "learning_rate": 4.359908388912695e-05, "loss": 2.2506, "step": 119336 }, { "epoch": 0.75, "learning_rate": 4.359333178419342e-05, "loss": 2.2318, "step": 119344 }, { "epoch": 0.75, "learning_rate": 4.35875800871315e-05, "loss": 2.2351, "step": 119352 }, { "epoch": 0.75, "learning_rate": 4.358182879808417e-05, "loss": 2.244, "step": 119360 }, { "epoch": 0.75, "learning_rate": 4.357607791719445e-05, "loss": 2.2307, "step": 119368 }, { "epoch": 0.75, "learning_rate": 4.3570327444605255e-05, "loss": 2.2227, "step": 119376 }, { "epoch": 0.75, "learning_rate": 4.3564577380459556e-05, "loss": 2.2409, "step": 119384 }, { "epoch": 0.75, "learning_rate": 4.355882772490032e-05, "loss": 2.2342, "step": 119392 }, { "epoch": 0.75, "learning_rate": 4.3553078478070465e-05, "loss": 2.2367, "step": 119400 }, { "epoch": 0.75, "learning_rate": 4.3547329640112924e-05, "loss": 2.2443, "step": 119408 }, { "epoch": 0.75, "learning_rate": 4.354158121117062e-05, "loss": 2.2355, "step": 119416 }, { "epoch": 0.75, "learning_rate": 4.3535833191386445e-05, "loss": 2.2384, "step": 119424 }, { "epoch": 0.75, "learning_rate": 4.3530085580903304e-05, "loss": 2.2284, "step": 119432 }, { "epoch": 0.75, "learning_rate": 4.352433837986409e-05, "loss": 2.2476, "step": 119440 }, { "epoch": 0.75, "learning_rate": 4.351859158841167e-05, "loss": 2.2391, "step": 119448 }, { "epoch": 0.75, "learning_rate": 4.351284520668891e-05, "loss": 2.2429, "step": 119456 }, { "epoch": 0.75, "learning_rate": 4.350709923483867e-05, "loss": 2.2418, "step": 119464 }, { "epoch": 0.75, "learning_rate": 4.350135367300381e-05, "loss": 2.24, "step": 119472 }, { "epoch": 0.75, "learning_rate": 4.349560852132712e-05, "loss": 2.2211, "step": 119480 }, { "epoch": 0.75, "learning_rate": 4.3489863779951465e-05, "loss": 2.2465, "step": 119488 }, { "epoch": 0.75, "learning_rate": 4.348411944901965e-05, "loss": 2.2397, "step": 119496 }, { "epoch": 0.75, "learning_rate": 4.347837552867449e-05, "loss": 2.2429, "step": 119504 }, { "epoch": 0.75, "learning_rate": 4.347263201905876e-05, "loss": 2.2405, "step": 119512 }, { "epoch": 0.75, "learning_rate": 4.346688892031524e-05, "loss": 2.2344, "step": 119520 }, { "epoch": 0.75, "learning_rate": 4.346114623258674e-05, "loss": 2.2427, "step": 119528 }, { "epoch": 0.75, "learning_rate": 4.3455403956015986e-05, "loss": 2.2406, "step": 119536 }, { "epoch": 0.75, "learning_rate": 4.344966209074574e-05, "loss": 2.2486, "step": 119544 }, { "epoch": 0.75, "learning_rate": 4.344392063691876e-05, "loss": 2.2427, "step": 119552 }, { "epoch": 0.75, "learning_rate": 4.343817959467777e-05, "loss": 2.2552, "step": 119560 }, { "epoch": 0.75, "learning_rate": 4.3432438964165486e-05, "loss": 2.2353, "step": 119568 }, { "epoch": 0.75, "learning_rate": 4.342669874552463e-05, "loss": 2.251, "step": 119576 }, { "epoch": 0.75, "learning_rate": 4.3420958938897914e-05, "loss": 2.2508, "step": 119584 }, { "epoch": 0.75, "learning_rate": 4.341521954442801e-05, "loss": 2.2474, "step": 119592 }, { "epoch": 0.75, "learning_rate": 4.340948056225761e-05, "loss": 2.2453, "step": 119600 }, { "epoch": 0.75, "learning_rate": 4.340374199252939e-05, "loss": 2.2543, "step": 119608 }, { "epoch": 0.75, "learning_rate": 4.3398003835385995e-05, "loss": 2.2389, "step": 119616 }, { "epoch": 0.75, "learning_rate": 4.339226609097009e-05, "loss": 2.2222, "step": 119624 }, { "epoch": 0.75, "learning_rate": 4.338652875942433e-05, "loss": 2.2276, "step": 119632 }, { "epoch": 0.75, "learning_rate": 4.338079184089131e-05, "loss": 2.2299, "step": 119640 }, { "epoch": 0.75, "learning_rate": 4.337505533551367e-05, "loss": 2.2461, "step": 119648 }, { "epoch": 0.75, "learning_rate": 4.336931924343403e-05, "loss": 2.2367, "step": 119656 }, { "epoch": 0.75, "learning_rate": 4.3363583564794975e-05, "loss": 2.2367, "step": 119664 }, { "epoch": 0.75, "learning_rate": 4.33578482997391e-05, "loss": 2.2421, "step": 119672 }, { "epoch": 0.75, "learning_rate": 4.335211344840897e-05, "loss": 2.2253, "step": 119680 }, { "epoch": 0.75, "learning_rate": 4.33463790109472e-05, "loss": 2.2359, "step": 119688 }, { "epoch": 0.75, "learning_rate": 4.334064498749628e-05, "loss": 2.2182, "step": 119696 }, { "epoch": 0.75, "learning_rate": 4.333491137819882e-05, "loss": 2.2401, "step": 119704 }, { "epoch": 0.75, "learning_rate": 4.3329178183197314e-05, "loss": 2.2467, "step": 119712 }, { "epoch": 0.75, "learning_rate": 4.332344540263433e-05, "loss": 2.2355, "step": 119720 }, { "epoch": 0.75, "learning_rate": 4.331771303665235e-05, "loss": 2.2497, "step": 119728 }, { "epoch": 0.75, "learning_rate": 4.3311981085393894e-05, "loss": 2.2222, "step": 119736 }, { "epoch": 0.75, "learning_rate": 4.330624954900147e-05, "loss": 2.2194, "step": 119744 }, { "epoch": 0.75, "learning_rate": 4.3300518427617556e-05, "loss": 2.2418, "step": 119752 }, { "epoch": 0.75, "learning_rate": 4.3294787721384604e-05, "loss": 2.2475, "step": 119760 }, { "epoch": 0.75, "learning_rate": 4.3289057430445136e-05, "loss": 2.242, "step": 119768 }, { "epoch": 0.75, "learning_rate": 4.3283327554941564e-05, "loss": 2.2459, "step": 119776 }, { "epoch": 0.75, "learning_rate": 4.327759809501632e-05, "loss": 2.2358, "step": 119784 }, { "epoch": 0.75, "learning_rate": 4.32718690508119e-05, "loss": 2.2397, "step": 119792 }, { "epoch": 0.75, "learning_rate": 4.326614042247068e-05, "loss": 2.2152, "step": 119800 }, { "epoch": 0.75, "learning_rate": 4.3260412210135074e-05, "loss": 2.2361, "step": 119808 }, { "epoch": 0.75, "learning_rate": 4.325468441394751e-05, "loss": 2.2397, "step": 119816 }, { "epoch": 0.75, "learning_rate": 4.324895703405037e-05, "loss": 2.2237, "step": 119824 }, { "epoch": 0.75, "learning_rate": 4.3243230070586035e-05, "loss": 2.2385, "step": 119832 }, { "epoch": 0.75, "learning_rate": 4.323750352369688e-05, "loss": 2.2285, "step": 119840 }, { "epoch": 0.75, "learning_rate": 4.3231777393525265e-05, "loss": 2.2374, "step": 119848 }, { "epoch": 0.75, "learning_rate": 4.3226051680213564e-05, "loss": 2.2396, "step": 119856 }, { "epoch": 0.75, "learning_rate": 4.322032638390408e-05, "loss": 2.2275, "step": 119864 }, { "epoch": 0.75, "learning_rate": 4.321460150473916e-05, "loss": 2.2333, "step": 119872 }, { "epoch": 0.75, "learning_rate": 4.3208877042861164e-05, "loss": 2.2449, "step": 119880 }, { "epoch": 0.75, "learning_rate": 4.320315299841233e-05, "loss": 2.2402, "step": 119888 }, { "epoch": 0.75, "learning_rate": 4.319742937153502e-05, "loss": 2.2254, "step": 119896 }, { "epoch": 0.75, "learning_rate": 4.3191706162371505e-05, "loss": 2.2383, "step": 119904 }, { "epoch": 0.75, "learning_rate": 4.318598337106403e-05, "loss": 2.2535, "step": 119912 }, { "epoch": 0.75, "learning_rate": 4.3180260997754926e-05, "loss": 2.2504, "step": 119920 }, { "epoch": 0.75, "learning_rate": 4.3174539042586396e-05, "loss": 2.2439, "step": 119928 }, { "epoch": 0.75, "learning_rate": 4.316881750570073e-05, "loss": 2.2384, "step": 119936 }, { "epoch": 0.75, "learning_rate": 4.316309638724015e-05, "loss": 2.2489, "step": 119944 }, { "epoch": 0.75, "learning_rate": 4.315737568734687e-05, "loss": 2.2351, "step": 119952 }, { "epoch": 0.75, "learning_rate": 4.315165540616313e-05, "loss": 2.2338, "step": 119960 }, { "epoch": 0.75, "learning_rate": 4.314593554383113e-05, "loss": 2.2322, "step": 119968 }, { "epoch": 0.75, "learning_rate": 4.3140216100493054e-05, "loss": 2.2465, "step": 119976 }, { "epoch": 0.75, "learning_rate": 4.313449707629111e-05, "loss": 2.2401, "step": 119984 }, { "epoch": 0.75, "learning_rate": 4.312877847136745e-05, "loss": 2.2424, "step": 119992 }, { "epoch": 0.75, "learning_rate": 4.3123060285864246e-05, "loss": 2.2424, "step": 120000 }, { "epoch": 0.75, "learning_rate": 4.311734251992367e-05, "loss": 2.2302, "step": 120008 }, { "epoch": 0.75, "learning_rate": 4.311162517368785e-05, "loss": 2.2293, "step": 120016 }, { "epoch": 0.75, "learning_rate": 4.310590824729891e-05, "loss": 2.237, "step": 120024 }, { "epoch": 0.75, "learning_rate": 4.310019174089901e-05, "loss": 2.2457, "step": 120032 }, { "epoch": 0.75, "learning_rate": 4.3094475654630223e-05, "loss": 2.2348, "step": 120040 }, { "epoch": 0.75, "learning_rate": 4.308875998863467e-05, "loss": 2.2471, "step": 120048 }, { "epoch": 0.75, "learning_rate": 4.308304474305444e-05, "loss": 2.2331, "step": 120056 }, { "epoch": 0.75, "learning_rate": 4.307732991803161e-05, "loss": 2.2436, "step": 120064 }, { "epoch": 0.75, "learning_rate": 4.307161551370829e-05, "loss": 2.2329, "step": 120072 }, { "epoch": 0.75, "learning_rate": 4.3065901530226463e-05, "loss": 2.2487, "step": 120080 }, { "epoch": 0.75, "learning_rate": 4.306018796772823e-05, "loss": 2.2293, "step": 120088 }, { "epoch": 0.75, "learning_rate": 4.305447482635566e-05, "loss": 2.2336, "step": 120096 }, { "epoch": 0.75, "learning_rate": 4.304876210625072e-05, "loss": 2.2543, "step": 120104 }, { "epoch": 0.75, "learning_rate": 4.304304980755546e-05, "loss": 2.2569, "step": 120112 }, { "epoch": 0.75, "learning_rate": 4.303733793041189e-05, "loss": 2.2294, "step": 120120 }, { "epoch": 0.75, "learning_rate": 4.303162647496199e-05, "loss": 2.2579, "step": 120128 }, { "epoch": 0.75, "learning_rate": 4.3025915441347776e-05, "loss": 2.2319, "step": 120136 }, { "epoch": 0.75, "learning_rate": 4.302020482971119e-05, "loss": 2.2499, "step": 120144 }, { "epoch": 0.75, "learning_rate": 4.301449464019423e-05, "loss": 2.256, "step": 120152 }, { "epoch": 0.75, "learning_rate": 4.300878487293884e-05, "loss": 2.2389, "step": 120160 }, { "epoch": 0.75, "learning_rate": 4.300307552808695e-05, "loss": 2.2488, "step": 120168 }, { "epoch": 0.75, "learning_rate": 4.2997366605780525e-05, "loss": 2.2589, "step": 120176 }, { "epoch": 0.75, "learning_rate": 4.2991658106161474e-05, "loss": 2.2407, "step": 120184 }, { "epoch": 0.75, "learning_rate": 4.298595002937169e-05, "loss": 2.2353, "step": 120192 }, { "epoch": 0.75, "learning_rate": 4.298024237555312e-05, "loss": 2.2327, "step": 120200 }, { "epoch": 0.75, "learning_rate": 4.297453514484763e-05, "loss": 2.2398, "step": 120208 }, { "epoch": 0.75, "learning_rate": 4.29688283373971e-05, "loss": 2.2373, "step": 120216 }, { "epoch": 0.75, "learning_rate": 4.2963121953343415e-05, "loss": 2.2394, "step": 120224 }, { "epoch": 0.75, "learning_rate": 4.295741599282843e-05, "loss": 2.2436, "step": 120232 }, { "epoch": 0.75, "learning_rate": 4.295171045599398e-05, "loss": 2.2442, "step": 120240 }, { "epoch": 0.75, "learning_rate": 4.2946005342981935e-05, "loss": 2.2276, "step": 120248 }, { "epoch": 0.75, "learning_rate": 4.2940300653934114e-05, "loss": 2.2337, "step": 120256 }, { "epoch": 0.75, "learning_rate": 4.2934596388992335e-05, "loss": 2.2668, "step": 120264 }, { "epoch": 0.75, "learning_rate": 4.2928892548298386e-05, "loss": 2.239, "step": 120272 }, { "epoch": 0.75, "learning_rate": 4.292318913199408e-05, "loss": 2.2422, "step": 120280 }, { "epoch": 0.75, "learning_rate": 4.291748614022124e-05, "loss": 2.2296, "step": 120288 }, { "epoch": 0.75, "learning_rate": 4.2911783573121586e-05, "loss": 2.2286, "step": 120296 }, { "epoch": 0.75, "learning_rate": 4.2906081430836905e-05, "loss": 2.2441, "step": 120304 }, { "epoch": 0.75, "learning_rate": 4.2900379713509e-05, "loss": 2.2256, "step": 120312 }, { "epoch": 0.75, "learning_rate": 4.289467842127953e-05, "loss": 2.2392, "step": 120320 }, { "epoch": 0.75, "learning_rate": 4.288897755429029e-05, "loss": 2.2344, "step": 120328 }, { "epoch": 0.75, "learning_rate": 4.288327711268298e-05, "loss": 2.2452, "step": 120336 }, { "epoch": 0.75, "learning_rate": 4.2877577096599325e-05, "loss": 2.2176, "step": 120344 }, { "epoch": 0.75, "learning_rate": 4.287187750618103e-05, "loss": 2.2541, "step": 120352 }, { "epoch": 0.75, "learning_rate": 4.286617834156977e-05, "loss": 2.2463, "step": 120360 }, { "epoch": 0.75, "learning_rate": 4.286047960290725e-05, "loss": 2.2361, "step": 120368 }, { "epoch": 0.75, "learning_rate": 4.2854781290335135e-05, "loss": 2.238, "step": 120376 }, { "epoch": 0.75, "learning_rate": 4.284908340399506e-05, "loss": 2.2314, "step": 120384 }, { "epoch": 0.75, "learning_rate": 4.284338594402871e-05, "loss": 2.2317, "step": 120392 }, { "epoch": 0.75, "learning_rate": 4.283768891057771e-05, "loss": 2.2364, "step": 120400 }, { "epoch": 0.75, "learning_rate": 4.283199230378368e-05, "loss": 2.2312, "step": 120408 }, { "epoch": 0.75, "learning_rate": 4.2826296123788264e-05, "loss": 2.2352, "step": 120416 }, { "epoch": 0.75, "learning_rate": 4.2820600370733054e-05, "loss": 2.2366, "step": 120424 }, { "epoch": 0.75, "learning_rate": 4.281490504475962e-05, "loss": 2.2354, "step": 120432 }, { "epoch": 0.75, "learning_rate": 4.2809210146009606e-05, "loss": 2.2376, "step": 120440 }, { "epoch": 0.75, "learning_rate": 4.280351567462454e-05, "loss": 2.2498, "step": 120448 }, { "epoch": 0.75, "learning_rate": 4.2797821630745994e-05, "loss": 2.2458, "step": 120456 }, { "epoch": 0.75, "learning_rate": 4.279212801451555e-05, "loss": 2.2287, "step": 120464 }, { "epoch": 0.75, "learning_rate": 4.278643482607474e-05, "loss": 2.2295, "step": 120472 }, { "epoch": 0.75, "learning_rate": 4.2780742065565083e-05, "loss": 2.2275, "step": 120480 }, { "epoch": 0.75, "learning_rate": 4.2775049733128094e-05, "loss": 2.2439, "step": 120488 }, { "epoch": 0.75, "learning_rate": 4.2769357828905304e-05, "loss": 2.2272, "step": 120496 }, { "epoch": 0.75, "learning_rate": 4.276366635303824e-05, "loss": 2.2526, "step": 120504 }, { "epoch": 0.75, "learning_rate": 4.2757975305668344e-05, "loss": 2.2385, "step": 120512 }, { "epoch": 0.75, "learning_rate": 4.27522846869371e-05, "loss": 2.2371, "step": 120520 }, { "epoch": 0.75, "learning_rate": 4.2746594496986036e-05, "loss": 2.245, "step": 120528 }, { "epoch": 0.75, "learning_rate": 4.274090473595653e-05, "loss": 2.2336, "step": 120536 }, { "epoch": 0.75, "learning_rate": 4.273521540399009e-05, "loss": 2.2528, "step": 120544 }, { "epoch": 0.75, "learning_rate": 4.2729526501228124e-05, "loss": 2.2311, "step": 120552 }, { "epoch": 0.75, "learning_rate": 4.2723838027812066e-05, "loss": 2.2538, "step": 120560 }, { "epoch": 0.75, "learning_rate": 4.271814998388335e-05, "loss": 2.2269, "step": 120568 }, { "epoch": 0.75, "learning_rate": 4.2712462369583335e-05, "loss": 2.2515, "step": 120576 }, { "epoch": 0.75, "learning_rate": 4.2706775185053464e-05, "loss": 2.2517, "step": 120584 }, { "epoch": 0.75, "learning_rate": 4.2701088430435104e-05, "loss": 2.2275, "step": 120592 }, { "epoch": 0.75, "learning_rate": 4.2695402105869615e-05, "loss": 2.2432, "step": 120600 }, { "epoch": 0.75, "learning_rate": 4.268971621149838e-05, "loss": 2.2357, "step": 120608 }, { "epoch": 0.75, "learning_rate": 4.268403074746274e-05, "loss": 2.2279, "step": 120616 }, { "epoch": 0.75, "learning_rate": 4.267834571390403e-05, "loss": 2.2361, "step": 120624 }, { "epoch": 0.75, "learning_rate": 4.26726611109636e-05, "loss": 2.2376, "step": 120632 }, { "epoch": 0.75, "learning_rate": 4.266697693878277e-05, "loss": 2.2478, "step": 120640 }, { "epoch": 0.75, "learning_rate": 4.266129319750281e-05, "loss": 2.2326, "step": 120648 }, { "epoch": 0.75, "learning_rate": 4.2655609887265064e-05, "loss": 2.2275, "step": 120656 }, { "epoch": 0.75, "learning_rate": 4.26499270082108e-05, "loss": 2.2508, "step": 120664 }, { "epoch": 0.75, "learning_rate": 4.264424456048129e-05, "loss": 2.2244, "step": 120672 }, { "epoch": 0.75, "learning_rate": 4.263856254421781e-05, "loss": 2.2497, "step": 120680 }, { "epoch": 0.75, "learning_rate": 4.2632880959561615e-05, "loss": 2.2488, "step": 120688 }, { "epoch": 0.75, "learning_rate": 4.262719980665397e-05, "loss": 2.2215, "step": 120696 }, { "epoch": 0.75, "learning_rate": 4.262151908563605e-05, "loss": 2.2582, "step": 120704 }, { "epoch": 0.75, "learning_rate": 4.261583879664913e-05, "loss": 2.243, "step": 120712 }, { "epoch": 0.75, "learning_rate": 4.2610158939834425e-05, "loss": 2.248, "step": 120720 }, { "epoch": 0.75, "learning_rate": 4.2604479515333094e-05, "loss": 2.2442, "step": 120728 }, { "epoch": 0.75, "learning_rate": 4.2598800523286366e-05, "loss": 2.2544, "step": 120736 }, { "epoch": 0.75, "learning_rate": 4.259312196383541e-05, "loss": 2.2344, "step": 120744 }, { "epoch": 0.75, "learning_rate": 4.258744383712139e-05, "loss": 2.2337, "step": 120752 }, { "epoch": 0.75, "learning_rate": 4.2581766143285476e-05, "loss": 2.2331, "step": 120760 }, { "epoch": 0.75, "learning_rate": 4.2576088882468795e-05, "loss": 2.244, "step": 120768 }, { "epoch": 0.75, "learning_rate": 4.257041205481252e-05, "loss": 2.237, "step": 120776 }, { "epoch": 0.75, "learning_rate": 4.256473566045775e-05, "loss": 2.2368, "step": 120784 }, { "epoch": 0.75, "learning_rate": 4.25590596995456e-05, "loss": 2.2397, "step": 120792 }, { "epoch": 0.76, "learning_rate": 4.2553384172217195e-05, "loss": 2.2382, "step": 120800 }, { "epoch": 0.76, "learning_rate": 4.2547709078613606e-05, "loss": 2.2513, "step": 120808 }, { "epoch": 0.76, "learning_rate": 4.254203441887592e-05, "loss": 2.2378, "step": 120816 }, { "epoch": 0.76, "learning_rate": 4.253636019314524e-05, "loss": 2.2435, "step": 120824 }, { "epoch": 0.76, "learning_rate": 4.25306864015626e-05, "loss": 2.2299, "step": 120832 }, { "epoch": 0.76, "learning_rate": 4.252501304426904e-05, "loss": 2.2358, "step": 120840 }, { "epoch": 0.76, "learning_rate": 4.2519340121405626e-05, "loss": 2.237, "step": 120848 }, { "epoch": 0.76, "learning_rate": 4.251366763311338e-05, "loss": 2.2352, "step": 120856 }, { "epoch": 0.76, "learning_rate": 4.250799557953331e-05, "loss": 2.2487, "step": 120864 }, { "epoch": 0.76, "learning_rate": 4.2502323960806444e-05, "loss": 2.2536, "step": 120872 }, { "epoch": 0.76, "learning_rate": 4.249665277707377e-05, "loss": 2.2294, "step": 120880 }, { "epoch": 0.76, "learning_rate": 4.2490982028476266e-05, "loss": 2.2296, "step": 120888 }, { "epoch": 0.76, "learning_rate": 4.24853117151549e-05, "loss": 2.2442, "step": 120896 }, { "epoch": 0.76, "learning_rate": 4.2479641837250656e-05, "loss": 2.2395, "step": 120904 }, { "epoch": 0.76, "learning_rate": 4.2473972394904504e-05, "loss": 2.238, "step": 120912 }, { "epoch": 0.76, "learning_rate": 4.2468303388257334e-05, "loss": 2.2343, "step": 120920 }, { "epoch": 0.76, "learning_rate": 4.2462634817450114e-05, "loss": 2.2327, "step": 120928 }, { "epoch": 0.76, "learning_rate": 4.245696668262379e-05, "loss": 2.2314, "step": 120936 }, { "epoch": 0.76, "learning_rate": 4.245129898391921e-05, "loss": 2.2238, "step": 120944 }, { "epoch": 0.76, "learning_rate": 4.2445631721477325e-05, "loss": 2.2421, "step": 120952 }, { "epoch": 0.76, "learning_rate": 4.2439964895439e-05, "loss": 2.2497, "step": 120960 }, { "epoch": 0.76, "learning_rate": 4.243429850594511e-05, "loss": 2.224, "step": 120968 }, { "epoch": 0.76, "learning_rate": 4.242863255313654e-05, "loss": 2.2223, "step": 120976 }, { "epoch": 0.76, "learning_rate": 4.242296703715412e-05, "loss": 2.2326, "step": 120984 }, { "epoch": 0.76, "learning_rate": 4.241730195813873e-05, "loss": 2.2326, "step": 120992 }, { "epoch": 0.76, "learning_rate": 4.241163731623118e-05, "loss": 2.2274, "step": 121000 }, { "epoch": 0.76, "learning_rate": 4.2405973111572284e-05, "loss": 2.2239, "step": 121008 }, { "epoch": 0.76, "learning_rate": 4.2400309344302893e-05, "loss": 2.2325, "step": 121016 }, { "epoch": 0.76, "learning_rate": 4.2394646014563784e-05, "loss": 2.2412, "step": 121024 }, { "epoch": 0.76, "learning_rate": 4.238898312249573e-05, "loss": 2.2328, "step": 121032 }, { "epoch": 0.76, "learning_rate": 4.238332066823956e-05, "loss": 2.2379, "step": 121040 }, { "epoch": 0.76, "learning_rate": 4.2377658651936e-05, "loss": 2.2459, "step": 121048 }, { "epoch": 0.76, "learning_rate": 4.2371997073725814e-05, "loss": 2.2265, "step": 121056 }, { "epoch": 0.76, "learning_rate": 4.236633593374977e-05, "loss": 2.2424, "step": 121064 }, { "epoch": 0.76, "learning_rate": 4.2360675232148604e-05, "loss": 2.2198, "step": 121072 }, { "epoch": 0.76, "learning_rate": 4.235501496906301e-05, "loss": 2.2285, "step": 121080 }, { "epoch": 0.76, "learning_rate": 4.234935514463374e-05, "loss": 2.238, "step": 121088 }, { "epoch": 0.76, "learning_rate": 4.2343695759001476e-05, "loss": 2.2291, "step": 121096 }, { "epoch": 0.76, "learning_rate": 4.233803681230692e-05, "loss": 2.2323, "step": 121104 }, { "epoch": 0.76, "learning_rate": 4.233237830469073e-05, "loss": 2.245, "step": 121112 }, { "epoch": 0.76, "learning_rate": 4.232672023629361e-05, "loss": 2.2391, "step": 121120 }, { "epoch": 0.76, "learning_rate": 4.232106260725622e-05, "loss": 2.2356, "step": 121128 }, { "epoch": 0.76, "learning_rate": 4.231540541771918e-05, "loss": 2.2399, "step": 121136 }, { "epoch": 0.76, "learning_rate": 4.230974866782314e-05, "loss": 2.2585, "step": 121144 }, { "epoch": 0.76, "learning_rate": 4.230409235770877e-05, "loss": 2.2262, "step": 121152 }, { "epoch": 0.76, "learning_rate": 4.2298436487516616e-05, "loss": 2.238, "step": 121160 }, { "epoch": 0.76, "learning_rate": 4.2292781057387327e-05, "loss": 2.2274, "step": 121168 }, { "epoch": 0.76, "learning_rate": 4.2287126067461493e-05, "loss": 2.2311, "step": 121176 }, { "epoch": 0.76, "learning_rate": 4.228147151787967e-05, "loss": 2.2387, "step": 121184 }, { "epoch": 0.76, "learning_rate": 4.2275817408782484e-05, "loss": 2.2426, "step": 121192 }, { "epoch": 0.76, "learning_rate": 4.2270163740310434e-05, "loss": 2.2349, "step": 121200 }, { "epoch": 0.76, "learning_rate": 4.226451051260413e-05, "loss": 2.2347, "step": 121208 }, { "epoch": 0.76, "learning_rate": 4.225885772580407e-05, "loss": 2.233, "step": 121216 }, { "epoch": 0.76, "learning_rate": 4.22532053800508e-05, "loss": 2.2367, "step": 121224 }, { "epoch": 0.76, "learning_rate": 4.2247553475484835e-05, "loss": 2.2302, "step": 121232 }, { "epoch": 0.76, "learning_rate": 4.224190201224669e-05, "loss": 2.241, "step": 121240 }, { "epoch": 0.76, "learning_rate": 4.2236250990476836e-05, "loss": 2.247, "step": 121248 }, { "epoch": 0.76, "learning_rate": 4.22306004103158e-05, "loss": 2.2117, "step": 121256 }, { "epoch": 0.76, "learning_rate": 4.222495027190402e-05, "loss": 2.2494, "step": 121264 }, { "epoch": 0.76, "learning_rate": 4.221930057538196e-05, "loss": 2.2305, "step": 121272 }, { "epoch": 0.76, "learning_rate": 4.2213651320890095e-05, "loss": 2.246, "step": 121280 }, { "epoch": 0.76, "learning_rate": 4.220800250856885e-05, "loss": 2.2372, "step": 121288 }, { "epoch": 0.76, "learning_rate": 4.2202354138558654e-05, "loss": 2.2278, "step": 121296 }, { "epoch": 0.76, "learning_rate": 4.2196706210999944e-05, "loss": 2.2454, "step": 121304 }, { "epoch": 0.76, "learning_rate": 4.2191058726033113e-05, "loss": 2.2324, "step": 121312 }, { "epoch": 0.76, "learning_rate": 4.218541168379856e-05, "loss": 2.2285, "step": 121320 }, { "epoch": 0.76, "learning_rate": 4.217976508443666e-05, "loss": 2.2475, "step": 121328 }, { "epoch": 0.76, "learning_rate": 4.217411892808779e-05, "loss": 2.2335, "step": 121336 }, { "epoch": 0.76, "learning_rate": 4.216847321489236e-05, "loss": 2.2391, "step": 121344 }, { "epoch": 0.76, "learning_rate": 4.216282794499065e-05, "loss": 2.2504, "step": 121352 }, { "epoch": 0.76, "learning_rate": 4.215718311852305e-05, "loss": 2.2515, "step": 121360 }, { "epoch": 0.76, "learning_rate": 4.21515387356299e-05, "loss": 2.2317, "step": 121368 }, { "epoch": 0.76, "learning_rate": 4.2145894796451476e-05, "loss": 2.2445, "step": 121376 }, { "epoch": 0.76, "learning_rate": 4.214025130112812e-05, "loss": 2.2447, "step": 121384 }, { "epoch": 0.76, "learning_rate": 4.213460824980011e-05, "loss": 2.2518, "step": 121392 }, { "epoch": 0.76, "learning_rate": 4.212896564260775e-05, "loss": 2.2458, "step": 121400 }, { "epoch": 0.76, "learning_rate": 4.2123323479691326e-05, "loss": 2.244, "step": 121408 }, { "epoch": 0.76, "learning_rate": 4.211768176119106e-05, "loss": 2.2442, "step": 121416 }, { "epoch": 0.76, "learning_rate": 4.211204048724724e-05, "loss": 2.2585, "step": 121424 }, { "epoch": 0.76, "learning_rate": 4.2106399658000114e-05, "loss": 2.2514, "step": 121432 }, { "epoch": 0.76, "learning_rate": 4.2100759273589876e-05, "loss": 2.2506, "step": 121440 }, { "epoch": 0.76, "learning_rate": 4.209511933415678e-05, "loss": 2.2344, "step": 121448 }, { "epoch": 0.76, "learning_rate": 4.208947983984105e-05, "loss": 2.2302, "step": 121456 }, { "epoch": 0.76, "learning_rate": 4.2083840790782825e-05, "loss": 2.2492, "step": 121464 }, { "epoch": 0.76, "learning_rate": 4.207820218712235e-05, "loss": 2.2405, "step": 121472 }, { "epoch": 0.76, "learning_rate": 4.2072564028999775e-05, "loss": 2.2437, "step": 121480 }, { "epoch": 0.76, "learning_rate": 4.206692631655526e-05, "loss": 2.2183, "step": 121488 }, { "epoch": 0.76, "learning_rate": 4.206128904992898e-05, "loss": 2.2277, "step": 121496 }, { "epoch": 0.76, "learning_rate": 4.205565222926107e-05, "loss": 2.2195, "step": 121504 }, { "epoch": 0.76, "learning_rate": 4.205001585469164e-05, "loss": 2.2614, "step": 121512 }, { "epoch": 0.76, "learning_rate": 4.204437992636085e-05, "loss": 2.2192, "step": 121520 }, { "epoch": 0.76, "learning_rate": 4.203874444440879e-05, "loss": 2.2332, "step": 121528 }, { "epoch": 0.76, "learning_rate": 4.2033109408975554e-05, "loss": 2.2423, "step": 121536 }, { "epoch": 0.76, "learning_rate": 4.202747482020122e-05, "loss": 2.2504, "step": 121544 }, { "epoch": 0.76, "learning_rate": 4.2021840678225875e-05, "loss": 2.2396, "step": 121552 }, { "epoch": 0.76, "learning_rate": 4.201620698318962e-05, "loss": 2.2316, "step": 121560 }, { "epoch": 0.76, "learning_rate": 4.201057373523245e-05, "loss": 2.2436, "step": 121568 }, { "epoch": 0.76, "learning_rate": 4.200494093449445e-05, "loss": 2.236, "step": 121576 }, { "epoch": 0.76, "learning_rate": 4.199930858111564e-05, "loss": 2.2343, "step": 121584 }, { "epoch": 0.76, "learning_rate": 4.1993676675236016e-05, "loss": 2.2296, "step": 121592 }, { "epoch": 0.76, "learning_rate": 4.198804521699563e-05, "loss": 2.2278, "step": 121600 }, { "epoch": 0.76, "learning_rate": 4.198241420653444e-05, "loss": 2.2328, "step": 121608 }, { "epoch": 0.76, "learning_rate": 4.1976783643992476e-05, "loss": 2.258, "step": 121616 }, { "epoch": 0.76, "learning_rate": 4.197115352950969e-05, "loss": 2.2484, "step": 121624 }, { "epoch": 0.76, "learning_rate": 4.1965523863226035e-05, "loss": 2.243, "step": 121632 }, { "epoch": 0.76, "learning_rate": 4.195989464528149e-05, "loss": 2.227, "step": 121640 }, { "epoch": 0.76, "learning_rate": 4.1954265875816004e-05, "loss": 2.227, "step": 121648 }, { "epoch": 0.76, "learning_rate": 4.194863755496947e-05, "loss": 2.2371, "step": 121656 }, { "epoch": 0.76, "learning_rate": 4.1943009682881844e-05, "loss": 2.2414, "step": 121664 }, { "epoch": 0.76, "learning_rate": 4.193738225969302e-05, "loss": 2.2354, "step": 121672 }, { "epoch": 0.76, "learning_rate": 4.193175528554289e-05, "loss": 2.2476, "step": 121680 }, { "epoch": 0.76, "learning_rate": 4.1926128760571356e-05, "loss": 2.238, "step": 121688 }, { "epoch": 0.76, "learning_rate": 4.192050268491831e-05, "loss": 2.2525, "step": 121696 }, { "epoch": 0.76, "learning_rate": 4.191487705872356e-05, "loss": 2.2447, "step": 121704 }, { "epoch": 0.76, "learning_rate": 4.190925188212702e-05, "loss": 2.2366, "step": 121712 }, { "epoch": 0.76, "learning_rate": 4.190362715526851e-05, "loss": 2.2515, "step": 121720 }, { "epoch": 0.76, "learning_rate": 4.189800287828784e-05, "loss": 2.2434, "step": 121728 }, { "epoch": 0.76, "learning_rate": 4.1892379051324865e-05, "loss": 2.2573, "step": 121736 }, { "epoch": 0.76, "learning_rate": 4.1886755674519363e-05, "loss": 2.2427, "step": 121744 }, { "epoch": 0.76, "learning_rate": 4.188113274801117e-05, "loss": 2.24, "step": 121752 }, { "epoch": 0.76, "learning_rate": 4.187551027194003e-05, "loss": 2.2427, "step": 121760 }, { "epoch": 0.76, "learning_rate": 4.186988824644574e-05, "loss": 2.2439, "step": 121768 }, { "epoch": 0.76, "learning_rate": 4.1864266671668096e-05, "loss": 2.2449, "step": 121776 }, { "epoch": 0.76, "learning_rate": 4.185864554774677e-05, "loss": 2.2404, "step": 121784 }, { "epoch": 0.76, "learning_rate": 4.185302487482158e-05, "loss": 2.2501, "step": 121792 }, { "epoch": 0.76, "learning_rate": 4.184740465303223e-05, "loss": 2.2181, "step": 121800 }, { "epoch": 0.76, "learning_rate": 4.18417848825184e-05, "loss": 2.2366, "step": 121808 }, { "epoch": 0.76, "learning_rate": 4.183616556341987e-05, "loss": 2.2384, "step": 121816 }, { "epoch": 0.76, "learning_rate": 4.183054669587629e-05, "loss": 2.2462, "step": 121824 }, { "epoch": 0.76, "learning_rate": 4.182492828002736e-05, "loss": 2.2434, "step": 121832 }, { "epoch": 0.76, "learning_rate": 4.181931031601276e-05, "loss": 2.2345, "step": 121840 }, { "epoch": 0.76, "learning_rate": 4.1813692803972124e-05, "loss": 2.234, "step": 121848 }, { "epoch": 0.76, "learning_rate": 4.180807574404515e-05, "loss": 2.226, "step": 121856 }, { "epoch": 0.76, "learning_rate": 4.1802459136371443e-05, "loss": 2.2346, "step": 121864 }, { "epoch": 0.76, "learning_rate": 4.179684298109064e-05, "loss": 2.2369, "step": 121872 }, { "epoch": 0.76, "learning_rate": 4.1791227278342366e-05, "loss": 2.2328, "step": 121880 }, { "epoch": 0.76, "learning_rate": 4.178561202826623e-05, "loss": 2.245, "step": 121888 }, { "epoch": 0.76, "learning_rate": 4.177999723100181e-05, "loss": 2.2469, "step": 121896 }, { "epoch": 0.76, "learning_rate": 4.1774382886688714e-05, "loss": 2.2212, "step": 121904 }, { "epoch": 0.76, "learning_rate": 4.1768768995466504e-05, "loss": 2.235, "step": 121912 }, { "epoch": 0.76, "learning_rate": 4.176315555747473e-05, "loss": 2.2282, "step": 121920 }, { "epoch": 0.76, "learning_rate": 4.175754257285297e-05, "loss": 2.2592, "step": 121928 }, { "epoch": 0.76, "learning_rate": 4.175193004174075e-05, "loss": 2.2463, "step": 121936 }, { "epoch": 0.76, "learning_rate": 4.174631796427759e-05, "loss": 2.2395, "step": 121944 }, { "epoch": 0.76, "learning_rate": 4.174070634060301e-05, "loss": 2.2552, "step": 121952 }, { "epoch": 0.76, "learning_rate": 4.1735095170856506e-05, "loss": 2.2057, "step": 121960 }, { "epoch": 0.76, "learning_rate": 4.172948445517763e-05, "loss": 2.2506, "step": 121968 }, { "epoch": 0.76, "learning_rate": 4.1723874193705774e-05, "loss": 2.2627, "step": 121976 }, { "epoch": 0.76, "learning_rate": 4.171826438658046e-05, "loss": 2.2533, "step": 121984 }, { "epoch": 0.76, "learning_rate": 4.171265503394118e-05, "loss": 2.2254, "step": 121992 }, { "epoch": 0.76, "learning_rate": 4.170704613592732e-05, "loss": 2.2503, "step": 122000 }, { "epoch": 0.76, "learning_rate": 4.170143769267836e-05, "loss": 2.2346, "step": 122008 }, { "epoch": 0.76, "learning_rate": 4.169582970433371e-05, "loss": 2.2175, "step": 122016 }, { "epoch": 0.76, "learning_rate": 4.169022217103276e-05, "loss": 2.2408, "step": 122024 }, { "epoch": 0.76, "learning_rate": 4.168461509291497e-05, "loss": 2.2507, "step": 122032 }, { "epoch": 0.76, "learning_rate": 4.167900847011969e-05, "loss": 2.2369, "step": 122040 }, { "epoch": 0.76, "learning_rate": 4.1673402302786325e-05, "loss": 2.2449, "step": 122048 }, { "epoch": 0.76, "learning_rate": 4.1667796591054234e-05, "loss": 2.2532, "step": 122056 }, { "epoch": 0.76, "learning_rate": 4.1662191335062765e-05, "loss": 2.2404, "step": 122064 }, { "epoch": 0.76, "learning_rate": 4.1656586534951287e-05, "loss": 2.2463, "step": 122072 }, { "epoch": 0.76, "learning_rate": 4.165098219085913e-05, "loss": 2.2463, "step": 122080 }, { "epoch": 0.76, "learning_rate": 4.16453783029256e-05, "loss": 2.2362, "step": 122088 }, { "epoch": 0.76, "learning_rate": 4.1639774871290036e-05, "loss": 2.2386, "step": 122096 }, { "epoch": 0.76, "learning_rate": 4.1634171896091736e-05, "loss": 2.2457, "step": 122104 }, { "epoch": 0.76, "learning_rate": 4.162856937746996e-05, "loss": 2.2276, "step": 122112 }, { "epoch": 0.76, "learning_rate": 4.162296731556403e-05, "loss": 2.2511, "step": 122120 }, { "epoch": 0.76, "learning_rate": 4.161736571051319e-05, "loss": 2.2544, "step": 122128 }, { "epoch": 0.76, "learning_rate": 4.1611764562456686e-05, "loss": 2.229, "step": 122136 }, { "epoch": 0.76, "learning_rate": 4.1606163871533796e-05, "loss": 2.2368, "step": 122144 }, { "epoch": 0.76, "learning_rate": 4.1600563637883736e-05, "loss": 2.2302, "step": 122152 }, { "epoch": 0.76, "learning_rate": 4.159496386164573e-05, "loss": 2.2376, "step": 122160 }, { "epoch": 0.76, "learning_rate": 4.158936454295897e-05, "loss": 2.2391, "step": 122168 }, { "epoch": 0.76, "learning_rate": 4.158376568196267e-05, "loss": 2.2528, "step": 122176 }, { "epoch": 0.76, "learning_rate": 4.157816727879606e-05, "loss": 2.2337, "step": 122184 }, { "epoch": 0.76, "learning_rate": 4.157256933359824e-05, "loss": 2.239, "step": 122192 }, { "epoch": 0.76, "learning_rate": 4.1566971846508415e-05, "loss": 2.2482, "step": 122200 }, { "epoch": 0.76, "learning_rate": 4.156137481766578e-05, "loss": 2.246, "step": 122208 }, { "epoch": 0.76, "learning_rate": 4.155577824720939e-05, "loss": 2.2281, "step": 122216 }, { "epoch": 0.76, "learning_rate": 4.1550182135278444e-05, "loss": 2.2354, "step": 122224 }, { "epoch": 0.76, "learning_rate": 4.1544586482012044e-05, "loss": 2.2471, "step": 122232 }, { "epoch": 0.76, "learning_rate": 4.153899128754927e-05, "loss": 2.2429, "step": 122240 }, { "epoch": 0.76, "learning_rate": 4.153339655202926e-05, "loss": 2.2327, "step": 122248 }, { "epoch": 0.76, "learning_rate": 4.152780227559108e-05, "loss": 2.2298, "step": 122256 }, { "epoch": 0.76, "learning_rate": 4.152220845837381e-05, "loss": 2.2432, "step": 122264 }, { "epoch": 0.76, "learning_rate": 4.151661510051652e-05, "loss": 2.2305, "step": 122272 }, { "epoch": 0.76, "learning_rate": 4.151102220215823e-05, "loss": 2.2426, "step": 122280 }, { "epoch": 0.76, "learning_rate": 4.150542976343802e-05, "loss": 2.2307, "step": 122288 }, { "epoch": 0.76, "learning_rate": 4.149983778449491e-05, "loss": 2.2449, "step": 122296 }, { "epoch": 0.76, "learning_rate": 4.149424626546788e-05, "loss": 2.2442, "step": 122304 }, { "epoch": 0.76, "learning_rate": 4.1488655206495985e-05, "loss": 2.2303, "step": 122312 }, { "epoch": 0.76, "learning_rate": 4.1483064607718205e-05, "loss": 2.2339, "step": 122320 }, { "epoch": 0.76, "learning_rate": 4.147747446927349e-05, "loss": 2.2283, "step": 122328 }, { "epoch": 0.76, "learning_rate": 4.1471884791300864e-05, "loss": 2.236, "step": 122336 }, { "epoch": 0.76, "learning_rate": 4.146629557393925e-05, "loss": 2.2575, "step": 122344 }, { "epoch": 0.76, "learning_rate": 4.1460706817327594e-05, "loss": 2.2457, "step": 122352 }, { "epoch": 0.76, "learning_rate": 4.1455118521604866e-05, "loss": 2.225, "step": 122360 }, { "epoch": 0.76, "learning_rate": 4.144953068690997e-05, "loss": 2.2405, "step": 122368 }, { "epoch": 0.76, "learning_rate": 4.1443943313381823e-05, "loss": 2.2378, "step": 122376 }, { "epoch": 0.76, "learning_rate": 4.1438356401159316e-05, "loss": 2.2292, "step": 122384 }, { "epoch": 0.76, "learning_rate": 4.1432769950381344e-05, "loss": 2.2218, "step": 122392 }, { "epoch": 0.77, "learning_rate": 4.1427183961186834e-05, "loss": 2.2282, "step": 122400 }, { "epoch": 0.77, "learning_rate": 4.142159843371458e-05, "loss": 2.2281, "step": 122408 }, { "epoch": 0.77, "learning_rate": 4.1416013368103483e-05, "loss": 2.2527, "step": 122416 }, { "epoch": 0.77, "learning_rate": 4.141042876449239e-05, "loss": 2.2338, "step": 122424 }, { "epoch": 0.77, "learning_rate": 4.1404844623020096e-05, "loss": 2.2343, "step": 122432 }, { "epoch": 0.77, "learning_rate": 4.139926094382547e-05, "loss": 2.2111, "step": 122440 }, { "epoch": 0.77, "learning_rate": 4.1393677727047295e-05, "loss": 2.2446, "step": 122448 }, { "epoch": 0.77, "learning_rate": 4.138809497282439e-05, "loss": 2.2448, "step": 122456 }, { "epoch": 0.77, "learning_rate": 4.1382512681295534e-05, "loss": 2.2264, "step": 122464 }, { "epoch": 0.77, "learning_rate": 4.1376930852599474e-05, "loss": 2.2328, "step": 122472 }, { "epoch": 0.77, "learning_rate": 4.1371349486875035e-05, "loss": 2.2516, "step": 122480 }, { "epoch": 0.77, "learning_rate": 4.1365768584260934e-05, "loss": 2.241, "step": 122488 }, { "epoch": 0.77, "learning_rate": 4.136018814489589e-05, "loss": 2.2281, "step": 122496 }, { "epoch": 0.77, "learning_rate": 4.1354608168918686e-05, "loss": 2.2124, "step": 122504 }, { "epoch": 0.77, "learning_rate": 4.1349028656468013e-05, "loss": 2.2379, "step": 122512 }, { "epoch": 0.77, "learning_rate": 4.134344960768257e-05, "loss": 2.2491, "step": 122520 }, { "epoch": 0.77, "learning_rate": 4.133787102270107e-05, "loss": 2.2368, "step": 122528 }, { "epoch": 0.77, "learning_rate": 4.133229290166219e-05, "loss": 2.2341, "step": 122536 }, { "epoch": 0.77, "learning_rate": 4.132671524470459e-05, "loss": 2.2224, "step": 122544 }, { "epoch": 0.77, "learning_rate": 4.132113805196696e-05, "loss": 2.2247, "step": 122552 }, { "epoch": 0.77, "learning_rate": 4.131556132358794e-05, "loss": 2.2351, "step": 122560 }, { "epoch": 0.77, "learning_rate": 4.1309985059706134e-05, "loss": 2.2219, "step": 122568 }, { "epoch": 0.77, "learning_rate": 4.130440926046022e-05, "loss": 2.2503, "step": 122576 }, { "epoch": 0.77, "learning_rate": 4.129883392598879e-05, "loss": 2.22, "step": 122584 }, { "epoch": 0.77, "learning_rate": 4.129325905643045e-05, "loss": 2.2228, "step": 122592 }, { "epoch": 0.77, "learning_rate": 4.1287684651923764e-05, "loss": 2.2316, "step": 122600 }, { "epoch": 0.77, "learning_rate": 4.1282110712607344e-05, "loss": 2.2315, "step": 122608 }, { "epoch": 0.77, "learning_rate": 4.127653723861977e-05, "loss": 2.229, "step": 122616 }, { "epoch": 0.77, "learning_rate": 4.127096423009956e-05, "loss": 2.2566, "step": 122624 }, { "epoch": 0.77, "learning_rate": 4.1265391687185296e-05, "loss": 2.2266, "step": 122632 }, { "epoch": 0.77, "learning_rate": 4.1259819610015496e-05, "loss": 2.2559, "step": 122640 }, { "epoch": 0.77, "learning_rate": 4.1254247998728665e-05, "loss": 2.2341, "step": 122648 }, { "epoch": 0.77, "learning_rate": 4.1248676853463355e-05, "loss": 2.2454, "step": 122656 }, { "epoch": 0.77, "learning_rate": 4.124310617435802e-05, "loss": 2.2303, "step": 122664 }, { "epoch": 0.77, "learning_rate": 4.1237535961551194e-05, "loss": 2.2297, "step": 122672 }, { "epoch": 0.77, "learning_rate": 4.1231966215181315e-05, "loss": 2.2327, "step": 122680 }, { "epoch": 0.77, "learning_rate": 4.122639693538686e-05, "loss": 2.2267, "step": 122688 }, { "epoch": 0.77, "learning_rate": 4.1220828122306286e-05, "loss": 2.2388, "step": 122696 }, { "epoch": 0.77, "learning_rate": 4.121525977607804e-05, "loss": 2.2367, "step": 122704 }, { "epoch": 0.77, "learning_rate": 4.1209691896840526e-05, "loss": 2.2268, "step": 122712 }, { "epoch": 0.77, "learning_rate": 4.1204124484732195e-05, "loss": 2.2479, "step": 122720 }, { "epoch": 0.77, "learning_rate": 4.119855753989144e-05, "loss": 2.2347, "step": 122728 }, { "epoch": 0.77, "learning_rate": 4.1192991062456644e-05, "loss": 2.233, "step": 122736 }, { "epoch": 0.77, "learning_rate": 4.118742505256621e-05, "loss": 2.2379, "step": 122744 }, { "epoch": 0.77, "learning_rate": 4.1181859510358493e-05, "loss": 2.236, "step": 122752 }, { "epoch": 0.77, "learning_rate": 4.1176294435971854e-05, "loss": 2.2169, "step": 122760 }, { "epoch": 0.77, "learning_rate": 4.1170729829544666e-05, "loss": 2.2362, "step": 122768 }, { "epoch": 0.77, "learning_rate": 4.1165165691215234e-05, "loss": 2.2289, "step": 122776 }, { "epoch": 0.77, "learning_rate": 4.11596020211219e-05, "loss": 2.2343, "step": 122784 }, { "epoch": 0.77, "learning_rate": 4.115403881940296e-05, "loss": 2.2336, "step": 122792 }, { "epoch": 0.77, "learning_rate": 4.114847608619674e-05, "loss": 2.2465, "step": 122800 }, { "epoch": 0.77, "learning_rate": 4.114291382164153e-05, "loss": 2.2352, "step": 122808 }, { "epoch": 0.77, "learning_rate": 4.113735202587558e-05, "loss": 2.2277, "step": 122816 }, { "epoch": 0.77, "learning_rate": 4.113179069903717e-05, "loss": 2.2431, "step": 122824 }, { "epoch": 0.77, "learning_rate": 4.11262298412646e-05, "loss": 2.2383, "step": 122832 }, { "epoch": 0.77, "learning_rate": 4.1120669452696036e-05, "loss": 2.2315, "step": 122840 }, { "epoch": 0.77, "learning_rate": 4.111510953346976e-05, "loss": 2.228, "step": 122848 }, { "epoch": 0.77, "learning_rate": 4.110955008372399e-05, "loss": 2.2337, "step": 122856 }, { "epoch": 0.77, "learning_rate": 4.11039911035969e-05, "loss": 2.2431, "step": 122864 }, { "epoch": 0.77, "learning_rate": 4.109843259322673e-05, "loss": 2.2247, "step": 122872 }, { "epoch": 0.77, "learning_rate": 4.1092874552751634e-05, "loss": 2.2262, "step": 122880 }, { "epoch": 0.77, "learning_rate": 4.108731698230981e-05, "loss": 2.2399, "step": 122888 }, { "epoch": 0.77, "learning_rate": 4.108175988203941e-05, "loss": 2.2306, "step": 122896 }, { "epoch": 0.77, "learning_rate": 4.1076203252078557e-05, "loss": 2.2304, "step": 122904 }, { "epoch": 0.77, "learning_rate": 4.107064709256544e-05, "loss": 2.2369, "step": 122912 }, { "epoch": 0.77, "learning_rate": 4.106509140363815e-05, "loss": 2.257, "step": 122920 }, { "epoch": 0.77, "learning_rate": 4.105953618543481e-05, "loss": 2.2479, "step": 122928 }, { "epoch": 0.77, "learning_rate": 4.1053981438093536e-05, "loss": 2.2414, "step": 122936 }, { "epoch": 0.77, "learning_rate": 4.1048427161752405e-05, "loss": 2.2342, "step": 122944 }, { "epoch": 0.77, "learning_rate": 4.1042873356549486e-05, "loss": 2.2446, "step": 122952 }, { "epoch": 0.77, "learning_rate": 4.1037320022622884e-05, "loss": 2.2489, "step": 122960 }, { "epoch": 0.77, "learning_rate": 4.103176716011063e-05, "loss": 2.2391, "step": 122968 }, { "epoch": 0.77, "learning_rate": 4.102621476915076e-05, "loss": 2.2279, "step": 122976 }, { "epoch": 0.77, "learning_rate": 4.102066284988133e-05, "loss": 2.2431, "step": 122984 }, { "epoch": 0.77, "learning_rate": 4.1015111402440346e-05, "loss": 2.2276, "step": 122992 }, { "epoch": 0.77, "learning_rate": 4.1009560426965834e-05, "loss": 2.2324, "step": 123000 }, { "epoch": 0.77, "learning_rate": 4.100400992359576e-05, "loss": 2.236, "step": 123008 }, { "epoch": 0.77, "learning_rate": 4.099845989246813e-05, "loss": 2.2307, "step": 123016 }, { "epoch": 0.77, "learning_rate": 4.099291033372096e-05, "loss": 2.2542, "step": 123024 }, { "epoch": 0.77, "learning_rate": 4.098736124749213e-05, "loss": 2.2397, "step": 123032 }, { "epoch": 0.77, "learning_rate": 4.098181263391963e-05, "loss": 2.2219, "step": 123040 }, { "epoch": 0.77, "learning_rate": 4.0976264493141434e-05, "loss": 2.251, "step": 123048 }, { "epoch": 0.77, "learning_rate": 4.097071682529541e-05, "loss": 2.2532, "step": 123056 }, { "epoch": 0.77, "learning_rate": 4.0965169630519516e-05, "loss": 2.2298, "step": 123064 }, { "epoch": 0.77, "learning_rate": 4.0959622908951645e-05, "loss": 2.2551, "step": 123072 }, { "epoch": 0.77, "learning_rate": 4.095407666072966e-05, "loss": 2.231, "step": 123080 }, { "epoch": 0.77, "learning_rate": 4.094853088599149e-05, "loss": 2.2367, "step": 123088 }, { "epoch": 0.77, "learning_rate": 4.094298558487496e-05, "loss": 2.2474, "step": 123096 }, { "epoch": 0.77, "learning_rate": 4.0937440757517965e-05, "loss": 2.2339, "step": 123104 }, { "epoch": 0.77, "learning_rate": 4.093189640405832e-05, "loss": 2.2384, "step": 123112 }, { "epoch": 0.77, "learning_rate": 4.092635252463387e-05, "loss": 2.2425, "step": 123120 }, { "epoch": 0.77, "learning_rate": 4.0920809119382444e-05, "loss": 2.2447, "step": 123128 }, { "epoch": 0.77, "learning_rate": 4.091526618844185e-05, "loss": 2.2433, "step": 123136 }, { "epoch": 0.77, "learning_rate": 4.0909723731949856e-05, "loss": 2.241, "step": 123144 }, { "epoch": 0.77, "learning_rate": 4.090418175004429e-05, "loss": 2.2334, "step": 123152 }, { "epoch": 0.77, "learning_rate": 4.089864024286291e-05, "loss": 2.2409, "step": 123160 }, { "epoch": 0.77, "learning_rate": 4.089309921054346e-05, "loss": 2.2269, "step": 123168 }, { "epoch": 0.77, "learning_rate": 4.088755865322372e-05, "loss": 2.2285, "step": 123176 }, { "epoch": 0.77, "learning_rate": 4.0882018571041426e-05, "loss": 2.2407, "step": 123184 }, { "epoch": 0.77, "learning_rate": 4.087647896413427e-05, "loss": 2.2331, "step": 123192 }, { "epoch": 0.77, "learning_rate": 4.087093983264001e-05, "loss": 2.2477, "step": 123200 }, { "epoch": 0.77, "learning_rate": 4.086540117669633e-05, "loss": 2.2523, "step": 123208 }, { "epoch": 0.77, "learning_rate": 4.0859862996440934e-05, "loss": 2.2208, "step": 123216 }, { "epoch": 0.77, "learning_rate": 4.0854325292011466e-05, "loss": 2.2256, "step": 123224 }, { "epoch": 0.77, "learning_rate": 4.084878806354562e-05, "loss": 2.2279, "step": 123232 }, { "epoch": 0.77, "learning_rate": 4.084325131118109e-05, "loss": 2.2478, "step": 123240 }, { "epoch": 0.77, "learning_rate": 4.083771503505544e-05, "loss": 2.2519, "step": 123248 }, { "epoch": 0.77, "learning_rate": 4.083217923530635e-05, "loss": 2.2269, "step": 123256 }, { "epoch": 0.77, "learning_rate": 4.082664391207147e-05, "loss": 2.2449, "step": 123264 }, { "epoch": 0.77, "learning_rate": 4.082110906548833e-05, "loss": 2.2325, "step": 123272 }, { "epoch": 0.77, "learning_rate": 4.08155746956946e-05, "loss": 2.2393, "step": 123280 }, { "epoch": 0.77, "learning_rate": 4.081004080282783e-05, "loss": 2.2345, "step": 123288 }, { "epoch": 0.77, "learning_rate": 4.080450738702558e-05, "loss": 2.2386, "step": 123296 }, { "epoch": 0.77, "learning_rate": 4.0798974448425445e-05, "loss": 2.2444, "step": 123304 }, { "epoch": 0.77, "learning_rate": 4.079344198716495e-05, "loss": 2.2401, "step": 123312 }, { "epoch": 0.77, "learning_rate": 4.078791000338165e-05, "loss": 2.2385, "step": 123320 }, { "epoch": 0.77, "learning_rate": 4.078237849721307e-05, "loss": 2.2349, "step": 123328 }, { "epoch": 0.77, "learning_rate": 4.07768474687967e-05, "loss": 2.245, "step": 123336 }, { "epoch": 0.77, "learning_rate": 4.0771316918270076e-05, "loss": 2.2479, "step": 123344 }, { "epoch": 0.77, "learning_rate": 4.076578684577066e-05, "loss": 2.2291, "step": 123352 }, { "epoch": 0.77, "learning_rate": 4.076025725143594e-05, "loss": 2.2398, "step": 123360 }, { "epoch": 0.77, "learning_rate": 4.0754728135403395e-05, "loss": 2.2468, "step": 123368 }, { "epoch": 0.77, "learning_rate": 4.074919949781046e-05, "loss": 2.2317, "step": 123376 }, { "epoch": 0.77, "learning_rate": 4.074367133879457e-05, "loss": 2.2227, "step": 123384 }, { "epoch": 0.77, "learning_rate": 4.07381436584932e-05, "loss": 2.2427, "step": 123392 }, { "epoch": 0.77, "learning_rate": 4.073261645704373e-05, "loss": 2.2499, "step": 123400 }, { "epoch": 0.77, "learning_rate": 4.0727089734583565e-05, "loss": 2.2374, "step": 123408 }, { "epoch": 0.77, "learning_rate": 4.0721563491250126e-05, "loss": 2.2336, "step": 123416 }, { "epoch": 0.77, "learning_rate": 4.0716037727180776e-05, "loss": 2.2402, "step": 123424 }, { "epoch": 0.77, "learning_rate": 4.071051244251289e-05, "loss": 2.2616, "step": 123432 }, { "epoch": 0.77, "learning_rate": 4.0704987637383824e-05, "loss": 2.238, "step": 123440 }, { "epoch": 0.77, "learning_rate": 4.069946331193093e-05, "loss": 2.2394, "step": 123448 }, { "epoch": 0.77, "learning_rate": 4.069393946629156e-05, "loss": 2.2257, "step": 123456 }, { "epoch": 0.77, "learning_rate": 4.0688416100603e-05, "loss": 2.2353, "step": 123464 }, { "epoch": 0.77, "learning_rate": 4.068289321500261e-05, "loss": 2.2324, "step": 123472 }, { "epoch": 0.77, "learning_rate": 4.067737080962764e-05, "loss": 2.2334, "step": 123480 }, { "epoch": 0.77, "learning_rate": 4.0671848884615396e-05, "loss": 2.22, "step": 123488 }, { "epoch": 0.77, "learning_rate": 4.066632744010317e-05, "loss": 2.2394, "step": 123496 }, { "epoch": 0.77, "learning_rate": 4.06608064762282e-05, "loss": 2.2184, "step": 123504 }, { "epoch": 0.77, "learning_rate": 4.065528599312777e-05, "loss": 2.2401, "step": 123512 }, { "epoch": 0.77, "learning_rate": 4.064976599093909e-05, "loss": 2.2171, "step": 123520 }, { "epoch": 0.77, "learning_rate": 4.064424646979939e-05, "loss": 2.2376, "step": 123528 }, { "epoch": 0.77, "learning_rate": 4.0638727429845905e-05, "loss": 2.2176, "step": 123536 }, { "epoch": 0.77, "learning_rate": 4.063320887121584e-05, "loss": 2.229, "step": 123544 }, { "epoch": 0.77, "learning_rate": 4.0627690794046344e-05, "loss": 2.2297, "step": 123552 }, { "epoch": 0.77, "learning_rate": 4.062217319847466e-05, "loss": 2.2245, "step": 123560 }, { "epoch": 0.77, "learning_rate": 4.061665608463792e-05, "loss": 2.2233, "step": 123568 }, { "epoch": 0.77, "learning_rate": 4.061113945267325e-05, "loss": 2.2394, "step": 123576 }, { "epoch": 0.77, "learning_rate": 4.0605623302717865e-05, "loss": 2.2398, "step": 123584 }, { "epoch": 0.77, "learning_rate": 4.060010763490885e-05, "loss": 2.2284, "step": 123592 }, { "epoch": 0.77, "learning_rate": 4.0594592449383326e-05, "loss": 2.2365, "step": 123600 }, { "epoch": 0.77, "learning_rate": 4.058907774627842e-05, "loss": 2.2306, "step": 123608 }, { "epoch": 0.77, "learning_rate": 4.0583563525731234e-05, "loss": 2.2292, "step": 123616 }, { "epoch": 0.77, "learning_rate": 4.057804978787883e-05, "loss": 2.2133, "step": 123624 }, { "epoch": 0.77, "learning_rate": 4.0572536532858266e-05, "loss": 2.2447, "step": 123632 }, { "epoch": 0.77, "learning_rate": 4.056702376080664e-05, "loss": 2.2326, "step": 123640 }, { "epoch": 0.77, "learning_rate": 4.056151147186099e-05, "loss": 2.2498, "step": 123648 }, { "epoch": 0.77, "learning_rate": 4.055599966615833e-05, "loss": 2.2168, "step": 123656 }, { "epoch": 0.77, "learning_rate": 4.055048834383569e-05, "loss": 2.2289, "step": 123664 }, { "epoch": 0.77, "learning_rate": 4.0544977505030136e-05, "loss": 2.2322, "step": 123672 }, { "epoch": 0.77, "learning_rate": 4.053946714987859e-05, "loss": 2.2432, "step": 123680 }, { "epoch": 0.77, "learning_rate": 4.053395727851808e-05, "loss": 2.2314, "step": 123688 }, { "epoch": 0.77, "learning_rate": 4.052844789108558e-05, "loss": 2.235, "step": 123696 }, { "epoch": 0.77, "learning_rate": 4.052293898771804e-05, "loss": 2.2287, "step": 123704 }, { "epoch": 0.77, "learning_rate": 4.0517430568552436e-05, "loss": 2.2323, "step": 123712 }, { "epoch": 0.77, "learning_rate": 4.051192263372567e-05, "loss": 2.2382, "step": 123720 }, { "epoch": 0.77, "learning_rate": 4.050641518337472e-05, "loss": 2.2235, "step": 123728 }, { "epoch": 0.77, "learning_rate": 4.050090821763647e-05, "loss": 2.2241, "step": 123736 }, { "epoch": 0.77, "learning_rate": 4.049540173664781e-05, "loss": 2.2303, "step": 123744 }, { "epoch": 0.77, "learning_rate": 4.048989574054567e-05, "loss": 2.2282, "step": 123752 }, { "epoch": 0.77, "learning_rate": 4.0484390229466925e-05, "loss": 2.2314, "step": 123760 }, { "epoch": 0.77, "learning_rate": 4.04788852035484e-05, "loss": 2.2324, "step": 123768 }, { "epoch": 0.77, "learning_rate": 4.0473380662927e-05, "loss": 2.2292, "step": 123776 }, { "epoch": 0.77, "learning_rate": 4.046787660773954e-05, "loss": 2.2287, "step": 123784 }, { "epoch": 0.77, "learning_rate": 4.0462373038122846e-05, "loss": 2.2247, "step": 123792 }, { "epoch": 0.77, "learning_rate": 4.045686995421377e-05, "loss": 2.2315, "step": 123800 }, { "epoch": 0.77, "learning_rate": 4.04513673561491e-05, "loss": 2.2152, "step": 123808 }, { "epoch": 0.77, "learning_rate": 4.04458652440656e-05, "loss": 2.22, "step": 123816 }, { "epoch": 0.77, "learning_rate": 4.044036361810011e-05, "loss": 2.2171, "step": 123824 }, { "epoch": 0.77, "learning_rate": 4.043486247838938e-05, "loss": 2.2292, "step": 123832 }, { "epoch": 0.77, "learning_rate": 4.042936182507016e-05, "loss": 2.2336, "step": 123840 }, { "epoch": 0.77, "learning_rate": 4.042386165827918e-05, "loss": 2.2426, "step": 123848 }, { "epoch": 0.77, "learning_rate": 4.0418361978153206e-05, "loss": 2.2272, "step": 123856 }, { "epoch": 0.77, "learning_rate": 4.041286278482898e-05, "loss": 2.2471, "step": 123864 }, { "epoch": 0.77, "learning_rate": 4.040736407844314e-05, "loss": 2.2336, "step": 123872 }, { "epoch": 0.77, "learning_rate": 4.0401865859132435e-05, "loss": 2.2225, "step": 123880 }, { "epoch": 0.77, "learning_rate": 4.039636812703358e-05, "loss": 2.2559, "step": 123888 }, { "epoch": 0.77, "learning_rate": 4.0390870882283177e-05, "loss": 2.2306, "step": 123896 }, { "epoch": 0.77, "learning_rate": 4.038537412501794e-05, "loss": 2.2272, "step": 123904 }, { "epoch": 0.77, "learning_rate": 4.037987785537451e-05, "loss": 2.2466, "step": 123912 }, { "epoch": 0.77, "learning_rate": 4.0374382073489495e-05, "loss": 2.2509, "step": 123920 }, { "epoch": 0.77, "learning_rate": 4.0368886779499546e-05, "loss": 2.2284, "step": 123928 }, { "epoch": 0.77, "learning_rate": 4.0363391973541285e-05, "loss": 2.2243, "step": 123936 }, { "epoch": 0.77, "learning_rate": 4.03578976557513e-05, "loss": 2.233, "step": 123944 }, { "epoch": 0.77, "learning_rate": 4.035240382626619e-05, "loss": 2.2183, "step": 123952 }, { "epoch": 0.77, "learning_rate": 4.03469104852225e-05, "loss": 2.2453, "step": 123960 }, { "epoch": 0.77, "learning_rate": 4.0341417632756854e-05, "loss": 2.2506, "step": 123968 }, { "epoch": 0.77, "learning_rate": 4.0335925269005754e-05, "loss": 2.2343, "step": 123976 }, { "epoch": 0.77, "learning_rate": 4.033043339410575e-05, "loss": 2.2323, "step": 123984 }, { "epoch": 0.77, "learning_rate": 4.032494200819341e-05, "loss": 2.2395, "step": 123992 }, { "epoch": 0.78, "learning_rate": 4.031945111140518e-05, "loss": 2.2427, "step": 124000 }, { "epoch": 0.78, "learning_rate": 4.0313960703877614e-05, "loss": 2.2469, "step": 124008 }, { "epoch": 0.78, "learning_rate": 4.0308470785747207e-05, "loss": 2.2619, "step": 124016 }, { "epoch": 0.78, "learning_rate": 4.0302981357150424e-05, "loss": 2.2324, "step": 124024 }, { "epoch": 0.78, "learning_rate": 4.029749241822372e-05, "loss": 2.2361, "step": 124032 }, { "epoch": 0.78, "learning_rate": 4.0292003969103576e-05, "loss": 2.2181, "step": 124040 }, { "epoch": 0.78, "learning_rate": 4.028651600992643e-05, "loss": 2.239, "step": 124048 }, { "epoch": 0.78, "learning_rate": 4.0281028540828707e-05, "loss": 2.2327, "step": 124056 }, { "epoch": 0.78, "learning_rate": 4.0275541561946814e-05, "loss": 2.2314, "step": 124064 }, { "epoch": 0.78, "learning_rate": 4.0270055073417166e-05, "loss": 2.2437, "step": 124072 }, { "epoch": 0.78, "learning_rate": 4.026456907537619e-05, "loss": 2.2573, "step": 124080 }, { "epoch": 0.78, "learning_rate": 4.025908356796022e-05, "loss": 2.2264, "step": 124088 }, { "epoch": 0.78, "learning_rate": 4.0253598551305636e-05, "loss": 2.2418, "step": 124096 }, { "epoch": 0.78, "learning_rate": 4.024811402554884e-05, "loss": 2.2432, "step": 124104 }, { "epoch": 0.78, "learning_rate": 4.0242629990826134e-05, "loss": 2.2432, "step": 124112 }, { "epoch": 0.78, "learning_rate": 4.023714644727386e-05, "loss": 2.2255, "step": 124120 }, { "epoch": 0.78, "learning_rate": 4.0231663395028345e-05, "loss": 2.2374, "step": 124128 }, { "epoch": 0.78, "learning_rate": 4.022618083422588e-05, "loss": 2.2445, "step": 124136 }, { "epoch": 0.78, "learning_rate": 4.02206987650028e-05, "loss": 2.2254, "step": 124144 }, { "epoch": 0.78, "learning_rate": 4.0215217187495345e-05, "loss": 2.2248, "step": 124152 }, { "epoch": 0.78, "learning_rate": 4.020973610183983e-05, "loss": 2.2294, "step": 124160 }, { "epoch": 0.78, "learning_rate": 4.02042555081725e-05, "loss": 2.2495, "step": 124168 }, { "epoch": 0.78, "learning_rate": 4.0198775406629575e-05, "loss": 2.2379, "step": 124176 }, { "epoch": 0.78, "learning_rate": 4.0193295797347336e-05, "loss": 2.2443, "step": 124184 }, { "epoch": 0.78, "learning_rate": 4.018781668046198e-05, "loss": 2.2094, "step": 124192 }, { "epoch": 0.78, "learning_rate": 4.018233805610971e-05, "loss": 2.2578, "step": 124200 }, { "epoch": 0.78, "learning_rate": 4.017685992442676e-05, "loss": 2.225, "step": 124208 }, { "epoch": 0.78, "learning_rate": 4.017138228554929e-05, "loss": 2.2411, "step": 124216 }, { "epoch": 0.78, "learning_rate": 4.0165905139613474e-05, "loss": 2.2219, "step": 124224 }, { "epoch": 0.78, "learning_rate": 4.01604284867555e-05, "loss": 2.2235, "step": 124232 }, { "epoch": 0.78, "learning_rate": 4.0154952327111486e-05, "loss": 2.2157, "step": 124240 }, { "epoch": 0.78, "learning_rate": 4.014947666081758e-05, "loss": 2.2432, "step": 124248 }, { "epoch": 0.78, "learning_rate": 4.014400148800992e-05, "loss": 2.234, "step": 124256 }, { "epoch": 0.78, "learning_rate": 4.013852680882461e-05, "loss": 2.2436, "step": 124264 }, { "epoch": 0.78, "learning_rate": 4.013305262339775e-05, "loss": 2.2422, "step": 124272 }, { "epoch": 0.78, "learning_rate": 4.012757893186542e-05, "loss": 2.2462, "step": 124280 }, { "epoch": 0.78, "learning_rate": 4.012210573436371e-05, "loss": 2.2423, "step": 124288 }, { "epoch": 0.78, "learning_rate": 4.0116633031028706e-05, "loss": 2.2267, "step": 124296 }, { "epoch": 0.78, "learning_rate": 4.0111160821996416e-05, "loss": 2.2296, "step": 124304 }, { "epoch": 0.78, "learning_rate": 4.01056891074029e-05, "loss": 2.2221, "step": 124312 }, { "epoch": 0.78, "learning_rate": 4.010021788738419e-05, "loss": 2.2492, "step": 124320 }, { "epoch": 0.78, "learning_rate": 4.009474716207629e-05, "loss": 2.2333, "step": 124328 }, { "epoch": 0.78, "learning_rate": 4.0089276931615215e-05, "loss": 2.234, "step": 124336 }, { "epoch": 0.78, "learning_rate": 4.0083807196136953e-05, "loss": 2.2392, "step": 124344 }, { "epoch": 0.78, "learning_rate": 4.007833795577746e-05, "loss": 2.2155, "step": 124352 }, { "epoch": 0.78, "learning_rate": 4.0072869210672736e-05, "loss": 2.2347, "step": 124360 }, { "epoch": 0.78, "learning_rate": 4.006740096095871e-05, "loss": 2.2311, "step": 124368 }, { "epoch": 0.78, "learning_rate": 4.006193320677134e-05, "loss": 2.2335, "step": 124376 }, { "epoch": 0.78, "learning_rate": 4.005646594824655e-05, "loss": 2.2512, "step": 124384 }, { "epoch": 0.78, "learning_rate": 4.005099918552024e-05, "loss": 2.2398, "step": 124392 }, { "epoch": 0.78, "learning_rate": 4.0045532918728346e-05, "loss": 2.2206, "step": 124400 }, { "epoch": 0.78, "learning_rate": 4.0040067148006735e-05, "loss": 2.2333, "step": 124408 }, { "epoch": 0.78, "learning_rate": 4.003460187349128e-05, "loss": 2.2588, "step": 124416 }, { "epoch": 0.78, "learning_rate": 4.0029137095317885e-05, "loss": 2.2463, "step": 124424 }, { "epoch": 0.78, "learning_rate": 4.002367281362238e-05, "loss": 2.2298, "step": 124432 }, { "epoch": 0.78, "learning_rate": 4.00182090285406e-05, "loss": 2.2275, "step": 124440 }, { "epoch": 0.78, "learning_rate": 4.001274574020839e-05, "loss": 2.2241, "step": 124448 }, { "epoch": 0.78, "learning_rate": 4.0007282948761573e-05, "loss": 2.2312, "step": 124456 }, { "epoch": 0.78, "learning_rate": 4.000182065433592e-05, "loss": 2.245, "step": 124464 }, { "epoch": 0.78, "learning_rate": 3.999635885706727e-05, "loss": 2.2327, "step": 124472 }, { "epoch": 0.78, "learning_rate": 3.999089755709138e-05, "loss": 2.2398, "step": 124480 }, { "epoch": 0.78, "learning_rate": 3.998543675454403e-05, "loss": 2.2454, "step": 124488 }, { "epoch": 0.78, "learning_rate": 3.997997644956095e-05, "loss": 2.2379, "step": 124496 }, { "epoch": 0.78, "learning_rate": 3.997451664227789e-05, "loss": 2.2529, "step": 124504 }, { "epoch": 0.78, "learning_rate": 3.996905733283063e-05, "loss": 2.2184, "step": 124512 }, { "epoch": 0.78, "learning_rate": 3.996359852135483e-05, "loss": 2.2231, "step": 124520 }, { "epoch": 0.78, "learning_rate": 3.9958140207986225e-05, "loss": 2.2361, "step": 124528 }, { "epoch": 0.78, "learning_rate": 3.995268239286051e-05, "loss": 2.2423, "step": 124536 }, { "epoch": 0.78, "learning_rate": 3.994722507611334e-05, "loss": 2.236, "step": 124544 }, { "epoch": 0.78, "learning_rate": 3.9941768257880424e-05, "loss": 2.2325, "step": 124552 }, { "epoch": 0.78, "learning_rate": 3.9936311938297375e-05, "loss": 2.2346, "step": 124560 }, { "epoch": 0.78, "learning_rate": 3.993085611749989e-05, "loss": 2.2342, "step": 124568 }, { "epoch": 0.78, "learning_rate": 3.9925400795623566e-05, "loss": 2.2272, "step": 124576 }, { "epoch": 0.78, "learning_rate": 3.991994597280401e-05, "loss": 2.2387, "step": 124584 }, { "epoch": 0.78, "learning_rate": 3.991449164917688e-05, "loss": 2.2394, "step": 124592 }, { "epoch": 0.78, "learning_rate": 3.9909037824877725e-05, "loss": 2.2647, "step": 124600 }, { "epoch": 0.78, "learning_rate": 3.990358450004214e-05, "loss": 2.234, "step": 124608 }, { "epoch": 0.78, "learning_rate": 3.989813167480571e-05, "loss": 2.2404, "step": 124616 }, { "epoch": 0.78, "learning_rate": 3.989267934930399e-05, "loss": 2.2244, "step": 124624 }, { "epoch": 0.78, "learning_rate": 3.988722752367249e-05, "loss": 2.245, "step": 124632 }, { "epoch": 0.78, "learning_rate": 3.988177619804679e-05, "loss": 2.2337, "step": 124640 }, { "epoch": 0.78, "learning_rate": 3.987632537256239e-05, "loss": 2.2351, "step": 124648 }, { "epoch": 0.78, "learning_rate": 3.987087504735478e-05, "loss": 2.2364, "step": 124656 }, { "epoch": 0.78, "learning_rate": 3.98654252225595e-05, "loss": 2.2354, "step": 124664 }, { "epoch": 0.78, "learning_rate": 3.9859975898312e-05, "loss": 2.2265, "step": 124672 }, { "epoch": 0.78, "learning_rate": 3.985452707474777e-05, "loss": 2.2458, "step": 124680 }, { "epoch": 0.78, "learning_rate": 3.984907875200223e-05, "loss": 2.2368, "step": 124688 }, { "epoch": 0.78, "learning_rate": 3.984363093021086e-05, "loss": 2.2321, "step": 124696 }, { "epoch": 0.78, "learning_rate": 3.983818360950911e-05, "loss": 2.2471, "step": 124704 }, { "epoch": 0.78, "learning_rate": 3.983273679003235e-05, "loss": 2.2337, "step": 124712 }, { "epoch": 0.78, "learning_rate": 3.982729047191602e-05, "loss": 2.2402, "step": 124720 }, { "epoch": 0.78, "learning_rate": 3.982184465529554e-05, "loss": 2.2198, "step": 124728 }, { "epoch": 0.78, "learning_rate": 3.981639934030623e-05, "loss": 2.2275, "step": 124736 }, { "epoch": 0.78, "learning_rate": 3.981095452708352e-05, "loss": 2.2354, "step": 124744 }, { "epoch": 0.78, "learning_rate": 3.980551021576275e-05, "loss": 2.214, "step": 124752 }, { "epoch": 0.78, "learning_rate": 3.980006640647924e-05, "loss": 2.2215, "step": 124760 }, { "epoch": 0.78, "learning_rate": 3.979462309936836e-05, "loss": 2.2389, "step": 124768 }, { "epoch": 0.78, "learning_rate": 3.97891802945654e-05, "loss": 2.2317, "step": 124776 }, { "epoch": 0.78, "learning_rate": 3.97837379922057e-05, "loss": 2.245, "step": 124784 }, { "epoch": 0.78, "learning_rate": 3.977829619242455e-05, "loss": 2.2277, "step": 124792 }, { "epoch": 0.78, "learning_rate": 3.97728548953572e-05, "loss": 2.2316, "step": 124800 }, { "epoch": 0.78, "learning_rate": 3.9767414101138966e-05, "loss": 2.2406, "step": 124808 }, { "epoch": 0.78, "learning_rate": 3.976197380990509e-05, "loss": 2.2166, "step": 124816 }, { "epoch": 0.78, "learning_rate": 3.97565340217908e-05, "loss": 2.24, "step": 124824 }, { "epoch": 0.78, "learning_rate": 3.975109473693137e-05, "loss": 2.2296, "step": 124832 }, { "epoch": 0.78, "learning_rate": 3.974565595546197e-05, "loss": 2.2308, "step": 124840 }, { "epoch": 0.78, "learning_rate": 3.974021767751784e-05, "loss": 2.2496, "step": 124848 }, { "epoch": 0.78, "learning_rate": 3.973477990323418e-05, "loss": 2.2357, "step": 124856 }, { "epoch": 0.78, "learning_rate": 3.972934263274617e-05, "loss": 2.2213, "step": 124864 }, { "epoch": 0.78, "learning_rate": 3.972390586618896e-05, "loss": 2.2415, "step": 124872 }, { "epoch": 0.78, "learning_rate": 3.971846960369774e-05, "loss": 2.2514, "step": 124880 }, { "epoch": 0.78, "learning_rate": 3.971303384540764e-05, "loss": 2.2369, "step": 124888 }, { "epoch": 0.78, "learning_rate": 3.97075985914538e-05, "loss": 2.2278, "step": 124896 }, { "epoch": 0.78, "learning_rate": 3.9702163841971315e-05, "loss": 2.2198, "step": 124904 }, { "epoch": 0.78, "learning_rate": 3.969672959709532e-05, "loss": 2.226, "step": 124912 }, { "epoch": 0.78, "learning_rate": 3.969129585696092e-05, "loss": 2.2515, "step": 124920 }, { "epoch": 0.78, "learning_rate": 3.968586262170317e-05, "loss": 2.2411, "step": 124928 }, { "epoch": 0.78, "learning_rate": 3.968042989145715e-05, "loss": 2.2448, "step": 124936 }, { "epoch": 0.78, "learning_rate": 3.9674997666357954e-05, "loss": 2.239, "step": 124944 }, { "epoch": 0.78, "learning_rate": 3.966956594654056e-05, "loss": 2.2257, "step": 124952 }, { "epoch": 0.78, "learning_rate": 3.966413473214006e-05, "loss": 2.2414, "step": 124960 }, { "epoch": 0.78, "learning_rate": 3.965870402329145e-05, "loss": 2.2421, "step": 124968 }, { "epoch": 0.78, "learning_rate": 3.9653273820129725e-05, "loss": 2.23, "step": 124976 }, { "epoch": 0.78, "learning_rate": 3.964784412278991e-05, "loss": 2.2511, "step": 124984 }, { "epoch": 0.78, "learning_rate": 3.964241493140696e-05, "loss": 2.2355, "step": 124992 }, { "epoch": 0.78, "learning_rate": 3.963698624611587e-05, "loss": 2.237, "step": 125000 }, { "epoch": 0.78, "learning_rate": 3.963155806705159e-05, "loss": 2.221, "step": 125008 }, { "epoch": 0.78, "learning_rate": 3.962613039434905e-05, "loss": 2.2399, "step": 125016 }, { "epoch": 0.78, "learning_rate": 3.96207032281432e-05, "loss": 2.2356, "step": 125024 }, { "epoch": 0.78, "learning_rate": 3.961527656856896e-05, "loss": 2.2237, "step": 125032 }, { "epoch": 0.78, "learning_rate": 3.960985041576122e-05, "loss": 2.2388, "step": 125040 }, { "epoch": 0.78, "learning_rate": 3.960442476985489e-05, "loss": 2.2356, "step": 125048 }, { "epoch": 0.78, "learning_rate": 3.959899963098486e-05, "loss": 2.2352, "step": 125056 }, { "epoch": 0.78, "learning_rate": 3.959357499928597e-05, "loss": 2.231, "step": 125064 }, { "epoch": 0.78, "learning_rate": 3.958815087489311e-05, "loss": 2.2479, "step": 125072 }, { "epoch": 0.78, "learning_rate": 3.958272725794111e-05, "loss": 2.2404, "step": 125080 }, { "epoch": 0.78, "learning_rate": 3.9577304148564784e-05, "loss": 2.2217, "step": 125088 }, { "epoch": 0.78, "learning_rate": 3.957188154689898e-05, "loss": 2.2302, "step": 125096 }, { "epoch": 0.78, "learning_rate": 3.95664594530785e-05, "loss": 2.2383, "step": 125104 }, { "epoch": 0.78, "learning_rate": 3.956103786723813e-05, "loss": 2.2454, "step": 125112 }, { "epoch": 0.78, "learning_rate": 3.955561678951263e-05, "loss": 2.2599, "step": 125120 }, { "epoch": 0.78, "learning_rate": 3.955019622003679e-05, "loss": 2.2369, "step": 125128 }, { "epoch": 0.78, "learning_rate": 3.954477615894541e-05, "loss": 2.2226, "step": 125136 }, { "epoch": 0.78, "learning_rate": 3.953935660637315e-05, "loss": 2.2286, "step": 125144 }, { "epoch": 0.78, "learning_rate": 3.953393756245479e-05, "loss": 2.248, "step": 125152 }, { "epoch": 0.78, "learning_rate": 3.952851902732505e-05, "loss": 2.2334, "step": 125160 }, { "epoch": 0.78, "learning_rate": 3.95231010011186e-05, "loss": 2.2394, "step": 125168 }, { "epoch": 0.78, "learning_rate": 3.951768348397018e-05, "loss": 2.2295, "step": 125176 }, { "epoch": 0.78, "learning_rate": 3.951226647601444e-05, "loss": 2.2171, "step": 125184 }, { "epoch": 0.78, "learning_rate": 3.950684997738604e-05, "loss": 2.2353, "step": 125192 }, { "epoch": 0.78, "learning_rate": 3.950143398821966e-05, "loss": 2.2297, "step": 125200 }, { "epoch": 0.78, "learning_rate": 3.9496018508649924e-05, "loss": 2.2246, "step": 125208 }, { "epoch": 0.78, "learning_rate": 3.949060353881148e-05, "loss": 2.2501, "step": 125216 }, { "epoch": 0.78, "learning_rate": 3.9485189078838936e-05, "loss": 2.2284, "step": 125224 }, { "epoch": 0.78, "learning_rate": 3.947977512886687e-05, "loss": 2.234, "step": 125232 }, { "epoch": 0.78, "learning_rate": 3.947436168902992e-05, "loss": 2.2552, "step": 125240 }, { "epoch": 0.78, "learning_rate": 3.946894875946264e-05, "loss": 2.2373, "step": 125248 }, { "epoch": 0.78, "learning_rate": 3.946353634029958e-05, "loss": 2.2288, "step": 125256 }, { "epoch": 0.78, "learning_rate": 3.9458124431675325e-05, "loss": 2.2355, "step": 125264 }, { "epoch": 0.78, "learning_rate": 3.9452713033724405e-05, "loss": 2.2276, "step": 125272 }, { "epoch": 0.78, "learning_rate": 3.9447302146581325e-05, "loss": 2.2446, "step": 125280 }, { "epoch": 0.78, "learning_rate": 3.944189177038064e-05, "loss": 2.2434, "step": 125288 }, { "epoch": 0.78, "learning_rate": 3.943648190525683e-05, "loss": 2.2406, "step": 125296 }, { "epoch": 0.78, "learning_rate": 3.943107255134437e-05, "loss": 2.2352, "step": 125304 }, { "epoch": 0.78, "learning_rate": 3.9425663708777766e-05, "loss": 2.2321, "step": 125312 }, { "epoch": 0.78, "learning_rate": 3.942025537769147e-05, "loss": 2.24, "step": 125320 }, { "epoch": 0.78, "learning_rate": 3.941484755821994e-05, "loss": 2.2374, "step": 125328 }, { "epoch": 0.78, "learning_rate": 3.94094402504976e-05, "loss": 2.2294, "step": 125336 }, { "epoch": 0.78, "learning_rate": 3.940403345465888e-05, "loss": 2.2479, "step": 125344 }, { "epoch": 0.78, "learning_rate": 3.939862717083822e-05, "loss": 2.2276, "step": 125352 }, { "epoch": 0.78, "learning_rate": 3.939322139916998e-05, "loss": 2.2245, "step": 125360 }, { "epoch": 0.78, "learning_rate": 3.9387816139788585e-05, "loss": 2.2283, "step": 125368 }, { "epoch": 0.78, "learning_rate": 3.938241139282839e-05, "loss": 2.2287, "step": 125376 }, { "epoch": 0.78, "learning_rate": 3.937700715842374e-05, "loss": 2.2373, "step": 125384 }, { "epoch": 0.78, "learning_rate": 3.937160343670903e-05, "loss": 2.2419, "step": 125392 }, { "epoch": 0.78, "learning_rate": 3.936620022781855e-05, "loss": 2.2474, "step": 125400 }, { "epoch": 0.78, "learning_rate": 3.936079753188667e-05, "loss": 2.2495, "step": 125408 }, { "epoch": 0.78, "learning_rate": 3.9355395349047674e-05, "loss": 2.23, "step": 125416 }, { "epoch": 0.78, "learning_rate": 3.934999367943586e-05, "loss": 2.2438, "step": 125424 }, { "epoch": 0.78, "learning_rate": 3.934459252318552e-05, "loss": 2.2477, "step": 125432 }, { "epoch": 0.78, "learning_rate": 3.9339191880430934e-05, "loss": 2.2418, "step": 125440 }, { "epoch": 0.78, "learning_rate": 3.933379175130634e-05, "loss": 2.2414, "step": 125448 }, { "epoch": 0.78, "learning_rate": 3.932839213594602e-05, "loss": 2.224, "step": 125456 }, { "epoch": 0.78, "learning_rate": 3.932299303448419e-05, "loss": 2.2277, "step": 125464 }, { "epoch": 0.78, "learning_rate": 3.931759444705506e-05, "loss": 2.2237, "step": 125472 }, { "epoch": 0.78, "learning_rate": 3.931219637379286e-05, "loss": 2.2345, "step": 125480 }, { "epoch": 0.78, "learning_rate": 3.930679881483179e-05, "loss": 2.2304, "step": 125488 }, { "epoch": 0.78, "learning_rate": 3.9301401770306005e-05, "loss": 2.2391, "step": 125496 }, { "epoch": 0.78, "learning_rate": 3.929600524034971e-05, "loss": 2.2278, "step": 125504 }, { "epoch": 0.78, "learning_rate": 3.9290609225097045e-05, "loss": 2.2238, "step": 125512 }, { "epoch": 0.78, "learning_rate": 3.928521372468215e-05, "loss": 2.236, "step": 125520 }, { "epoch": 0.78, "learning_rate": 3.927981873923916e-05, "loss": 2.2324, "step": 125528 }, { "epoch": 0.78, "learning_rate": 3.927442426890222e-05, "loss": 2.2472, "step": 125536 }, { "epoch": 0.78, "learning_rate": 3.9269030313805414e-05, "loss": 2.2379, "step": 125544 }, { "epoch": 0.78, "learning_rate": 3.926363687408282e-05, "loss": 2.2239, "step": 125552 }, { "epoch": 0.78, "learning_rate": 3.925824394986855e-05, "loss": 2.2173, "step": 125560 }, { "epoch": 0.78, "learning_rate": 3.925285154129668e-05, "loss": 2.2298, "step": 125568 }, { "epoch": 0.78, "learning_rate": 3.9247459648501226e-05, "loss": 2.2409, "step": 125576 }, { "epoch": 0.78, "learning_rate": 3.924206827161627e-05, "loss": 2.236, "step": 125584 }, { "epoch": 0.78, "learning_rate": 3.923667741077582e-05, "loss": 2.2244, "step": 125592 }, { "epoch": 0.79, "learning_rate": 3.9231287066113886e-05, "loss": 2.228, "step": 125600 }, { "epoch": 0.79, "learning_rate": 3.922589723776451e-05, "loss": 2.2264, "step": 125608 }, { "epoch": 0.79, "learning_rate": 3.922050792586163e-05, "loss": 2.2416, "step": 125616 }, { "epoch": 0.79, "learning_rate": 3.921511913053928e-05, "loss": 2.2185, "step": 125624 }, { "epoch": 0.79, "learning_rate": 3.9209730851931393e-05, "loss": 2.2296, "step": 125632 }, { "epoch": 0.79, "learning_rate": 3.920434309017192e-05, "loss": 2.2238, "step": 125640 }, { "epoch": 0.79, "learning_rate": 3.9198955845394825e-05, "loss": 2.2285, "step": 125648 }, { "epoch": 0.79, "learning_rate": 3.919356911773402e-05, "loss": 2.2399, "step": 125656 }, { "epoch": 0.79, "learning_rate": 3.918818290732341e-05, "loss": 2.2309, "step": 125664 }, { "epoch": 0.79, "learning_rate": 3.918279721429693e-05, "loss": 2.2265, "step": 125672 }, { "epoch": 0.79, "learning_rate": 3.917741203878842e-05, "loss": 2.2405, "step": 125680 }, { "epoch": 0.79, "learning_rate": 3.917202738093179e-05, "loss": 2.2237, "step": 125688 }, { "epoch": 0.79, "learning_rate": 3.91666432408609e-05, "loss": 2.2308, "step": 125696 }, { "epoch": 0.79, "learning_rate": 3.916125961870961e-05, "loss": 2.2317, "step": 125704 }, { "epoch": 0.79, "learning_rate": 3.915587651461172e-05, "loss": 2.2457, "step": 125712 }, { "epoch": 0.79, "learning_rate": 3.915049392870109e-05, "loss": 2.2458, "step": 125720 }, { "epoch": 0.79, "learning_rate": 3.9145111861111525e-05, "loss": 2.2227, "step": 125728 }, { "epoch": 0.79, "learning_rate": 3.913973031197682e-05, "loss": 2.2119, "step": 125736 }, { "epoch": 0.79, "learning_rate": 3.9134349281430745e-05, "loss": 2.2379, "step": 125744 }, { "epoch": 0.79, "learning_rate": 3.9128968769607085e-05, "loss": 2.2311, "step": 125752 }, { "epoch": 0.79, "learning_rate": 3.912358877663964e-05, "loss": 2.2424, "step": 125760 }, { "epoch": 0.79, "learning_rate": 3.9118209302662076e-05, "loss": 2.244, "step": 125768 }, { "epoch": 0.79, "learning_rate": 3.9112830347808186e-05, "loss": 2.243, "step": 125776 }, { "epoch": 0.79, "learning_rate": 3.91074519122117e-05, "loss": 2.2556, "step": 125784 }, { "epoch": 0.79, "learning_rate": 3.9102073996006275e-05, "loss": 2.2335, "step": 125792 }, { "epoch": 0.79, "learning_rate": 3.909669659932565e-05, "loss": 2.2355, "step": 125800 }, { "epoch": 0.79, "learning_rate": 3.90913197223035e-05, "loss": 2.2453, "step": 125808 }, { "epoch": 0.79, "learning_rate": 3.9085943365073466e-05, "loss": 2.2391, "step": 125816 }, { "epoch": 0.79, "learning_rate": 3.908056752776924e-05, "loss": 2.2458, "step": 125824 }, { "epoch": 0.79, "learning_rate": 3.9075192210524435e-05, "loss": 2.2372, "step": 125832 }, { "epoch": 0.79, "learning_rate": 3.906981741347272e-05, "loss": 2.2318, "step": 125840 }, { "epoch": 0.79, "learning_rate": 3.906444313674769e-05, "loss": 2.2335, "step": 125848 }, { "epoch": 0.79, "learning_rate": 3.905906938048294e-05, "loss": 2.242, "step": 125856 }, { "epoch": 0.79, "learning_rate": 3.905369614481209e-05, "loss": 2.2259, "step": 125864 }, { "epoch": 0.79, "learning_rate": 3.90483234298687e-05, "loss": 2.2258, "step": 125872 }, { "epoch": 0.79, "learning_rate": 3.904295123578632e-05, "loss": 2.223, "step": 125880 }, { "epoch": 0.79, "learning_rate": 3.9037579562698566e-05, "loss": 2.2349, "step": 125888 }, { "epoch": 0.79, "learning_rate": 3.9032208410738904e-05, "loss": 2.2389, "step": 125896 }, { "epoch": 0.79, "learning_rate": 3.9026837780040886e-05, "loss": 2.2316, "step": 125904 }, { "epoch": 0.79, "learning_rate": 3.902146767073806e-05, "loss": 2.2432, "step": 125912 }, { "epoch": 0.79, "learning_rate": 3.901609808296389e-05, "loss": 2.225, "step": 125920 }, { "epoch": 0.79, "learning_rate": 3.9010729016851865e-05, "loss": 2.2439, "step": 125928 }, { "epoch": 0.79, "learning_rate": 3.900536047253549e-05, "loss": 2.2339, "step": 125936 }, { "epoch": 0.79, "learning_rate": 3.89999924501482e-05, "loss": 2.2281, "step": 125944 }, { "epoch": 0.79, "learning_rate": 3.8994624949823465e-05, "loss": 2.2472, "step": 125952 }, { "epoch": 0.79, "learning_rate": 3.8989257971694695e-05, "loss": 2.2378, "step": 125960 }, { "epoch": 0.79, "learning_rate": 3.898389151589532e-05, "loss": 2.2272, "step": 125968 }, { "epoch": 0.79, "learning_rate": 3.8978525582558796e-05, "loss": 2.241, "step": 125976 }, { "epoch": 0.79, "learning_rate": 3.897316017181845e-05, "loss": 2.2307, "step": 125984 }, { "epoch": 0.79, "learning_rate": 3.896779528380772e-05, "loss": 2.2277, "step": 125992 }, { "epoch": 0.79, "learning_rate": 3.8962430918659964e-05, "loss": 2.2322, "step": 126000 }, { "epoch": 0.79, "learning_rate": 3.895706707650851e-05, "loss": 2.231, "step": 126008 }, { "epoch": 0.79, "learning_rate": 3.8951703757486755e-05, "loss": 2.2405, "step": 126016 }, { "epoch": 0.79, "learning_rate": 3.8946340961728e-05, "loss": 2.2336, "step": 126024 }, { "epoch": 0.79, "learning_rate": 3.8940978689365555e-05, "loss": 2.2354, "step": 126032 }, { "epoch": 0.79, "learning_rate": 3.893561694053276e-05, "loss": 2.2239, "step": 126040 }, { "epoch": 0.79, "learning_rate": 3.893025571536288e-05, "loss": 2.2202, "step": 126048 }, { "epoch": 0.79, "learning_rate": 3.8924895013989214e-05, "loss": 2.2274, "step": 126056 }, { "epoch": 0.79, "learning_rate": 3.8919534836545025e-05, "loss": 2.2526, "step": 126064 }, { "epoch": 0.79, "learning_rate": 3.8914175183163556e-05, "loss": 2.2154, "step": 126072 }, { "epoch": 0.79, "learning_rate": 3.890881605397806e-05, "loss": 2.2292, "step": 126080 }, { "epoch": 0.79, "learning_rate": 3.890345744912178e-05, "loss": 2.2433, "step": 126088 }, { "epoch": 0.79, "learning_rate": 3.8898099368727886e-05, "loss": 2.2274, "step": 126096 }, { "epoch": 0.79, "learning_rate": 3.889274181292963e-05, "loss": 2.2475, "step": 126104 }, { "epoch": 0.79, "learning_rate": 3.888738478186018e-05, "loss": 2.2308, "step": 126112 }, { "epoch": 0.79, "learning_rate": 3.88820282756527e-05, "loss": 2.2253, "step": 126120 }, { "epoch": 0.79, "learning_rate": 3.887667229444038e-05, "loss": 2.2359, "step": 126128 }, { "epoch": 0.79, "learning_rate": 3.8871316838356354e-05, "loss": 2.2311, "step": 126136 }, { "epoch": 0.79, "learning_rate": 3.8865961907533756e-05, "loss": 2.234, "step": 126144 }, { "epoch": 0.79, "learning_rate": 3.886060750210572e-05, "loss": 2.2234, "step": 126152 }, { "epoch": 0.79, "learning_rate": 3.8855253622205357e-05, "loss": 2.2238, "step": 126160 }, { "epoch": 0.79, "learning_rate": 3.884990026796576e-05, "loss": 2.2378, "step": 126168 }, { "epoch": 0.79, "learning_rate": 3.884454743952e-05, "loss": 2.2345, "step": 126176 }, { "epoch": 0.79, "learning_rate": 3.8839195137001174e-05, "loss": 2.2341, "step": 126184 }, { "epoch": 0.79, "learning_rate": 3.883384336054235e-05, "loss": 2.2322, "step": 126192 }, { "epoch": 0.79, "learning_rate": 3.882849211027653e-05, "loss": 2.2462, "step": 126200 }, { "epoch": 0.79, "learning_rate": 3.882314138633678e-05, "loss": 2.2326, "step": 126208 }, { "epoch": 0.79, "learning_rate": 3.881779118885612e-05, "loss": 2.2379, "step": 126216 }, { "epoch": 0.79, "learning_rate": 3.881244151796753e-05, "loss": 2.2232, "step": 126224 }, { "epoch": 0.79, "learning_rate": 3.880709237380404e-05, "loss": 2.2292, "step": 126232 }, { "epoch": 0.79, "learning_rate": 3.8801743756498606e-05, "loss": 2.212, "step": 126240 }, { "epoch": 0.79, "learning_rate": 3.879639566618418e-05, "loss": 2.2425, "step": 126248 }, { "epoch": 0.79, "learning_rate": 3.879104810299376e-05, "loss": 2.2359, "step": 126256 }, { "epoch": 0.79, "learning_rate": 3.878570106706025e-05, "loss": 2.2323, "step": 126264 }, { "epoch": 0.79, "learning_rate": 3.8780354558516605e-05, "loss": 2.2241, "step": 126272 }, { "epoch": 0.79, "learning_rate": 3.877500857749572e-05, "loss": 2.2338, "step": 126280 }, { "epoch": 0.79, "learning_rate": 3.876966312413049e-05, "loss": 2.2371, "step": 126288 }, { "epoch": 0.79, "learning_rate": 3.876431819855384e-05, "loss": 2.2261, "step": 126296 }, { "epoch": 0.79, "learning_rate": 3.875897380089861e-05, "loss": 2.2337, "step": 126304 }, { "epoch": 0.79, "learning_rate": 3.875362993129767e-05, "loss": 2.244, "step": 126312 }, { "epoch": 0.79, "learning_rate": 3.8748286589883887e-05, "loss": 2.2358, "step": 126320 }, { "epoch": 0.79, "learning_rate": 3.874294377679008e-05, "loss": 2.2426, "step": 126328 }, { "epoch": 0.79, "learning_rate": 3.873760149214906e-05, "loss": 2.2377, "step": 126336 }, { "epoch": 0.79, "learning_rate": 3.873225973609367e-05, "loss": 2.2122, "step": 126344 }, { "epoch": 0.79, "learning_rate": 3.872691850875669e-05, "loss": 2.2354, "step": 126352 }, { "epoch": 0.79, "learning_rate": 3.872157781027091e-05, "loss": 2.2112, "step": 126360 }, { "epoch": 0.79, "learning_rate": 3.871623764076906e-05, "loss": 2.2259, "step": 126368 }, { "epoch": 0.79, "learning_rate": 3.871089800038396e-05, "loss": 2.2302, "step": 126376 }, { "epoch": 0.79, "learning_rate": 3.870555888924832e-05, "loss": 2.2297, "step": 126384 }, { "epoch": 0.79, "learning_rate": 3.8700220307494855e-05, "loss": 2.2403, "step": 126392 }, { "epoch": 0.79, "learning_rate": 3.869488225525631e-05, "loss": 2.2329, "step": 126400 }, { "epoch": 0.79, "learning_rate": 3.868954473266541e-05, "loss": 2.2269, "step": 126408 }, { "epoch": 0.79, "learning_rate": 3.868420773985479e-05, "loss": 2.2222, "step": 126416 }, { "epoch": 0.79, "learning_rate": 3.8678871276957176e-05, "loss": 2.2324, "step": 126424 }, { "epoch": 0.79, "learning_rate": 3.867353534410521e-05, "loss": 2.2318, "step": 126432 }, { "epoch": 0.79, "learning_rate": 3.8668199941431524e-05, "loss": 2.2356, "step": 126440 }, { "epoch": 0.79, "learning_rate": 3.8662865069068804e-05, "loss": 2.2277, "step": 126448 }, { "epoch": 0.79, "learning_rate": 3.865753072714964e-05, "loss": 2.2269, "step": 126456 }, { "epoch": 0.79, "learning_rate": 3.8652196915806674e-05, "loss": 2.2391, "step": 126464 }, { "epoch": 0.79, "learning_rate": 3.864686363517247e-05, "loss": 2.2311, "step": 126472 }, { "epoch": 0.79, "learning_rate": 3.864153088537964e-05, "loss": 2.232, "step": 126480 }, { "epoch": 0.79, "learning_rate": 3.863619866656075e-05, "loss": 2.2384, "step": 126488 }, { "epoch": 0.79, "learning_rate": 3.863086697884837e-05, "loss": 2.2309, "step": 126496 }, { "epoch": 0.79, "learning_rate": 3.8625535822375006e-05, "loss": 2.221, "step": 126504 }, { "epoch": 0.79, "learning_rate": 3.862020519727324e-05, "loss": 2.2436, "step": 126512 }, { "epoch": 0.79, "learning_rate": 3.8614875103675566e-05, "loss": 2.2327, "step": 126520 }, { "epoch": 0.79, "learning_rate": 3.8609545541714494e-05, "loss": 2.218, "step": 126528 }, { "epoch": 0.79, "learning_rate": 3.860421651152253e-05, "loss": 2.2503, "step": 126536 }, { "epoch": 0.79, "learning_rate": 3.859888801323214e-05, "loss": 2.2338, "step": 126544 }, { "epoch": 0.79, "learning_rate": 3.859356004697578e-05, "loss": 2.2533, "step": 126552 }, { "epoch": 0.79, "learning_rate": 3.8588232612885934e-05, "loss": 2.2212, "step": 126560 }, { "epoch": 0.79, "learning_rate": 3.858290571109503e-05, "loss": 2.2197, "step": 126568 }, { "epoch": 0.79, "learning_rate": 3.8577579341735494e-05, "loss": 2.241, "step": 126576 }, { "epoch": 0.79, "learning_rate": 3.857225350493972e-05, "loss": 2.2221, "step": 126584 }, { "epoch": 0.79, "learning_rate": 3.8566928200840146e-05, "loss": 2.2294, "step": 126592 }, { "epoch": 0.79, "learning_rate": 3.8561603429569136e-05, "loss": 2.2343, "step": 126600 }, { "epoch": 0.79, "learning_rate": 3.855627919125906e-05, "loss": 2.2296, "step": 126608 }, { "epoch": 0.79, "learning_rate": 3.855095548604229e-05, "loss": 2.2274, "step": 126616 }, { "epoch": 0.79, "learning_rate": 3.854563231405121e-05, "loss": 2.2421, "step": 126624 }, { "epoch": 0.79, "learning_rate": 3.854030967541808e-05, "loss": 2.2292, "step": 126632 }, { "epoch": 0.79, "learning_rate": 3.853498757027527e-05, "loss": 2.2357, "step": 126640 }, { "epoch": 0.79, "learning_rate": 3.8529665998755084e-05, "loss": 2.2342, "step": 126648 }, { "epoch": 0.79, "learning_rate": 3.852434496098979e-05, "loss": 2.2129, "step": 126656 }, { "epoch": 0.79, "learning_rate": 3.8519024457111705e-05, "loss": 2.2233, "step": 126664 }, { "epoch": 0.79, "learning_rate": 3.8513704487253075e-05, "loss": 2.261, "step": 126672 }, { "epoch": 0.79, "learning_rate": 3.850838505154617e-05, "loss": 2.2364, "step": 126680 }, { "epoch": 0.79, "learning_rate": 3.850306615012322e-05, "loss": 2.2336, "step": 126688 }, { "epoch": 0.79, "learning_rate": 3.8497747783116455e-05, "loss": 2.2512, "step": 126696 }, { "epoch": 0.79, "learning_rate": 3.84924299506581e-05, "loss": 2.2496, "step": 126704 }, { "epoch": 0.79, "learning_rate": 3.848711265288035e-05, "loss": 2.2296, "step": 126712 }, { "epoch": 0.79, "learning_rate": 3.848179588991539e-05, "loss": 2.2399, "step": 126720 }, { "epoch": 0.79, "learning_rate": 3.847647966189541e-05, "loss": 2.2392, "step": 126728 }, { "epoch": 0.79, "learning_rate": 3.847116396895254e-05, "loss": 2.2525, "step": 126736 }, { "epoch": 0.79, "learning_rate": 3.846584881121895e-05, "loss": 2.2693, "step": 126744 }, { "epoch": 0.79, "learning_rate": 3.846053418882678e-05, "loss": 2.2498, "step": 126752 }, { "epoch": 0.79, "learning_rate": 3.845522010190816e-05, "loss": 2.2354, "step": 126760 }, { "epoch": 0.79, "learning_rate": 3.8449906550595155e-05, "loss": 2.245, "step": 126768 }, { "epoch": 0.79, "learning_rate": 3.844459353501992e-05, "loss": 2.2451, "step": 126776 }, { "epoch": 0.79, "learning_rate": 3.84392810553145e-05, "loss": 2.2376, "step": 126784 }, { "epoch": 0.79, "learning_rate": 3.843396911161097e-05, "loss": 2.2385, "step": 126792 }, { "epoch": 0.79, "learning_rate": 3.842865770404138e-05, "loss": 2.2472, "step": 126800 }, { "epoch": 0.79, "learning_rate": 3.842334683273778e-05, "loss": 2.2517, "step": 126808 }, { "epoch": 0.79, "learning_rate": 3.8418036497832226e-05, "loss": 2.2148, "step": 126816 }, { "epoch": 0.79, "learning_rate": 3.841272669945668e-05, "loss": 2.248, "step": 126824 }, { "epoch": 0.79, "learning_rate": 3.8407417437743165e-05, "loss": 2.2347, "step": 126832 }, { "epoch": 0.79, "learning_rate": 3.8402108712823705e-05, "loss": 2.2309, "step": 126840 }, { "epoch": 0.79, "learning_rate": 3.839680052483022e-05, "loss": 2.2442, "step": 126848 }, { "epoch": 0.79, "learning_rate": 3.8391492873894705e-05, "loss": 2.2365, "step": 126856 }, { "epoch": 0.79, "learning_rate": 3.8386185760149106e-05, "loss": 2.2582, "step": 126864 }, { "epoch": 0.79, "learning_rate": 3.838087918372534e-05, "loss": 2.2394, "step": 126872 }, { "epoch": 0.79, "learning_rate": 3.837557314475536e-05, "loss": 2.2298, "step": 126880 }, { "epoch": 0.79, "learning_rate": 3.837026764337104e-05, "loss": 2.2474, "step": 126888 }, { "epoch": 0.79, "learning_rate": 3.836496267970431e-05, "loss": 2.2383, "step": 126896 }, { "epoch": 0.79, "learning_rate": 3.835965825388703e-05, "loss": 2.2328, "step": 126904 }, { "epoch": 0.79, "learning_rate": 3.835435436605106e-05, "loss": 2.243, "step": 126912 }, { "epoch": 0.79, "learning_rate": 3.834905101632829e-05, "loss": 2.2521, "step": 126920 }, { "epoch": 0.79, "learning_rate": 3.8343748204850536e-05, "loss": 2.2398, "step": 126928 }, { "epoch": 0.79, "learning_rate": 3.833844593174962e-05, "loss": 2.2336, "step": 126936 }, { "epoch": 0.79, "learning_rate": 3.83331441971574e-05, "loss": 2.2286, "step": 126944 }, { "epoch": 0.79, "learning_rate": 3.832784300120561e-05, "loss": 2.2435, "step": 126952 }, { "epoch": 0.79, "learning_rate": 3.832254234402608e-05, "loss": 2.2341, "step": 126960 }, { "epoch": 0.79, "learning_rate": 3.831724222575059e-05, "loss": 2.2363, "step": 126968 }, { "epoch": 0.79, "learning_rate": 3.83119426465109e-05, "loss": 2.2202, "step": 126976 }, { "epoch": 0.79, "learning_rate": 3.830664360643872e-05, "loss": 2.2307, "step": 126984 }, { "epoch": 0.79, "learning_rate": 3.830134510566584e-05, "loss": 2.2456, "step": 126992 }, { "epoch": 0.79, "learning_rate": 3.829604714432395e-05, "loss": 2.2415, "step": 127000 }, { "epoch": 0.79, "learning_rate": 3.829074972254476e-05, "loss": 2.2326, "step": 127008 }, { "epoch": 0.79, "learning_rate": 3.8285452840459965e-05, "loss": 2.2352, "step": 127016 }, { "epoch": 0.79, "learning_rate": 3.828015649820124e-05, "loss": 2.2346, "step": 127024 }, { "epoch": 0.79, "learning_rate": 3.8274860695900286e-05, "loss": 2.2462, "step": 127032 }, { "epoch": 0.79, "learning_rate": 3.826956543368871e-05, "loss": 2.2264, "step": 127040 }, { "epoch": 0.79, "learning_rate": 3.826427071169819e-05, "loss": 2.2461, "step": 127048 }, { "epoch": 0.79, "learning_rate": 3.825897653006034e-05, "loss": 2.2516, "step": 127056 }, { "epoch": 0.79, "learning_rate": 3.825368288890675e-05, "loss": 2.2294, "step": 127064 }, { "epoch": 0.79, "learning_rate": 3.8248389788369066e-05, "loss": 2.2288, "step": 127072 }, { "epoch": 0.79, "learning_rate": 3.824309722857885e-05, "loss": 2.2407, "step": 127080 }, { "epoch": 0.79, "learning_rate": 3.823780520966767e-05, "loss": 2.2304, "step": 127088 }, { "epoch": 0.79, "learning_rate": 3.82325137317671e-05, "loss": 2.229, "step": 127096 }, { "epoch": 0.79, "learning_rate": 3.822722279500866e-05, "loss": 2.2223, "step": 127104 }, { "epoch": 0.79, "learning_rate": 3.822193239952393e-05, "loss": 2.2341, "step": 127112 }, { "epoch": 0.79, "learning_rate": 3.8216642545444404e-05, "loss": 2.2205, "step": 127120 }, { "epoch": 0.79, "learning_rate": 3.821135323290157e-05, "loss": 2.2244, "step": 127128 }, { "epoch": 0.79, "learning_rate": 3.820606446202695e-05, "loss": 2.2333, "step": 127136 }, { "epoch": 0.79, "learning_rate": 3.820077623295202e-05, "loss": 2.232, "step": 127144 }, { "epoch": 0.79, "learning_rate": 3.819548854580822e-05, "loss": 2.2261, "step": 127152 }, { "epoch": 0.79, "learning_rate": 3.819020140072704e-05, "loss": 2.2457, "step": 127160 }, { "epoch": 0.79, "learning_rate": 3.81849147978399e-05, "loss": 2.2371, "step": 127168 }, { "epoch": 0.79, "learning_rate": 3.8179628737278205e-05, "loss": 2.2238, "step": 127176 }, { "epoch": 0.79, "learning_rate": 3.817434321917341e-05, "loss": 2.2261, "step": 127184 }, { "epoch": 0.79, "learning_rate": 3.8169058243656886e-05, "loss": 2.2342, "step": 127192 }, { "epoch": 0.8, "learning_rate": 3.816377381086003e-05, "loss": 2.2409, "step": 127200 }, { "epoch": 0.8, "learning_rate": 3.8158489920914184e-05, "loss": 2.2218, "step": 127208 }, { "epoch": 0.8, "learning_rate": 3.815320657395075e-05, "loss": 2.2333, "step": 127216 }, { "epoch": 0.8, "learning_rate": 3.814792377010105e-05, "loss": 2.2307, "step": 127224 }, { "epoch": 0.8, "learning_rate": 3.81426415094964e-05, "loss": 2.2279, "step": 127232 }, { "epoch": 0.8, "learning_rate": 3.813735979226813e-05, "loss": 2.2232, "step": 127240 }, { "epoch": 0.8, "learning_rate": 3.8132078618547585e-05, "loss": 2.226, "step": 127248 }, { "epoch": 0.8, "learning_rate": 3.812679798846599e-05, "loss": 2.2286, "step": 127256 }, { "epoch": 0.8, "learning_rate": 3.812151790215466e-05, "loss": 2.2203, "step": 127264 }, { "epoch": 0.8, "learning_rate": 3.811623835974486e-05, "loss": 2.235, "step": 127272 }, { "epoch": 0.8, "learning_rate": 3.8110959361367806e-05, "loss": 2.2381, "step": 127280 }, { "epoch": 0.8, "learning_rate": 3.810568090715477e-05, "loss": 2.2415, "step": 127288 }, { "epoch": 0.8, "learning_rate": 3.810040299723697e-05, "loss": 2.237, "step": 127296 }, { "epoch": 0.8, "learning_rate": 3.8095125631745594e-05, "loss": 2.2161, "step": 127304 }, { "epoch": 0.8, "learning_rate": 3.808984881081186e-05, "loss": 2.2326, "step": 127312 }, { "epoch": 0.8, "learning_rate": 3.808457253456694e-05, "loss": 2.2341, "step": 127320 }, { "epoch": 0.8, "learning_rate": 3.807929680314201e-05, "loss": 2.2222, "step": 127328 }, { "epoch": 0.8, "learning_rate": 3.807402161666823e-05, "loss": 2.2321, "step": 127336 }, { "epoch": 0.8, "learning_rate": 3.806874697527671e-05, "loss": 2.2281, "step": 127344 }, { "epoch": 0.8, "learning_rate": 3.8063472879098615e-05, "loss": 2.2208, "step": 127352 }, { "epoch": 0.8, "learning_rate": 3.8058199328265055e-05, "loss": 2.2355, "step": 127360 }, { "epoch": 0.8, "learning_rate": 3.8052926322907093e-05, "loss": 2.2244, "step": 127368 }, { "epoch": 0.8, "learning_rate": 3.804765386315588e-05, "loss": 2.2329, "step": 127376 }, { "epoch": 0.8, "learning_rate": 3.804238194914244e-05, "loss": 2.2363, "step": 127384 }, { "epoch": 0.8, "learning_rate": 3.803711058099783e-05, "loss": 2.2409, "step": 127392 }, { "epoch": 0.8, "learning_rate": 3.8031839758853135e-05, "loss": 2.2299, "step": 127400 }, { "epoch": 0.8, "learning_rate": 3.8026569482839376e-05, "loss": 2.2293, "step": 127408 }, { "epoch": 0.8, "learning_rate": 3.802129975308755e-05, "loss": 2.244, "step": 127416 }, { "epoch": 0.8, "learning_rate": 3.801603056972868e-05, "loss": 2.224, "step": 127424 }, { "epoch": 0.8, "learning_rate": 3.8010761932893755e-05, "loss": 2.2212, "step": 127432 }, { "epoch": 0.8, "learning_rate": 3.800549384271377e-05, "loss": 2.2329, "step": 127440 }, { "epoch": 0.8, "learning_rate": 3.800022629931965e-05, "loss": 2.2274, "step": 127448 }, { "epoch": 0.8, "learning_rate": 3.799495930284238e-05, "loss": 2.2499, "step": 127456 }, { "epoch": 0.8, "learning_rate": 3.798969285341292e-05, "loss": 2.2302, "step": 127464 }, { "epoch": 0.8, "learning_rate": 3.7984426951162136e-05, "loss": 2.2298, "step": 127472 }, { "epoch": 0.8, "learning_rate": 3.7979161596220966e-05, "loss": 2.2318, "step": 127480 }, { "epoch": 0.8, "learning_rate": 3.7973896788720334e-05, "loss": 2.2259, "step": 127488 }, { "epoch": 0.8, "learning_rate": 3.796863252879107e-05, "loss": 2.2277, "step": 127496 }, { "epoch": 0.8, "learning_rate": 3.796336881656409e-05, "loss": 2.2213, "step": 127504 }, { "epoch": 0.8, "learning_rate": 3.7958105652170225e-05, "loss": 2.2175, "step": 127512 }, { "epoch": 0.8, "learning_rate": 3.7952843035740336e-05, "loss": 2.2357, "step": 127520 }, { "epoch": 0.8, "learning_rate": 3.794758096740524e-05, "loss": 2.2236, "step": 127528 }, { "epoch": 0.8, "learning_rate": 3.794231944729574e-05, "loss": 2.2257, "step": 127536 }, { "epoch": 0.8, "learning_rate": 3.793705847554267e-05, "loss": 2.2098, "step": 127544 }, { "epoch": 0.8, "learning_rate": 3.793179805227681e-05, "loss": 2.2384, "step": 127552 }, { "epoch": 0.8, "learning_rate": 3.792653817762891e-05, "loss": 2.2355, "step": 127560 }, { "epoch": 0.8, "learning_rate": 3.792127885172977e-05, "loss": 2.2277, "step": 127568 }, { "epoch": 0.8, "learning_rate": 3.791602007471009e-05, "loss": 2.2162, "step": 127576 }, { "epoch": 0.8, "learning_rate": 3.791076184670062e-05, "loss": 2.2111, "step": 127584 }, { "epoch": 0.8, "learning_rate": 3.790550416783212e-05, "loss": 2.2283, "step": 127592 }, { "epoch": 0.8, "learning_rate": 3.7900247038235245e-05, "loss": 2.2291, "step": 127600 }, { "epoch": 0.8, "learning_rate": 3.7894990458040705e-05, "loss": 2.2403, "step": 127608 }, { "epoch": 0.8, "learning_rate": 3.78897344273792e-05, "loss": 2.2342, "step": 127616 }, { "epoch": 0.8, "learning_rate": 3.788447894638137e-05, "loss": 2.2338, "step": 127624 }, { "epoch": 0.8, "learning_rate": 3.787922401517788e-05, "loss": 2.2103, "step": 127632 }, { "epoch": 0.8, "learning_rate": 3.787396963389935e-05, "loss": 2.2402, "step": 127640 }, { "epoch": 0.8, "learning_rate": 3.786871580267643e-05, "loss": 2.2407, "step": 127648 }, { "epoch": 0.8, "learning_rate": 3.786346252163972e-05, "loss": 2.2278, "step": 127656 }, { "epoch": 0.8, "learning_rate": 3.7858209790919794e-05, "loss": 2.2182, "step": 127664 }, { "epoch": 0.8, "learning_rate": 3.785295761064726e-05, "loss": 2.232, "step": 127672 }, { "epoch": 0.8, "learning_rate": 3.784770598095271e-05, "loss": 2.2206, "step": 127680 }, { "epoch": 0.8, "learning_rate": 3.7842454901966656e-05, "loss": 2.2375, "step": 127688 }, { "epoch": 0.8, "learning_rate": 3.783720437381967e-05, "loss": 2.2331, "step": 127696 }, { "epoch": 0.8, "learning_rate": 3.783195439664227e-05, "loss": 2.2283, "step": 127704 }, { "epoch": 0.8, "learning_rate": 3.782670497056495e-05, "loss": 2.2352, "step": 127712 }, { "epoch": 0.8, "learning_rate": 3.782145609571826e-05, "loss": 2.2176, "step": 127720 }, { "epoch": 0.8, "learning_rate": 3.7816207772232624e-05, "loss": 2.2298, "step": 127728 }, { "epoch": 0.8, "learning_rate": 3.7810960000238584e-05, "loss": 2.2341, "step": 127736 }, { "epoch": 0.8, "learning_rate": 3.780571277986656e-05, "loss": 2.2243, "step": 127744 }, { "epoch": 0.8, "learning_rate": 3.7800466111246995e-05, "loss": 2.2376, "step": 127752 }, { "epoch": 0.8, "learning_rate": 3.779521999451035e-05, "loss": 2.2484, "step": 127760 }, { "epoch": 0.8, "learning_rate": 3.778997442978702e-05, "loss": 2.242, "step": 127768 }, { "epoch": 0.8, "learning_rate": 3.778472941720741e-05, "loss": 2.2434, "step": 127776 }, { "epoch": 0.8, "learning_rate": 3.7779484956901946e-05, "loss": 2.2285, "step": 127784 }, { "epoch": 0.8, "learning_rate": 3.777424104900095e-05, "loss": 2.2251, "step": 127792 }, { "epoch": 0.8, "learning_rate": 3.7768997693634815e-05, "loss": 2.2297, "step": 127800 }, { "epoch": 0.8, "learning_rate": 3.7763754890933906e-05, "loss": 2.2491, "step": 127808 }, { "epoch": 0.8, "learning_rate": 3.7758512641028545e-05, "loss": 2.239, "step": 127816 }, { "epoch": 0.8, "learning_rate": 3.775327094404904e-05, "loss": 2.2311, "step": 127824 }, { "epoch": 0.8, "learning_rate": 3.774802980012573e-05, "loss": 2.2215, "step": 127832 }, { "epoch": 0.8, "learning_rate": 3.774278920938889e-05, "loss": 2.2379, "step": 127840 }, { "epoch": 0.8, "learning_rate": 3.773754917196882e-05, "loss": 2.2383, "step": 127848 }, { "epoch": 0.8, "learning_rate": 3.773230968799576e-05, "loss": 2.244, "step": 127856 }, { "epoch": 0.8, "learning_rate": 3.7727070757599974e-05, "loss": 2.2296, "step": 127864 }, { "epoch": 0.8, "learning_rate": 3.7721832380911736e-05, "loss": 2.2405, "step": 127872 }, { "epoch": 0.8, "learning_rate": 3.771659455806122e-05, "loss": 2.2293, "step": 127880 }, { "epoch": 0.8, "learning_rate": 3.771135728917867e-05, "loss": 2.2387, "step": 127888 }, { "epoch": 0.8, "learning_rate": 3.770612057439429e-05, "loss": 2.2326, "step": 127896 }, { "epoch": 0.8, "learning_rate": 3.770088441383823e-05, "loss": 2.2366, "step": 127904 }, { "epoch": 0.8, "learning_rate": 3.76956488076407e-05, "loss": 2.236, "step": 127912 }, { "epoch": 0.8, "learning_rate": 3.7690413755931846e-05, "loss": 2.2256, "step": 127920 }, { "epoch": 0.8, "learning_rate": 3.7685179258841795e-05, "loss": 2.2198, "step": 127928 }, { "epoch": 0.8, "learning_rate": 3.7679945316500706e-05, "loss": 2.2345, "step": 127936 }, { "epoch": 0.8, "learning_rate": 3.767471192903866e-05, "loss": 2.2396, "step": 127944 }, { "epoch": 0.8, "learning_rate": 3.76694790965858e-05, "loss": 2.2253, "step": 127952 }, { "epoch": 0.8, "learning_rate": 3.7664246819272205e-05, "loss": 2.2415, "step": 127960 }, { "epoch": 0.8, "learning_rate": 3.765901509722791e-05, "loss": 2.2301, "step": 127968 }, { "epoch": 0.8, "learning_rate": 3.765378393058303e-05, "loss": 2.2085, "step": 127976 }, { "epoch": 0.8, "learning_rate": 3.7648553319467585e-05, "loss": 2.2443, "step": 127984 }, { "epoch": 0.8, "learning_rate": 3.76433232640116e-05, "loss": 2.2272, "step": 127992 }, { "epoch": 0.8, "learning_rate": 3.763809376434513e-05, "loss": 2.2225, "step": 128000 }, { "epoch": 0.8, "learning_rate": 3.763286482059814e-05, "loss": 2.2199, "step": 128008 }, { "epoch": 0.8, "learning_rate": 3.7627636432900634e-05, "loss": 2.2239, "step": 128016 }, { "epoch": 0.8, "learning_rate": 3.76224086013826e-05, "loss": 2.218, "step": 128024 }, { "epoch": 0.8, "learning_rate": 3.7617181326174015e-05, "loss": 2.2219, "step": 128032 }, { "epoch": 0.8, "learning_rate": 3.761195460740479e-05, "loss": 2.2301, "step": 128040 }, { "epoch": 0.8, "learning_rate": 3.760672844520491e-05, "loss": 2.2317, "step": 128048 }, { "epoch": 0.8, "learning_rate": 3.7601502839704264e-05, "loss": 2.228, "step": 128056 }, { "epoch": 0.8, "learning_rate": 3.759627779103277e-05, "loss": 2.2358, "step": 128064 }, { "epoch": 0.8, "learning_rate": 3.759105329932031e-05, "loss": 2.2249, "step": 128072 }, { "epoch": 0.8, "learning_rate": 3.7585829364696786e-05, "loss": 2.2391, "step": 128080 }, { "epoch": 0.8, "learning_rate": 3.758060598729208e-05, "loss": 2.2203, "step": 128088 }, { "epoch": 0.8, "learning_rate": 3.7575383167236e-05, "loss": 2.2337, "step": 128096 }, { "epoch": 0.8, "learning_rate": 3.757016090465843e-05, "loss": 2.2302, "step": 128104 }, { "epoch": 0.8, "learning_rate": 3.7564939199689166e-05, "loss": 2.2377, "step": 128112 }, { "epoch": 0.8, "learning_rate": 3.755971805245801e-05, "loss": 2.2442, "step": 128120 }, { "epoch": 0.8, "learning_rate": 3.755449746309481e-05, "loss": 2.2353, "step": 128128 }, { "epoch": 0.8, "learning_rate": 3.7549277431729326e-05, "loss": 2.2241, "step": 128136 }, { "epoch": 0.8, "learning_rate": 3.7544057958491296e-05, "loss": 2.2393, "step": 128144 }, { "epoch": 0.8, "learning_rate": 3.753883904351052e-05, "loss": 2.2403, "step": 128152 }, { "epoch": 0.8, "learning_rate": 3.753362068691672e-05, "loss": 2.2473, "step": 128160 }, { "epoch": 0.8, "learning_rate": 3.752840288883964e-05, "loss": 2.2329, "step": 128168 }, { "epoch": 0.8, "learning_rate": 3.752318564940898e-05, "loss": 2.2305, "step": 128176 }, { "epoch": 0.8, "learning_rate": 3.751796896875444e-05, "loss": 2.2473, "step": 128184 }, { "epoch": 0.8, "learning_rate": 3.751275284700573e-05, "loss": 2.2215, "step": 128192 }, { "epoch": 0.8, "learning_rate": 3.75075372842925e-05, "loss": 2.2394, "step": 128200 }, { "epoch": 0.8, "learning_rate": 3.7502322280744403e-05, "loss": 2.2349, "step": 128208 }, { "epoch": 0.8, "learning_rate": 3.749710783649112e-05, "loss": 2.2303, "step": 128216 }, { "epoch": 0.8, "learning_rate": 3.749189395166225e-05, "loss": 2.2303, "step": 128224 }, { "epoch": 0.8, "learning_rate": 3.748668062638742e-05, "loss": 2.2426, "step": 128232 }, { "epoch": 0.8, "learning_rate": 3.7481467860796236e-05, "loss": 2.2345, "step": 128240 }, { "epoch": 0.8, "learning_rate": 3.747625565501829e-05, "loss": 2.2261, "step": 128248 }, { "epoch": 0.8, "learning_rate": 3.747104400918317e-05, "loss": 2.2423, "step": 128256 }, { "epoch": 0.8, "learning_rate": 3.7465832923420395e-05, "loss": 2.2264, "step": 128264 }, { "epoch": 0.8, "learning_rate": 3.746062239785956e-05, "loss": 2.2319, "step": 128272 }, { "epoch": 0.8, "learning_rate": 3.745541243263018e-05, "loss": 2.2384, "step": 128280 }, { "epoch": 0.8, "learning_rate": 3.745020302786177e-05, "loss": 2.2454, "step": 128288 }, { "epoch": 0.8, "learning_rate": 3.744499418368383e-05, "loss": 2.2379, "step": 128296 }, { "epoch": 0.8, "learning_rate": 3.7439785900225904e-05, "loss": 2.2458, "step": 128304 }, { "epoch": 0.8, "learning_rate": 3.74345781776174e-05, "loss": 2.2334, "step": 128312 }, { "epoch": 0.8, "learning_rate": 3.742937101598783e-05, "loss": 2.2313, "step": 128320 }, { "epoch": 0.8, "learning_rate": 3.742416441546662e-05, "loss": 2.2448, "step": 128328 }, { "epoch": 0.8, "learning_rate": 3.741895837618321e-05, "loss": 2.2095, "step": 128336 }, { "epoch": 0.8, "learning_rate": 3.741375289826705e-05, "loss": 2.2231, "step": 128344 }, { "epoch": 0.8, "learning_rate": 3.740854798184751e-05, "loss": 2.2348, "step": 128352 }, { "epoch": 0.8, "learning_rate": 3.7403343627054e-05, "loss": 2.2409, "step": 128360 }, { "epoch": 0.8, "learning_rate": 3.739813983401591e-05, "loss": 2.2243, "step": 128368 }, { "epoch": 0.8, "learning_rate": 3.7392936602862586e-05, "loss": 2.2334, "step": 128376 }, { "epoch": 0.8, "learning_rate": 3.738773393372341e-05, "loss": 2.2329, "step": 128384 }, { "epoch": 0.8, "learning_rate": 3.7382531826727705e-05, "loss": 2.2292, "step": 128392 }, { "epoch": 0.8, "learning_rate": 3.737733028200479e-05, "loss": 2.2237, "step": 128400 }, { "epoch": 0.8, "learning_rate": 3.7372129299684e-05, "loss": 2.2255, "step": 128408 }, { "epoch": 0.8, "learning_rate": 3.736692887989459e-05, "loss": 2.234, "step": 128416 }, { "epoch": 0.8, "learning_rate": 3.7361729022765865e-05, "loss": 2.2342, "step": 128424 }, { "epoch": 0.8, "learning_rate": 3.735652972842711e-05, "loss": 2.2345, "step": 128432 }, { "epoch": 0.8, "learning_rate": 3.735133099700757e-05, "loss": 2.2264, "step": 128440 }, { "epoch": 0.8, "learning_rate": 3.734613282863647e-05, "loss": 2.2303, "step": 128448 }, { "epoch": 0.8, "learning_rate": 3.7340935223443066e-05, "loss": 2.2404, "step": 128456 }, { "epoch": 0.8, "learning_rate": 3.733573818155655e-05, "loss": 2.2554, "step": 128464 }, { "epoch": 0.8, "learning_rate": 3.733054170310613e-05, "loss": 2.2359, "step": 128472 }, { "epoch": 0.8, "learning_rate": 3.732534578822096e-05, "loss": 2.2409, "step": 128480 }, { "epoch": 0.8, "learning_rate": 3.732015043703026e-05, "loss": 2.2393, "step": 128488 }, { "epoch": 0.8, "learning_rate": 3.731495564966317e-05, "loss": 2.2444, "step": 128496 }, { "epoch": 0.8, "learning_rate": 3.7309761426248805e-05, "loss": 2.2336, "step": 128504 }, { "epoch": 0.8, "learning_rate": 3.730456776691632e-05, "loss": 2.2443, "step": 128512 }, { "epoch": 0.8, "learning_rate": 3.7299374671794854e-05, "loss": 2.2291, "step": 128520 }, { "epoch": 0.8, "learning_rate": 3.729418214101346e-05, "loss": 2.2256, "step": 128528 }, { "epoch": 0.8, "learning_rate": 3.728899017470125e-05, "loss": 2.2306, "step": 128536 }, { "epoch": 0.8, "learning_rate": 3.72837987729873e-05, "loss": 2.2418, "step": 128544 }, { "epoch": 0.8, "learning_rate": 3.7278607936000645e-05, "loss": 2.2293, "step": 128552 }, { "epoch": 0.8, "learning_rate": 3.727341766387036e-05, "loss": 2.2245, "step": 128560 }, { "epoch": 0.8, "learning_rate": 3.7268227956725446e-05, "loss": 2.2308, "step": 128568 }, { "epoch": 0.8, "learning_rate": 3.7263038814694947e-05, "loss": 2.2417, "step": 128576 }, { "epoch": 0.8, "learning_rate": 3.7257850237907856e-05, "loss": 2.2341, "step": 128584 }, { "epoch": 0.8, "learning_rate": 3.725266222649315e-05, "loss": 2.232, "step": 128592 }, { "epoch": 0.8, "learning_rate": 3.724747478057982e-05, "loss": 2.2191, "step": 128600 }, { "epoch": 0.8, "learning_rate": 3.7242287900296824e-05, "loss": 2.2337, "step": 128608 }, { "epoch": 0.8, "learning_rate": 3.723710158577309e-05, "loss": 2.245, "step": 128616 }, { "epoch": 0.8, "learning_rate": 3.723191583713759e-05, "loss": 2.2381, "step": 128624 }, { "epoch": 0.8, "learning_rate": 3.7226730654519186e-05, "loss": 2.2179, "step": 128632 }, { "epoch": 0.8, "learning_rate": 3.722154603804682e-05, "loss": 2.2462, "step": 128640 }, { "epoch": 0.8, "learning_rate": 3.721636198784939e-05, "loss": 2.2252, "step": 128648 }, { "epoch": 0.8, "learning_rate": 3.721117850405575e-05, "loss": 2.225, "step": 128656 }, { "epoch": 0.8, "learning_rate": 3.720599558679476e-05, "loss": 2.2347, "step": 128664 }, { "epoch": 0.8, "learning_rate": 3.720081323619529e-05, "loss": 2.24, "step": 128672 }, { "epoch": 0.8, "learning_rate": 3.719563145238616e-05, "loss": 2.2397, "step": 128680 }, { "epoch": 0.8, "learning_rate": 3.719045023549619e-05, "loss": 2.2241, "step": 128688 }, { "epoch": 0.8, "learning_rate": 3.718526958565418e-05, "loss": 2.2312, "step": 128696 }, { "epoch": 0.8, "learning_rate": 3.718008950298894e-05, "loss": 2.233, "step": 128704 }, { "epoch": 0.8, "learning_rate": 3.717490998762922e-05, "loss": 2.2234, "step": 128712 }, { "epoch": 0.8, "learning_rate": 3.7169731039703804e-05, "loss": 2.2416, "step": 128720 }, { "epoch": 0.8, "learning_rate": 3.716455265934144e-05, "loss": 2.227, "step": 128728 }, { "epoch": 0.8, "learning_rate": 3.715937484667086e-05, "loss": 2.2468, "step": 128736 }, { "epoch": 0.8, "learning_rate": 3.7154197601820774e-05, "loss": 2.2326, "step": 128744 }, { "epoch": 0.8, "learning_rate": 3.714902092491991e-05, "loss": 2.2367, "step": 128752 }, { "epoch": 0.8, "learning_rate": 3.714384481609695e-05, "loss": 2.2189, "step": 128760 }, { "epoch": 0.8, "learning_rate": 3.713866927548055e-05, "loss": 2.2433, "step": 128768 }, { "epoch": 0.8, "learning_rate": 3.7133494303199424e-05, "loss": 2.2456, "step": 128776 }, { "epoch": 0.8, "learning_rate": 3.712831989938217e-05, "loss": 2.2331, "step": 128784 }, { "epoch": 0.8, "learning_rate": 3.712314606415748e-05, "loss": 2.2286, "step": 128792 }, { "epoch": 0.81, "learning_rate": 3.711797279765393e-05, "loss": 2.2357, "step": 128800 }, { "epoch": 0.81, "learning_rate": 3.7112800100000135e-05, "loss": 2.2218, "step": 128808 }, { "epoch": 0.81, "learning_rate": 3.710762797132471e-05, "loss": 2.2169, "step": 128816 }, { "epoch": 0.81, "learning_rate": 3.7102456411756226e-05, "loss": 2.2409, "step": 128824 }, { "epoch": 0.81, "learning_rate": 3.7097285421423225e-05, "loss": 2.2314, "step": 128832 }, { "epoch": 0.81, "learning_rate": 3.7092115000454306e-05, "loss": 2.2439, "step": 128840 }, { "epoch": 0.81, "learning_rate": 3.708694514897796e-05, "loss": 2.2382, "step": 128848 }, { "epoch": 0.81, "learning_rate": 3.708177586712271e-05, "loss": 2.2284, "step": 128856 }, { "epoch": 0.81, "learning_rate": 3.7076607155017115e-05, "loss": 2.2189, "step": 128864 }, { "epoch": 0.81, "learning_rate": 3.7071439012789634e-05, "loss": 2.2245, "step": 128872 }, { "epoch": 0.81, "learning_rate": 3.706627144056873e-05, "loss": 2.221, "step": 128880 }, { "epoch": 0.81, "learning_rate": 3.7061104438482917e-05, "loss": 2.2379, "step": 128888 }, { "epoch": 0.81, "learning_rate": 3.705593800666061e-05, "loss": 2.2222, "step": 128896 }, { "epoch": 0.81, "learning_rate": 3.705077214523027e-05, "loss": 2.2302, "step": 128904 }, { "epoch": 0.81, "learning_rate": 3.704560685432028e-05, "loss": 2.2354, "step": 128912 }, { "epoch": 0.81, "learning_rate": 3.704044213405909e-05, "loss": 2.2305, "step": 128920 }, { "epoch": 0.81, "learning_rate": 3.703527798457511e-05, "loss": 2.2257, "step": 128928 }, { "epoch": 0.81, "learning_rate": 3.703011440599667e-05, "loss": 2.2413, "step": 128936 }, { "epoch": 0.81, "learning_rate": 3.702495139845217e-05, "loss": 2.2303, "step": 128944 }, { "epoch": 0.81, "learning_rate": 3.701978896206997e-05, "loss": 2.2362, "step": 128952 }, { "epoch": 0.81, "learning_rate": 3.7014627096978364e-05, "loss": 2.2246, "step": 128960 }, { "epoch": 0.81, "learning_rate": 3.7009465803305735e-05, "loss": 2.2222, "step": 128968 }, { "epoch": 0.81, "learning_rate": 3.700430508118036e-05, "loss": 2.2305, "step": 128976 }, { "epoch": 0.81, "learning_rate": 3.6999144930730526e-05, "loss": 2.2263, "step": 128984 }, { "epoch": 0.81, "learning_rate": 3.699398535208454e-05, "loss": 2.2323, "step": 128992 }, { "epoch": 0.81, "learning_rate": 3.6988826345370656e-05, "loss": 2.23, "step": 129000 }, { "epoch": 0.81, "learning_rate": 3.698366791071713e-05, "loss": 2.2245, "step": 129008 }, { "epoch": 0.81, "learning_rate": 3.6978510048252214e-05, "loss": 2.2347, "step": 129016 }, { "epoch": 0.81, "learning_rate": 3.6973352758104106e-05, "loss": 2.2351, "step": 129024 }, { "epoch": 0.81, "learning_rate": 3.6968196040401044e-05, "loss": 2.2435, "step": 129032 }, { "epoch": 0.81, "learning_rate": 3.6963039895271214e-05, "loss": 2.2137, "step": 129040 }, { "epoch": 0.81, "learning_rate": 3.6957884322842776e-05, "loss": 2.2408, "step": 129048 }, { "epoch": 0.81, "learning_rate": 3.695272932324394e-05, "loss": 2.2469, "step": 129056 }, { "epoch": 0.81, "learning_rate": 3.694757489660284e-05, "loss": 2.2282, "step": 129064 }, { "epoch": 0.81, "learning_rate": 3.6942421043047595e-05, "loss": 2.2316, "step": 129072 }, { "epoch": 0.81, "learning_rate": 3.6937267762706365e-05, "loss": 2.2287, "step": 129080 }, { "epoch": 0.81, "learning_rate": 3.693211505570725e-05, "loss": 2.2328, "step": 129088 }, { "epoch": 0.81, "learning_rate": 3.6926962922178346e-05, "loss": 2.232, "step": 129096 }, { "epoch": 0.81, "learning_rate": 3.692181136224771e-05, "loss": 2.248, "step": 129104 }, { "epoch": 0.81, "learning_rate": 3.6916660376043444e-05, "loss": 2.2358, "step": 129112 }, { "epoch": 0.81, "learning_rate": 3.6911509963693594e-05, "loss": 2.2366, "step": 129120 }, { "epoch": 0.81, "learning_rate": 3.690636012532619e-05, "loss": 2.2234, "step": 129128 }, { "epoch": 0.81, "learning_rate": 3.690121086106926e-05, "loss": 2.2347, "step": 129136 }, { "epoch": 0.81, "learning_rate": 3.6896062171050846e-05, "loss": 2.2179, "step": 129144 }, { "epoch": 0.81, "learning_rate": 3.68909140553989e-05, "loss": 2.226, "step": 129152 }, { "epoch": 0.81, "learning_rate": 3.6885766514241426e-05, "loss": 2.2317, "step": 129160 }, { "epoch": 0.81, "learning_rate": 3.6880619547706384e-05, "loss": 2.24, "step": 129168 }, { "epoch": 0.81, "learning_rate": 3.687547315592174e-05, "loss": 2.2254, "step": 129176 }, { "epoch": 0.81, "learning_rate": 3.687032733901543e-05, "loss": 2.2209, "step": 129184 }, { "epoch": 0.81, "learning_rate": 3.6865182097115375e-05, "loss": 2.2233, "step": 129192 }, { "epoch": 0.81, "learning_rate": 3.686003743034947e-05, "loss": 2.2334, "step": 129200 }, { "epoch": 0.81, "learning_rate": 3.6854893338845664e-05, "loss": 2.2356, "step": 129208 }, { "epoch": 0.81, "learning_rate": 3.6849749822731777e-05, "loss": 2.2395, "step": 129216 }, { "epoch": 0.81, "learning_rate": 3.684460688213573e-05, "loss": 2.2116, "step": 129224 }, { "epoch": 0.81, "learning_rate": 3.683946451718535e-05, "loss": 2.2256, "step": 129232 }, { "epoch": 0.81, "learning_rate": 3.683432272800846e-05, "loss": 2.2155, "step": 129240 }, { "epoch": 0.81, "learning_rate": 3.682918151473293e-05, "loss": 2.2294, "step": 129248 }, { "epoch": 0.81, "learning_rate": 3.682404087748654e-05, "loss": 2.2292, "step": 129256 }, { "epoch": 0.81, "learning_rate": 3.681890081639708e-05, "loss": 2.2517, "step": 129264 }, { "epoch": 0.81, "learning_rate": 3.681376133159237e-05, "loss": 2.2304, "step": 129272 }, { "epoch": 0.81, "learning_rate": 3.680862242320014e-05, "loss": 2.2363, "step": 129280 }, { "epoch": 0.81, "learning_rate": 3.680348409134816e-05, "loss": 2.2298, "step": 129288 }, { "epoch": 0.81, "learning_rate": 3.679834633616417e-05, "loss": 2.2187, "step": 129296 }, { "epoch": 0.81, "learning_rate": 3.67932091577759e-05, "loss": 2.2263, "step": 129304 }, { "epoch": 0.81, "learning_rate": 3.678807255631105e-05, "loss": 2.2491, "step": 129312 }, { "epoch": 0.81, "learning_rate": 3.678293653189731e-05, "loss": 2.2457, "step": 129320 }, { "epoch": 0.81, "learning_rate": 3.677780108466239e-05, "loss": 2.2111, "step": 129328 }, { "epoch": 0.81, "learning_rate": 3.677266621473394e-05, "loss": 2.2392, "step": 129336 }, { "epoch": 0.81, "learning_rate": 3.676753192223959e-05, "loss": 2.2307, "step": 129344 }, { "epoch": 0.81, "learning_rate": 3.676239820730701e-05, "loss": 2.2402, "step": 129352 }, { "epoch": 0.81, "learning_rate": 3.675726507006385e-05, "loss": 2.2373, "step": 129360 }, { "epoch": 0.81, "learning_rate": 3.675213251063765e-05, "loss": 2.2249, "step": 129368 }, { "epoch": 0.81, "learning_rate": 3.6747000529156064e-05, "loss": 2.2358, "step": 129376 }, { "epoch": 0.81, "learning_rate": 3.674186912574665e-05, "loss": 2.2369, "step": 129384 }, { "epoch": 0.81, "learning_rate": 3.6736738300536974e-05, "loss": 2.2478, "step": 129392 }, { "epoch": 0.81, "learning_rate": 3.67316080536546e-05, "loss": 2.245, "step": 129400 }, { "epoch": 0.81, "learning_rate": 3.672647838522705e-05, "loss": 2.2508, "step": 129408 }, { "epoch": 0.81, "learning_rate": 3.672134929538187e-05, "loss": 2.2168, "step": 129416 }, { "epoch": 0.81, "learning_rate": 3.6716220784246556e-05, "loss": 2.2312, "step": 129424 }, { "epoch": 0.81, "learning_rate": 3.67110928519486e-05, "loss": 2.2184, "step": 129432 }, { "epoch": 0.81, "learning_rate": 3.6705965498615494e-05, "loss": 2.2214, "step": 129440 }, { "epoch": 0.81, "learning_rate": 3.6700838724374706e-05, "loss": 2.2312, "step": 129448 }, { "epoch": 0.81, "learning_rate": 3.669571252935367e-05, "loss": 2.2432, "step": 129456 }, { "epoch": 0.81, "learning_rate": 3.669058691367985e-05, "loss": 2.2292, "step": 129464 }, { "epoch": 0.81, "learning_rate": 3.668546187748064e-05, "loss": 2.2361, "step": 129472 }, { "epoch": 0.81, "learning_rate": 3.668033742088345e-05, "loss": 2.2207, "step": 129480 }, { "epoch": 0.81, "learning_rate": 3.667521354401571e-05, "loss": 2.2289, "step": 129488 }, { "epoch": 0.81, "learning_rate": 3.667009024700479e-05, "loss": 2.2392, "step": 129496 }, { "epoch": 0.81, "learning_rate": 3.666496752997801e-05, "loss": 2.2268, "step": 129504 }, { "epoch": 0.81, "learning_rate": 3.6659845393062774e-05, "loss": 2.2338, "step": 129512 }, { "epoch": 0.81, "learning_rate": 3.66547238363864e-05, "loss": 2.2501, "step": 129520 }, { "epoch": 0.81, "learning_rate": 3.664960286007622e-05, "loss": 2.2296, "step": 129528 }, { "epoch": 0.81, "learning_rate": 3.664448246425952e-05, "loss": 2.2319, "step": 129536 }, { "epoch": 0.81, "learning_rate": 3.663936264906361e-05, "loss": 2.2249, "step": 129544 }, { "epoch": 0.81, "learning_rate": 3.663424341461576e-05, "loss": 2.2273, "step": 129552 }, { "epoch": 0.81, "learning_rate": 3.6629124761043244e-05, "loss": 2.2311, "step": 129560 }, { "epoch": 0.81, "learning_rate": 3.66240066884733e-05, "loss": 2.237, "step": 129568 }, { "epoch": 0.81, "learning_rate": 3.66188891970332e-05, "loss": 2.2311, "step": 129576 }, { "epoch": 0.81, "learning_rate": 3.6613772286850115e-05, "loss": 2.2269, "step": 129584 }, { "epoch": 0.81, "learning_rate": 3.660865595805128e-05, "loss": 2.2396, "step": 129592 }, { "epoch": 0.81, "learning_rate": 3.660354021076389e-05, "loss": 2.2317, "step": 129600 }, { "epoch": 0.81, "learning_rate": 3.6598425045115096e-05, "loss": 2.2326, "step": 129608 }, { "epoch": 0.81, "learning_rate": 3.6593310461232094e-05, "loss": 2.2466, "step": 129616 }, { "epoch": 0.81, "learning_rate": 3.6588196459242005e-05, "loss": 2.2298, "step": 129624 }, { "epoch": 0.81, "learning_rate": 3.6583083039272004e-05, "loss": 2.238, "step": 129632 }, { "epoch": 0.81, "learning_rate": 3.657797020144918e-05, "loss": 2.23, "step": 129640 }, { "epoch": 0.81, "learning_rate": 3.657285794590063e-05, "loss": 2.2441, "step": 129648 }, { "epoch": 0.81, "learning_rate": 3.656774627275347e-05, "loss": 2.2344, "step": 129656 }, { "epoch": 0.81, "learning_rate": 3.6562635182134774e-05, "loss": 2.2324, "step": 129664 }, { "epoch": 0.81, "learning_rate": 3.655752467417158e-05, "loss": 2.2234, "step": 129672 }, { "epoch": 0.81, "learning_rate": 3.655241474899098e-05, "loss": 2.2245, "step": 129680 }, { "epoch": 0.81, "learning_rate": 3.654730540671995e-05, "loss": 2.2379, "step": 129688 }, { "epoch": 0.81, "learning_rate": 3.6542196647485544e-05, "loss": 2.2452, "step": 129696 }, { "epoch": 0.81, "learning_rate": 3.653708847141477e-05, "loss": 2.2371, "step": 129704 }, { "epoch": 0.81, "learning_rate": 3.653198087863461e-05, "loss": 2.2214, "step": 129712 }, { "epoch": 0.81, "learning_rate": 3.6526873869272025e-05, "loss": 2.2221, "step": 129720 }, { "epoch": 0.81, "learning_rate": 3.6521767443454006e-05, "loss": 2.2249, "step": 129728 }, { "epoch": 0.81, "learning_rate": 3.6516661601307485e-05, "loss": 2.2344, "step": 129736 }, { "epoch": 0.81, "learning_rate": 3.651155634295938e-05, "loss": 2.2302, "step": 129744 }, { "epoch": 0.81, "learning_rate": 3.650645166853661e-05, "loss": 2.2372, "step": 129752 }, { "epoch": 0.81, "learning_rate": 3.650134757816609e-05, "loss": 2.2233, "step": 129760 }, { "epoch": 0.81, "learning_rate": 3.649624407197474e-05, "loss": 2.2328, "step": 129768 }, { "epoch": 0.81, "learning_rate": 3.6491141150089365e-05, "loss": 2.2386, "step": 129776 }, { "epoch": 0.81, "learning_rate": 3.648603881263688e-05, "loss": 2.2444, "step": 129784 }, { "epoch": 0.81, "learning_rate": 3.648093705974409e-05, "loss": 2.2271, "step": 129792 }, { "epoch": 0.81, "learning_rate": 3.6475835891537844e-05, "loss": 2.2453, "step": 129800 }, { "epoch": 0.81, "learning_rate": 3.6470735308144974e-05, "loss": 2.2355, "step": 129808 }, { "epoch": 0.81, "learning_rate": 3.6465635309692255e-05, "loss": 2.2126, "step": 129816 }, { "epoch": 0.81, "learning_rate": 3.646053589630647e-05, "loss": 2.2128, "step": 129824 }, { "epoch": 0.81, "learning_rate": 3.6455437068114417e-05, "loss": 2.2233, "step": 129832 }, { "epoch": 0.81, "learning_rate": 3.645033882524283e-05, "loss": 2.2381, "step": 129840 }, { "epoch": 0.81, "learning_rate": 3.644524116781847e-05, "loss": 2.2276, "step": 129848 }, { "epoch": 0.81, "learning_rate": 3.6440144095968064e-05, "loss": 2.2157, "step": 129856 }, { "epoch": 0.81, "learning_rate": 3.643504760981831e-05, "loss": 2.2336, "step": 129864 }, { "epoch": 0.81, "learning_rate": 3.642995170949592e-05, "loss": 2.2329, "step": 129872 }, { "epoch": 0.81, "learning_rate": 3.642485639512758e-05, "loss": 2.2393, "step": 129880 }, { "epoch": 0.81, "learning_rate": 3.6419761666839935e-05, "loss": 2.2469, "step": 129888 }, { "epoch": 0.81, "learning_rate": 3.641466752475969e-05, "loss": 2.2479, "step": 129896 }, { "epoch": 0.81, "learning_rate": 3.6409573969013434e-05, "loss": 2.2356, "step": 129904 }, { "epoch": 0.81, "learning_rate": 3.640448099972782e-05, "loss": 2.227, "step": 129912 }, { "epoch": 0.81, "learning_rate": 3.6399388617029454e-05, "loss": 2.248, "step": 129920 }, { "epoch": 0.81, "learning_rate": 3.639429682104495e-05, "loss": 2.2381, "step": 129928 }, { "epoch": 0.81, "learning_rate": 3.6389205611900864e-05, "loss": 2.2371, "step": 129936 }, { "epoch": 0.81, "learning_rate": 3.638411498972377e-05, "loss": 2.2206, "step": 129944 }, { "epoch": 0.81, "learning_rate": 3.637902495464024e-05, "loss": 2.2413, "step": 129952 }, { "epoch": 0.81, "learning_rate": 3.6373935506776793e-05, "loss": 2.2234, "step": 129960 }, { "epoch": 0.81, "learning_rate": 3.636884664625996e-05, "loss": 2.2155, "step": 129968 }, { "epoch": 0.81, "learning_rate": 3.636375837321624e-05, "loss": 2.2282, "step": 129976 }, { "epoch": 0.81, "learning_rate": 3.6358670687772165e-05, "loss": 2.2341, "step": 129984 }, { "epoch": 0.81, "learning_rate": 3.6353583590054166e-05, "loss": 2.2135, "step": 129992 }, { "epoch": 0.81, "learning_rate": 3.634849708018875e-05, "loss": 2.2119, "step": 130000 }, { "epoch": 0.81, "learning_rate": 3.6343411158302345e-05, "loss": 2.2489, "step": 130008 }, { "epoch": 0.81, "learning_rate": 3.633832582452137e-05, "loss": 2.2073, "step": 130016 }, { "epoch": 0.81, "learning_rate": 3.6333241078972295e-05, "loss": 2.2232, "step": 130024 }, { "epoch": 0.81, "learning_rate": 3.6328156921781506e-05, "loss": 2.2233, "step": 130032 }, { "epoch": 0.81, "learning_rate": 3.632307335307537e-05, "loss": 2.2364, "step": 130040 }, { "epoch": 0.81, "learning_rate": 3.6317990372980306e-05, "loss": 2.2392, "step": 130048 }, { "epoch": 0.81, "learning_rate": 3.6312907981622635e-05, "loss": 2.2416, "step": 130056 }, { "epoch": 0.81, "learning_rate": 3.6307826179128755e-05, "loss": 2.2243, "step": 130064 }, { "epoch": 0.81, "learning_rate": 3.630274496562497e-05, "loss": 2.2466, "step": 130072 }, { "epoch": 0.81, "learning_rate": 3.629766434123758e-05, "loss": 2.2433, "step": 130080 }, { "epoch": 0.81, "learning_rate": 3.629258430609294e-05, "loss": 2.2305, "step": 130088 }, { "epoch": 0.81, "learning_rate": 3.628750486031731e-05, "loss": 2.2251, "step": 130096 }, { "epoch": 0.81, "learning_rate": 3.6282426004036953e-05, "loss": 2.2168, "step": 130104 }, { "epoch": 0.81, "learning_rate": 3.627734773737817e-05, "loss": 2.217, "step": 130112 }, { "epoch": 0.81, "learning_rate": 3.627227006046718e-05, "loss": 2.238, "step": 130120 }, { "epoch": 0.81, "learning_rate": 3.6267192973430194e-05, "loss": 2.2333, "step": 130128 }, { "epoch": 0.81, "learning_rate": 3.6262116476393485e-05, "loss": 2.237, "step": 130136 }, { "epoch": 0.81, "learning_rate": 3.6257040569483206e-05, "loss": 2.2367, "step": 130144 }, { "epoch": 0.81, "learning_rate": 3.6251965252825574e-05, "loss": 2.2434, "step": 130152 }, { "epoch": 0.81, "learning_rate": 3.6246890526546735e-05, "loss": 2.2231, "step": 130160 }, { "epoch": 0.81, "learning_rate": 3.6241816390772876e-05, "loss": 2.2393, "step": 130168 }, { "epoch": 0.81, "learning_rate": 3.6236742845630125e-05, "loss": 2.2201, "step": 130176 }, { "epoch": 0.81, "learning_rate": 3.62316698912446e-05, "loss": 2.2482, "step": 130184 }, { "epoch": 0.81, "learning_rate": 3.622659752774242e-05, "loss": 2.2463, "step": 130192 }, { "epoch": 0.81, "learning_rate": 3.622152575524974e-05, "loss": 2.2333, "step": 130200 }, { "epoch": 0.81, "learning_rate": 3.621645457389255e-05, "loss": 2.2148, "step": 130208 }, { "epoch": 0.81, "learning_rate": 3.6211383983797e-05, "loss": 2.2347, "step": 130216 }, { "epoch": 0.81, "learning_rate": 3.6206313985089094e-05, "loss": 2.232, "step": 130224 }, { "epoch": 0.81, "learning_rate": 3.620124457789489e-05, "loss": 2.2463, "step": 130232 }, { "epoch": 0.81, "learning_rate": 3.619617576234043e-05, "loss": 2.2352, "step": 130240 }, { "epoch": 0.81, "learning_rate": 3.6191107538551705e-05, "loss": 2.2478, "step": 130248 }, { "epoch": 0.81, "learning_rate": 3.6186039906654704e-05, "loss": 2.2255, "step": 130256 }, { "epoch": 0.81, "learning_rate": 3.6180972866775444e-05, "loss": 2.2405, "step": 130264 }, { "epoch": 0.81, "learning_rate": 3.6175906419039854e-05, "loss": 2.2266, "step": 130272 }, { "epoch": 0.81, "learning_rate": 3.617084056357391e-05, "loss": 2.2348, "step": 130280 }, { "epoch": 0.81, "learning_rate": 3.6165775300503556e-05, "loss": 2.2354, "step": 130288 }, { "epoch": 0.81, "learning_rate": 3.616071062995468e-05, "loss": 2.2444, "step": 130296 }, { "epoch": 0.81, "learning_rate": 3.6155646552053245e-05, "loss": 2.2294, "step": 130304 }, { "epoch": 0.81, "learning_rate": 3.615058306692508e-05, "loss": 2.2152, "step": 130312 }, { "epoch": 0.81, "learning_rate": 3.61455201746961e-05, "loss": 2.241, "step": 130320 }, { "epoch": 0.81, "learning_rate": 3.6140457875492177e-05, "loss": 2.2169, "step": 130328 }, { "epoch": 0.81, "learning_rate": 3.613539616943915e-05, "loss": 2.2248, "step": 130336 }, { "epoch": 0.81, "learning_rate": 3.6130335056662836e-05, "loss": 2.2248, "step": 130344 }, { "epoch": 0.81, "learning_rate": 3.612527453728908e-05, "loss": 2.2372, "step": 130352 }, { "epoch": 0.81, "learning_rate": 3.612021461144368e-05, "loss": 2.2175, "step": 130360 }, { "epoch": 0.81, "learning_rate": 3.611515527925243e-05, "loss": 2.2513, "step": 130368 }, { "epoch": 0.81, "learning_rate": 3.6110096540841075e-05, "loss": 2.2471, "step": 130376 }, { "epoch": 0.81, "learning_rate": 3.610503839633542e-05, "loss": 2.2205, "step": 130384 }, { "epoch": 0.81, "learning_rate": 3.609998084586119e-05, "loss": 2.2306, "step": 130392 }, { "epoch": 0.81, "learning_rate": 3.6094923889544117e-05, "loss": 2.2253, "step": 130400 }, { "epoch": 0.82, "learning_rate": 3.6089867527509905e-05, "loss": 2.2381, "step": 130408 }, { "epoch": 0.82, "learning_rate": 3.6084811759884296e-05, "loss": 2.217, "step": 130416 }, { "epoch": 0.82, "learning_rate": 3.607975658679292e-05, "loss": 2.2222, "step": 130424 }, { "epoch": 0.82, "learning_rate": 3.60747020083615e-05, "loss": 2.2217, "step": 130432 }, { "epoch": 0.82, "learning_rate": 3.606964802471567e-05, "loss": 2.2326, "step": 130440 }, { "epoch": 0.82, "learning_rate": 3.6064594635981065e-05, "loss": 2.2207, "step": 130448 }, { "epoch": 0.82, "learning_rate": 3.605954184228333e-05, "loss": 2.2346, "step": 130456 }, { "epoch": 0.82, "learning_rate": 3.605448964374806e-05, "loss": 2.239, "step": 130464 }, { "epoch": 0.82, "learning_rate": 3.604943804050088e-05, "loss": 2.2162, "step": 130472 }, { "epoch": 0.82, "learning_rate": 3.604438703266735e-05, "loss": 2.236, "step": 130480 }, { "epoch": 0.82, "learning_rate": 3.603933662037304e-05, "loss": 2.2343, "step": 130488 }, { "epoch": 0.82, "learning_rate": 3.603428680374352e-05, "loss": 2.243, "step": 130496 }, { "epoch": 0.82, "learning_rate": 3.602923758290432e-05, "loss": 2.2367, "step": 130504 }, { "epoch": 0.82, "learning_rate": 3.6024188957980955e-05, "loss": 2.2319, "step": 130512 }, { "epoch": 0.82, "learning_rate": 3.601914092909896e-05, "loss": 2.226, "step": 130520 }, { "epoch": 0.82, "learning_rate": 3.601409349638379e-05, "loss": 2.2248, "step": 130528 }, { "epoch": 0.82, "learning_rate": 3.600904665996094e-05, "loss": 2.2395, "step": 130536 }, { "epoch": 0.82, "learning_rate": 3.600400041995591e-05, "loss": 2.2344, "step": 130544 }, { "epoch": 0.82, "learning_rate": 3.599895477649411e-05, "loss": 2.2332, "step": 130552 }, { "epoch": 0.82, "learning_rate": 3.599390972970098e-05, "loss": 2.225, "step": 130560 }, { "epoch": 0.82, "learning_rate": 3.5988865279701956e-05, "loss": 2.251, "step": 130568 }, { "epoch": 0.82, "learning_rate": 3.5983821426622445e-05, "loss": 2.2216, "step": 130576 }, { "epoch": 0.82, "learning_rate": 3.597877817058781e-05, "loss": 2.2351, "step": 130584 }, { "epoch": 0.82, "learning_rate": 3.597373551172345e-05, "loss": 2.2332, "step": 130592 }, { "epoch": 0.82, "learning_rate": 3.5968693450154726e-05, "loss": 2.2249, "step": 130600 }, { "epoch": 0.82, "learning_rate": 3.596365198600697e-05, "loss": 2.2401, "step": 130608 }, { "epoch": 0.82, "learning_rate": 3.5958611119405525e-05, "loss": 2.2397, "step": 130616 }, { "epoch": 0.82, "learning_rate": 3.595357085047571e-05, "loss": 2.2339, "step": 130624 }, { "epoch": 0.82, "learning_rate": 3.594853117934282e-05, "loss": 2.2282, "step": 130632 }, { "epoch": 0.82, "learning_rate": 3.5943492106132134e-05, "loss": 2.2355, "step": 130640 }, { "epoch": 0.82, "learning_rate": 3.593845363096895e-05, "loss": 2.2334, "step": 130648 }, { "epoch": 0.82, "learning_rate": 3.59334157539785e-05, "loss": 2.2353, "step": 130656 }, { "epoch": 0.82, "learning_rate": 3.592837847528603e-05, "loss": 2.2185, "step": 130664 }, { "epoch": 0.82, "learning_rate": 3.592334179501678e-05, "loss": 2.2154, "step": 130672 }, { "epoch": 0.82, "learning_rate": 3.5918305713295944e-05, "loss": 2.2372, "step": 130680 }, { "epoch": 0.82, "learning_rate": 3.5913270230248734e-05, "loss": 2.2367, "step": 130688 }, { "epoch": 0.82, "learning_rate": 3.590823534600034e-05, "loss": 2.219, "step": 130696 }, { "epoch": 0.82, "learning_rate": 3.59032010606759e-05, "loss": 2.2299, "step": 130704 }, { "epoch": 0.82, "learning_rate": 3.5898167374400595e-05, "loss": 2.2388, "step": 130712 }, { "epoch": 0.82, "learning_rate": 3.589313428729956e-05, "loss": 2.2336, "step": 130720 }, { "epoch": 0.82, "learning_rate": 3.5888101799497894e-05, "loss": 2.2379, "step": 130728 }, { "epoch": 0.82, "learning_rate": 3.588306991112075e-05, "loss": 2.2415, "step": 130736 }, { "epoch": 0.82, "learning_rate": 3.5878038622293166e-05, "loss": 2.2277, "step": 130744 }, { "epoch": 0.82, "learning_rate": 3.587300793314025e-05, "loss": 2.2369, "step": 130752 }, { "epoch": 0.82, "learning_rate": 3.586797784378708e-05, "loss": 2.2473, "step": 130760 }, { "epoch": 0.82, "learning_rate": 3.586294835435868e-05, "loss": 2.2331, "step": 130768 }, { "epoch": 0.82, "learning_rate": 3.58579194649801e-05, "loss": 2.2473, "step": 130776 }, { "epoch": 0.82, "learning_rate": 3.585289117577634e-05, "loss": 2.2163, "step": 130784 }, { "epoch": 0.82, "learning_rate": 3.5847863486872415e-05, "loss": 2.2285, "step": 130792 }, { "epoch": 0.82, "learning_rate": 3.584283639839333e-05, "loss": 2.2285, "step": 130800 }, { "epoch": 0.82, "learning_rate": 3.5837809910464015e-05, "loss": 2.2282, "step": 130808 }, { "epoch": 0.82, "learning_rate": 3.5832784023209465e-05, "loss": 2.2433, "step": 130816 }, { "epoch": 0.82, "learning_rate": 3.582775873675463e-05, "loss": 2.2335, "step": 130824 }, { "epoch": 0.82, "learning_rate": 3.582273405122442e-05, "loss": 2.2352, "step": 130832 }, { "epoch": 0.82, "learning_rate": 3.5817709966743753e-05, "loss": 2.2241, "step": 130840 }, { "epoch": 0.82, "learning_rate": 3.581268648343753e-05, "loss": 2.2258, "step": 130848 }, { "epoch": 0.82, "learning_rate": 3.580766360143062e-05, "loss": 2.2222, "step": 130856 }, { "epoch": 0.82, "learning_rate": 3.580264132084792e-05, "loss": 2.2308, "step": 130864 }, { "epoch": 0.82, "learning_rate": 3.5797619641814275e-05, "loss": 2.2274, "step": 130872 }, { "epoch": 0.82, "learning_rate": 3.579259856445452e-05, "loss": 2.2307, "step": 130880 }, { "epoch": 0.82, "learning_rate": 3.5787578088893474e-05, "loss": 2.2427, "step": 130888 }, { "epoch": 0.82, "learning_rate": 3.578255821525595e-05, "loss": 2.2427, "step": 130896 }, { "epoch": 0.82, "learning_rate": 3.5777538943666753e-05, "loss": 2.2451, "step": 130904 }, { "epoch": 0.82, "learning_rate": 3.5772520274250666e-05, "loss": 2.2399, "step": 130912 }, { "epoch": 0.82, "learning_rate": 3.576750220713242e-05, "loss": 2.2427, "step": 130920 }, { "epoch": 0.82, "learning_rate": 3.576248474243681e-05, "loss": 2.2364, "step": 130928 }, { "epoch": 0.82, "learning_rate": 3.575746788028854e-05, "loss": 2.2318, "step": 130936 }, { "epoch": 0.82, "learning_rate": 3.5752451620812334e-05, "loss": 2.2235, "step": 130944 }, { "epoch": 0.82, "learning_rate": 3.574743596413292e-05, "loss": 2.235, "step": 130952 }, { "epoch": 0.82, "learning_rate": 3.574242091037494e-05, "loss": 2.224, "step": 130960 }, { "epoch": 0.82, "learning_rate": 3.57374064596631e-05, "loss": 2.2426, "step": 130968 }, { "epoch": 0.82, "learning_rate": 3.5732392612122076e-05, "loss": 2.2364, "step": 130976 }, { "epoch": 0.82, "learning_rate": 3.5727379367876494e-05, "loss": 2.245, "step": 130984 }, { "epoch": 0.82, "learning_rate": 3.5722366727050983e-05, "loss": 2.2434, "step": 130992 }, { "epoch": 0.82, "learning_rate": 3.571735468977015e-05, "loss": 2.2277, "step": 131000 }, { "epoch": 0.82, "learning_rate": 3.571234325615861e-05, "loss": 2.2427, "step": 131008 }, { "epoch": 0.82, "learning_rate": 3.5707332426340946e-05, "loss": 2.2502, "step": 131016 }, { "epoch": 0.82, "learning_rate": 3.5702322200441706e-05, "loss": 2.2197, "step": 131024 }, { "epoch": 0.82, "learning_rate": 3.569731257858546e-05, "loss": 2.2271, "step": 131032 }, { "epoch": 0.82, "learning_rate": 3.569230356089679e-05, "loss": 2.2342, "step": 131040 }, { "epoch": 0.82, "learning_rate": 3.568729514750014e-05, "loss": 2.227, "step": 131048 }, { "epoch": 0.82, "learning_rate": 3.5682287338520085e-05, "loss": 2.2214, "step": 131056 }, { "epoch": 0.82, "learning_rate": 3.5677280134081084e-05, "loss": 2.2416, "step": 131064 }, { "epoch": 0.82, "learning_rate": 3.567227353430762e-05, "loss": 2.2156, "step": 131072 }, { "epoch": 0.82, "learning_rate": 3.566726753932418e-05, "loss": 2.2305, "step": 131080 }, { "epoch": 0.82, "learning_rate": 3.5662262149255196e-05, "loss": 2.2269, "step": 131088 }, { "epoch": 0.82, "learning_rate": 3.565725736422509e-05, "loss": 2.2359, "step": 131096 }, { "epoch": 0.82, "learning_rate": 3.565225318435832e-05, "loss": 2.2318, "step": 131104 }, { "epoch": 0.82, "learning_rate": 3.564724960977925e-05, "loss": 2.2353, "step": 131112 }, { "epoch": 0.82, "learning_rate": 3.56422466406123e-05, "loss": 2.2289, "step": 131120 }, { "epoch": 0.82, "learning_rate": 3.563724427698183e-05, "loss": 2.2095, "step": 131128 }, { "epoch": 0.82, "learning_rate": 3.5632242519012183e-05, "loss": 2.2371, "step": 131136 }, { "epoch": 0.82, "learning_rate": 3.562724136682776e-05, "loss": 2.2384, "step": 131144 }, { "epoch": 0.82, "learning_rate": 3.562224082055281e-05, "loss": 2.236, "step": 131152 }, { "epoch": 0.82, "learning_rate": 3.561724088031169e-05, "loss": 2.2331, "step": 131160 }, { "epoch": 0.82, "learning_rate": 3.561224154622872e-05, "loss": 2.2052, "step": 131168 }, { "epoch": 0.82, "learning_rate": 3.560724281842815e-05, "loss": 2.2224, "step": 131176 }, { "epoch": 0.82, "learning_rate": 3.560224469703426e-05, "loss": 2.2249, "step": 131184 }, { "epoch": 0.82, "learning_rate": 3.5597247182171316e-05, "loss": 2.2243, "step": 131192 }, { "epoch": 0.82, "learning_rate": 3.559225027396354e-05, "loss": 2.2386, "step": 131200 }, { "epoch": 0.82, "learning_rate": 3.5587253972535165e-05, "loss": 2.2328, "step": 131208 }, { "epoch": 0.82, "learning_rate": 3.558225827801038e-05, "loss": 2.2449, "step": 131216 }, { "epoch": 0.82, "learning_rate": 3.55772631905134e-05, "loss": 2.2291, "step": 131224 }, { "epoch": 0.82, "learning_rate": 3.5572268710168406e-05, "loss": 2.2375, "step": 131232 }, { "epoch": 0.82, "learning_rate": 3.556727483709954e-05, "loss": 2.2252, "step": 131240 }, { "epoch": 0.82, "learning_rate": 3.5562281571430955e-05, "loss": 2.2283, "step": 131248 }, { "epoch": 0.82, "learning_rate": 3.555728891328682e-05, "loss": 2.2374, "step": 131256 }, { "epoch": 0.82, "learning_rate": 3.55522968627912e-05, "loss": 2.2252, "step": 131264 }, { "epoch": 0.82, "learning_rate": 3.554730542006824e-05, "loss": 2.2236, "step": 131272 }, { "epoch": 0.82, "learning_rate": 3.554231458524201e-05, "loss": 2.2291, "step": 131280 }, { "epoch": 0.82, "learning_rate": 3.553732435843657e-05, "loss": 2.2373, "step": 131288 }, { "epoch": 0.82, "learning_rate": 3.5532334739775996e-05, "loss": 2.2376, "step": 131296 }, { "epoch": 0.82, "learning_rate": 3.552734572938434e-05, "loss": 2.2182, "step": 131304 }, { "epoch": 0.82, "learning_rate": 3.5522357327385586e-05, "loss": 2.2255, "step": 131312 }, { "epoch": 0.82, "learning_rate": 3.55173695339038e-05, "loss": 2.2209, "step": 131320 }, { "epoch": 0.82, "learning_rate": 3.5512382349062935e-05, "loss": 2.2334, "step": 131328 }, { "epoch": 0.82, "learning_rate": 3.5507395772987005e-05, "loss": 2.2425, "step": 131336 }, { "epoch": 0.82, "learning_rate": 3.550240980579997e-05, "loss": 2.2324, "step": 131344 }, { "epoch": 0.82, "learning_rate": 3.549742444762576e-05, "loss": 2.2303, "step": 131352 }, { "epoch": 0.82, "learning_rate": 3.5492439698588356e-05, "loss": 2.226, "step": 131360 }, { "epoch": 0.82, "learning_rate": 3.548745555881162e-05, "loss": 2.2275, "step": 131368 }, { "epoch": 0.82, "learning_rate": 3.5482472028419495e-05, "loss": 2.2508, "step": 131376 }, { "epoch": 0.82, "learning_rate": 3.547748910753587e-05, "loss": 2.2334, "step": 131384 }, { "epoch": 0.82, "learning_rate": 3.547250679628462e-05, "loss": 2.2111, "step": 131392 }, { "epoch": 0.82, "learning_rate": 3.5467525094789594e-05, "loss": 2.2356, "step": 131400 }, { "epoch": 0.82, "learning_rate": 3.546254400317466e-05, "loss": 2.224, "step": 131408 }, { "epoch": 0.82, "learning_rate": 3.545756352156364e-05, "loss": 2.2334, "step": 131416 }, { "epoch": 0.82, "learning_rate": 3.545258365008033e-05, "loss": 2.2134, "step": 131424 }, { "epoch": 0.82, "learning_rate": 3.544760438884854e-05, "loss": 2.228, "step": 131432 }, { "epoch": 0.82, "learning_rate": 3.544262573799207e-05, "loss": 2.2304, "step": 131440 }, { "epoch": 0.82, "learning_rate": 3.543764769763468e-05, "loss": 2.2416, "step": 131448 }, { "epoch": 0.82, "learning_rate": 3.543267026790012e-05, "loss": 2.2403, "step": 131456 }, { "epoch": 0.82, "learning_rate": 3.5427693448912135e-05, "loss": 2.2346, "step": 131464 }, { "epoch": 0.82, "learning_rate": 3.5422717240794454e-05, "loss": 2.2401, "step": 131472 }, { "epoch": 0.82, "learning_rate": 3.541774164367076e-05, "loss": 2.2356, "step": 131480 }, { "epoch": 0.82, "learning_rate": 3.541276665766479e-05, "loss": 2.2306, "step": 131488 }, { "epoch": 0.82, "learning_rate": 3.540779228290019e-05, "loss": 2.2304, "step": 131496 }, { "epoch": 0.82, "learning_rate": 3.540281851950062e-05, "loss": 2.2475, "step": 131504 }, { "epoch": 0.82, "learning_rate": 3.5397845367589766e-05, "loss": 2.2267, "step": 131512 }, { "epoch": 0.82, "learning_rate": 3.539287282729121e-05, "loss": 2.2171, "step": 131520 }, { "epoch": 0.82, "learning_rate": 3.538790089872862e-05, "loss": 2.2169, "step": 131528 }, { "epoch": 0.82, "learning_rate": 3.538292958202557e-05, "loss": 2.23, "step": 131536 }, { "epoch": 0.82, "learning_rate": 3.537795887730564e-05, "loss": 2.2357, "step": 131544 }, { "epoch": 0.82, "learning_rate": 3.537298878469242e-05, "loss": 2.2341, "step": 131552 }, { "epoch": 0.82, "learning_rate": 3.536801930430948e-05, "loss": 2.2327, "step": 131560 }, { "epoch": 0.82, "learning_rate": 3.536305043628032e-05, "loss": 2.2423, "step": 131568 }, { "epoch": 0.82, "learning_rate": 3.535808218072851e-05, "loss": 2.235, "step": 131576 }, { "epoch": 0.82, "learning_rate": 3.535311453777753e-05, "loss": 2.2136, "step": 131584 }, { "epoch": 0.82, "learning_rate": 3.534814750755088e-05, "loss": 2.2175, "step": 131592 }, { "epoch": 0.82, "learning_rate": 3.5343181090172057e-05, "loss": 2.2435, "step": 131600 }, { "epoch": 0.82, "learning_rate": 3.533821528576452e-05, "loss": 2.2336, "step": 131608 }, { "epoch": 0.82, "learning_rate": 3.5333250094451715e-05, "loss": 2.2425, "step": 131616 }, { "epoch": 0.82, "learning_rate": 3.532828551635708e-05, "loss": 2.2258, "step": 131624 }, { "epoch": 0.82, "learning_rate": 3.532332155160405e-05, "loss": 2.234, "step": 131632 }, { "epoch": 0.82, "learning_rate": 3.5318358200316e-05, "loss": 2.2327, "step": 131640 }, { "epoch": 0.82, "learning_rate": 3.5313395462616334e-05, "loss": 2.2355, "step": 131648 }, { "epoch": 0.82, "learning_rate": 3.530843333862843e-05, "loss": 2.2138, "step": 131656 }, { "epoch": 0.82, "learning_rate": 3.5303471828475654e-05, "loss": 2.2371, "step": 131664 }, { "epoch": 0.82, "learning_rate": 3.529851093228131e-05, "loss": 2.2268, "step": 131672 }, { "epoch": 0.82, "learning_rate": 3.529355065016879e-05, "loss": 2.2247, "step": 131680 }, { "epoch": 0.82, "learning_rate": 3.528859098226136e-05, "loss": 2.2429, "step": 131688 }, { "epoch": 0.82, "learning_rate": 3.5283631928682316e-05, "loss": 2.2139, "step": 131696 }, { "epoch": 0.82, "learning_rate": 3.527867348955497e-05, "loss": 2.2254, "step": 131704 }, { "epoch": 0.82, "learning_rate": 3.5273715665002574e-05, "loss": 2.2267, "step": 131712 }, { "epoch": 0.82, "learning_rate": 3.526875845514837e-05, "loss": 2.2435, "step": 131720 }, { "epoch": 0.82, "learning_rate": 3.526380186011562e-05, "loss": 2.2486, "step": 131728 }, { "epoch": 0.82, "learning_rate": 3.525884588002752e-05, "loss": 2.2356, "step": 131736 }, { "epoch": 0.82, "learning_rate": 3.525389051500729e-05, "loss": 2.2236, "step": 131744 }, { "epoch": 0.82, "learning_rate": 3.524893576517813e-05, "loss": 2.2263, "step": 131752 }, { "epoch": 0.82, "learning_rate": 3.524398163066318e-05, "loss": 2.2419, "step": 131760 }, { "epoch": 0.82, "learning_rate": 3.523902811158565e-05, "loss": 2.2334, "step": 131768 }, { "epoch": 0.82, "learning_rate": 3.523407520806865e-05, "loss": 2.2283, "step": 131776 }, { "epoch": 0.82, "learning_rate": 3.522912292023531e-05, "loss": 2.2268, "step": 131784 }, { "epoch": 0.82, "learning_rate": 3.522417124820878e-05, "loss": 2.2214, "step": 131792 }, { "epoch": 0.82, "learning_rate": 3.52192201921121e-05, "loss": 2.2292, "step": 131800 }, { "epoch": 0.82, "learning_rate": 3.52142697520684e-05, "loss": 2.2362, "step": 131808 }, { "epoch": 0.82, "learning_rate": 3.5209319928200734e-05, "loss": 2.2237, "step": 131816 }, { "epoch": 0.82, "learning_rate": 3.520437072063216e-05, "loss": 2.2264, "step": 131824 }, { "epoch": 0.82, "learning_rate": 3.519942212948572e-05, "loss": 2.2395, "step": 131832 }, { "epoch": 0.82, "learning_rate": 3.51944741548844e-05, "loss": 2.2279, "step": 131840 }, { "epoch": 0.82, "learning_rate": 3.518952679695126e-05, "loss": 2.2305, "step": 131848 }, { "epoch": 0.82, "learning_rate": 3.518458005580926e-05, "loss": 2.2291, "step": 131856 }, { "epoch": 0.82, "learning_rate": 3.517963393158138e-05, "loss": 2.2376, "step": 131864 }, { "epoch": 0.82, "learning_rate": 3.517468842439058e-05, "loss": 2.2353, "step": 131872 }, { "epoch": 0.82, "learning_rate": 3.5169743534359836e-05, "loss": 2.2273, "step": 131880 }, { "epoch": 0.82, "learning_rate": 3.516479926161203e-05, "loss": 2.2497, "step": 131888 }, { "epoch": 0.82, "learning_rate": 3.515985560627011e-05, "loss": 2.2218, "step": 131896 }, { "epoch": 0.82, "learning_rate": 3.5154912568456974e-05, "loss": 2.2263, "step": 131904 }, { "epoch": 0.82, "learning_rate": 3.5149970148295484e-05, "loss": 2.2381, "step": 131912 }, { "epoch": 0.82, "learning_rate": 3.5145028345908536e-05, "loss": 2.2197, "step": 131920 }, { "epoch": 0.82, "learning_rate": 3.5140087161418964e-05, "loss": 2.2338, "step": 131928 }, { "epoch": 0.82, "learning_rate": 3.513514659494961e-05, "loss": 2.2337, "step": 131936 }, { "epoch": 0.82, "learning_rate": 3.513020664662331e-05, "loss": 2.238, "step": 131944 }, { "epoch": 0.82, "learning_rate": 3.512526731656286e-05, "loss": 2.223, "step": 131952 }, { "epoch": 0.82, "learning_rate": 3.512032860489106e-05, "loss": 2.2202, "step": 131960 }, { "epoch": 0.82, "learning_rate": 3.5115390511730685e-05, "loss": 2.2381, "step": 131968 }, { "epoch": 0.82, "learning_rate": 3.5110453037204486e-05, "loss": 2.2392, "step": 131976 }, { "epoch": 0.82, "learning_rate": 3.5105516181435225e-05, "loss": 2.2332, "step": 131984 }, { "epoch": 0.82, "learning_rate": 3.510057994454561e-05, "loss": 2.2364, "step": 131992 }, { "epoch": 0.82, "learning_rate": 3.5095644326658375e-05, "loss": 2.2258, "step": 132000 }, { "epoch": 0.83, "learning_rate": 3.509070932789624e-05, "loss": 2.221, "step": 132008 }, { "epoch": 0.83, "learning_rate": 3.508577494838184e-05, "loss": 2.2277, "step": 132016 }, { "epoch": 0.83, "learning_rate": 3.508084118823787e-05, "loss": 2.2265, "step": 132024 }, { "epoch": 0.83, "learning_rate": 3.5075908047587e-05, "loss": 2.2399, "step": 132032 }, { "epoch": 0.83, "learning_rate": 3.507097552655185e-05, "loss": 2.2239, "step": 132040 }, { "epoch": 0.83, "learning_rate": 3.506604362525503e-05, "loss": 2.2244, "step": 132048 }, { "epoch": 0.83, "learning_rate": 3.506111234381917e-05, "loss": 2.2304, "step": 132056 }, { "epoch": 0.83, "learning_rate": 3.505618168236686e-05, "loss": 2.2251, "step": 132064 }, { "epoch": 0.83, "learning_rate": 3.505125164102068e-05, "loss": 2.242, "step": 132072 }, { "epoch": 0.83, "learning_rate": 3.504632221990316e-05, "loss": 2.2252, "step": 132080 }, { "epoch": 0.83, "learning_rate": 3.504139341913687e-05, "loss": 2.2191, "step": 132088 }, { "epoch": 0.83, "learning_rate": 3.503646523884437e-05, "loss": 2.2214, "step": 132096 }, { "epoch": 0.83, "learning_rate": 3.503153767914812e-05, "loss": 2.2328, "step": 132104 }, { "epoch": 0.83, "learning_rate": 3.502661074017066e-05, "loss": 2.2312, "step": 132112 }, { "epoch": 0.83, "learning_rate": 3.502168442203446e-05, "loss": 2.2222, "step": 132120 }, { "epoch": 0.83, "learning_rate": 3.501675872486196e-05, "loss": 2.2285, "step": 132128 }, { "epoch": 0.83, "learning_rate": 3.501183364877567e-05, "loss": 2.22, "step": 132136 }, { "epoch": 0.83, "learning_rate": 3.5006909193897995e-05, "loss": 2.2161, "step": 132144 }, { "epoch": 0.83, "learning_rate": 3.500198536035135e-05, "loss": 2.2107, "step": 132152 }, { "epoch": 0.83, "learning_rate": 3.4997062148258156e-05, "loss": 2.2113, "step": 132160 }, { "epoch": 0.83, "learning_rate": 3.49921395577408e-05, "loss": 2.2308, "step": 132168 }, { "epoch": 0.83, "learning_rate": 3.4987217588921675e-05, "loss": 2.2417, "step": 132176 }, { "epoch": 0.83, "learning_rate": 3.498229624192312e-05, "loss": 2.2292, "step": 132184 }, { "epoch": 0.83, "learning_rate": 3.497737551686747e-05, "loss": 2.2337, "step": 132192 }, { "epoch": 0.83, "learning_rate": 3.497245541387711e-05, "loss": 2.2358, "step": 132200 }, { "epoch": 0.83, "learning_rate": 3.496753593307428e-05, "loss": 2.2436, "step": 132208 }, { "epoch": 0.83, "learning_rate": 3.496261707458133e-05, "loss": 2.2273, "step": 132216 }, { "epoch": 0.83, "learning_rate": 3.4957698838520524e-05, "loss": 2.227, "step": 132224 }, { "epoch": 0.83, "learning_rate": 3.495278122501414e-05, "loss": 2.2352, "step": 132232 }, { "epoch": 0.83, "learning_rate": 3.4947864234184416e-05, "loss": 2.2396, "step": 132240 }, { "epoch": 0.83, "learning_rate": 3.494294786615362e-05, "loss": 2.2384, "step": 132248 }, { "epoch": 0.83, "learning_rate": 3.493803212104394e-05, "loss": 2.2256, "step": 132256 }, { "epoch": 0.83, "learning_rate": 3.493311699897759e-05, "loss": 2.2285, "step": 132264 }, { "epoch": 0.83, "learning_rate": 3.4928202500076754e-05, "loss": 2.2385, "step": 132272 }, { "epoch": 0.83, "learning_rate": 3.4923288624463635e-05, "loss": 2.2355, "step": 132280 }, { "epoch": 0.83, "learning_rate": 3.491837537226037e-05, "loss": 2.2325, "step": 132288 }, { "epoch": 0.83, "learning_rate": 3.4913462743589096e-05, "loss": 2.2357, "step": 132296 }, { "epoch": 0.83, "learning_rate": 3.490855073857197e-05, "loss": 2.2477, "step": 132304 }, { "epoch": 0.83, "learning_rate": 3.4903639357331077e-05, "loss": 2.2149, "step": 132312 }, { "epoch": 0.83, "learning_rate": 3.489872859998852e-05, "loss": 2.2238, "step": 132320 }, { "epoch": 0.83, "learning_rate": 3.4893818466666396e-05, "loss": 2.2247, "step": 132328 }, { "epoch": 0.83, "learning_rate": 3.488890895748676e-05, "loss": 2.2256, "step": 132336 }, { "epoch": 0.83, "learning_rate": 3.4884000072571655e-05, "loss": 2.2285, "step": 132344 }, { "epoch": 0.83, "learning_rate": 3.487909181204314e-05, "loss": 2.231, "step": 132352 }, { "epoch": 0.83, "learning_rate": 3.487418417602322e-05, "loss": 2.2214, "step": 132360 }, { "epoch": 0.83, "learning_rate": 3.486927716463388e-05, "loss": 2.2226, "step": 132368 }, { "epoch": 0.83, "learning_rate": 3.4864370777997156e-05, "loss": 2.2237, "step": 132376 }, { "epoch": 0.83, "learning_rate": 3.4859465016234984e-05, "loss": 2.2252, "step": 132384 }, { "epoch": 0.83, "learning_rate": 3.4854559879469326e-05, "loss": 2.2304, "step": 132392 }, { "epoch": 0.83, "learning_rate": 3.484965536782214e-05, "loss": 2.2433, "step": 132400 }, { "epoch": 0.83, "learning_rate": 3.484475148141534e-05, "loss": 2.2254, "step": 132408 }, { "epoch": 0.83, "learning_rate": 3.483984822037086e-05, "loss": 2.2272, "step": 132416 }, { "epoch": 0.83, "learning_rate": 3.483494558481054e-05, "loss": 2.2296, "step": 132424 }, { "epoch": 0.83, "learning_rate": 3.4830043574856306e-05, "loss": 2.2235, "step": 132432 }, { "epoch": 0.83, "learning_rate": 3.482514219063003e-05, "loss": 2.2389, "step": 132440 }, { "epoch": 0.83, "learning_rate": 3.482024143225354e-05, "loss": 2.2252, "step": 132448 }, { "epoch": 0.83, "learning_rate": 3.481534129984865e-05, "loss": 2.2311, "step": 132456 }, { "epoch": 0.83, "learning_rate": 3.4810441793537226e-05, "loss": 2.23, "step": 132464 }, { "epoch": 0.83, "learning_rate": 3.480554291344105e-05, "loss": 2.2157, "step": 132472 }, { "epoch": 0.83, "learning_rate": 3.480064465968189e-05, "loss": 2.2309, "step": 132480 }, { "epoch": 0.83, "learning_rate": 3.479574703238152e-05, "loss": 2.2337, "step": 132488 }, { "epoch": 0.83, "learning_rate": 3.479085003166173e-05, "loss": 2.2222, "step": 132496 }, { "epoch": 0.83, "learning_rate": 3.478595365764422e-05, "loss": 2.2561, "step": 132504 }, { "epoch": 0.83, "learning_rate": 3.478105791045073e-05, "loss": 2.2259, "step": 132512 }, { "epoch": 0.83, "learning_rate": 3.477616279020298e-05, "loss": 2.2105, "step": 132520 }, { "epoch": 0.83, "learning_rate": 3.477126829702265e-05, "loss": 2.2314, "step": 132528 }, { "epoch": 0.83, "learning_rate": 3.476637443103142e-05, "loss": 2.2338, "step": 132536 }, { "epoch": 0.83, "learning_rate": 3.4761481192350954e-05, "loss": 2.2172, "step": 132544 }, { "epoch": 0.83, "learning_rate": 3.47565885811029e-05, "loss": 2.2046, "step": 132552 }, { "epoch": 0.83, "learning_rate": 3.475169659740888e-05, "loss": 2.226, "step": 132560 }, { "epoch": 0.83, "learning_rate": 3.474680524139052e-05, "loss": 2.229, "step": 132568 }, { "epoch": 0.83, "learning_rate": 3.47419145131694e-05, "loss": 2.2336, "step": 132576 }, { "epoch": 0.83, "learning_rate": 3.473702441286714e-05, "loss": 2.2161, "step": 132584 }, { "epoch": 0.83, "learning_rate": 3.473213494060528e-05, "loss": 2.2287, "step": 132592 }, { "epoch": 0.83, "learning_rate": 3.472724609650537e-05, "loss": 2.2196, "step": 132600 }, { "epoch": 0.83, "learning_rate": 3.472235788068897e-05, "loss": 2.2271, "step": 132608 }, { "epoch": 0.83, "learning_rate": 3.4717470293277594e-05, "loss": 2.2131, "step": 132616 }, { "epoch": 0.83, "learning_rate": 3.471258333439272e-05, "loss": 2.2409, "step": 132624 }, { "epoch": 0.83, "learning_rate": 3.47076970041559e-05, "loss": 2.2147, "step": 132632 }, { "epoch": 0.83, "learning_rate": 3.4702811302688544e-05, "loss": 2.2262, "step": 132640 }, { "epoch": 0.83, "learning_rate": 3.469792623011213e-05, "loss": 2.204, "step": 132648 }, { "epoch": 0.83, "learning_rate": 3.469304178654812e-05, "loss": 2.2135, "step": 132656 }, { "epoch": 0.83, "learning_rate": 3.468815797211794e-05, "loss": 2.2331, "step": 132664 }, { "epoch": 0.83, "learning_rate": 3.468327478694299e-05, "loss": 2.2264, "step": 132672 }, { "epoch": 0.83, "learning_rate": 3.467839223114465e-05, "loss": 2.2367, "step": 132680 }, { "epoch": 0.83, "learning_rate": 3.467351030484434e-05, "loss": 2.2461, "step": 132688 }, { "epoch": 0.83, "learning_rate": 3.46686290081634e-05, "loss": 2.2329, "step": 132696 }, { "epoch": 0.83, "learning_rate": 3.466374834122317e-05, "loss": 2.24, "step": 132704 }, { "epoch": 0.83, "learning_rate": 3.465886830414502e-05, "loss": 2.2315, "step": 132712 }, { "epoch": 0.83, "learning_rate": 3.465398889705024e-05, "loss": 2.238, "step": 132720 }, { "epoch": 0.83, "learning_rate": 3.4649110120060124e-05, "loss": 2.2279, "step": 132728 }, { "epoch": 0.83, "learning_rate": 3.4644231973296e-05, "loss": 2.2282, "step": 132736 }, { "epoch": 0.83, "learning_rate": 3.46393544568791e-05, "loss": 2.2255, "step": 132744 }, { "epoch": 0.83, "learning_rate": 3.463447757093069e-05, "loss": 2.2336, "step": 132752 }, { "epoch": 0.83, "learning_rate": 3.462960131557203e-05, "loss": 2.2248, "step": 132760 }, { "epoch": 0.83, "learning_rate": 3.462472569092432e-05, "loss": 2.236, "step": 132768 }, { "epoch": 0.83, "learning_rate": 3.4619850697108766e-05, "loss": 2.2256, "step": 132776 }, { "epoch": 0.83, "learning_rate": 3.461497633424659e-05, "loss": 2.2318, "step": 132784 }, { "epoch": 0.83, "learning_rate": 3.461010260245893e-05, "loss": 2.232, "step": 132792 }, { "epoch": 0.83, "learning_rate": 3.460522950186698e-05, "loss": 2.2271, "step": 132800 }, { "epoch": 0.83, "learning_rate": 3.460035703259188e-05, "loss": 2.2302, "step": 132808 }, { "epoch": 0.83, "learning_rate": 3.459548519475473e-05, "loss": 2.2273, "step": 132816 }, { "epoch": 0.83, "learning_rate": 3.459061398847669e-05, "loss": 2.2311, "step": 132824 }, { "epoch": 0.83, "learning_rate": 3.458574341387884e-05, "loss": 2.2329, "step": 132832 }, { "epoch": 0.83, "learning_rate": 3.4580873471082245e-05, "loss": 2.2182, "step": 132840 }, { "epoch": 0.83, "learning_rate": 3.457600416020801e-05, "loss": 2.2333, "step": 132848 }, { "epoch": 0.83, "learning_rate": 3.457113548137714e-05, "loss": 2.221, "step": 132856 }, { "epoch": 0.83, "learning_rate": 3.4566267434710696e-05, "loss": 2.2261, "step": 132864 }, { "epoch": 0.83, "learning_rate": 3.45614000203297e-05, "loss": 2.2331, "step": 132872 }, { "epoch": 0.83, "learning_rate": 3.455653323835517e-05, "loss": 2.2235, "step": 132880 }, { "epoch": 0.83, "learning_rate": 3.455166708890807e-05, "loss": 2.2327, "step": 132888 }, { "epoch": 0.83, "learning_rate": 3.4546801572109365e-05, "loss": 2.2402, "step": 132896 }, { "epoch": 0.83, "learning_rate": 3.4541936688080046e-05, "loss": 2.2383, "step": 132904 }, { "epoch": 0.83, "learning_rate": 3.453707243694104e-05, "loss": 2.2333, "step": 132912 }, { "epoch": 0.83, "learning_rate": 3.4532208818813255e-05, "loss": 2.2282, "step": 132920 }, { "epoch": 0.83, "learning_rate": 3.4527345833817614e-05, "loss": 2.2301, "step": 132928 }, { "epoch": 0.83, "learning_rate": 3.452248348207504e-05, "loss": 2.217, "step": 132936 }, { "epoch": 0.83, "learning_rate": 3.4517621763706366e-05, "loss": 2.2284, "step": 132944 }, { "epoch": 0.83, "learning_rate": 3.451276067883248e-05, "loss": 2.2402, "step": 132952 }, { "epoch": 0.83, "learning_rate": 3.450790022757423e-05, "loss": 2.2524, "step": 132960 }, { "epoch": 0.83, "learning_rate": 3.450304041005241e-05, "loss": 2.2393, "step": 132968 }, { "epoch": 0.83, "learning_rate": 3.4498181226387894e-05, "loss": 2.2419, "step": 132976 }, { "epoch": 0.83, "learning_rate": 3.449332267670145e-05, "loss": 2.2275, "step": 132984 }, { "epoch": 0.83, "learning_rate": 3.448846476111386e-05, "loss": 2.2145, "step": 132992 }, { "epoch": 0.83, "learning_rate": 3.4483607479745904e-05, "loss": 2.2475, "step": 133000 }, { "epoch": 0.83, "learning_rate": 3.447875083271831e-05, "loss": 2.2269, "step": 133008 }, { "epoch": 0.83, "learning_rate": 3.447389482015186e-05, "loss": 2.2226, "step": 133016 }, { "epoch": 0.83, "learning_rate": 3.4469039442167236e-05, "loss": 2.2178, "step": 133024 }, { "epoch": 0.83, "learning_rate": 3.4464184698885154e-05, "loss": 2.232, "step": 133032 }, { "epoch": 0.83, "learning_rate": 3.445933059042633e-05, "loss": 2.2177, "step": 133040 }, { "epoch": 0.83, "learning_rate": 3.445447711691139e-05, "loss": 2.2261, "step": 133048 }, { "epoch": 0.83, "learning_rate": 3.4449624278461e-05, "loss": 2.214, "step": 133056 }, { "epoch": 0.83, "learning_rate": 3.444477207519584e-05, "loss": 2.2307, "step": 133064 }, { "epoch": 0.83, "learning_rate": 3.443992050723651e-05, "loss": 2.2416, "step": 133072 }, { "epoch": 0.83, "learning_rate": 3.4435069574703615e-05, "loss": 2.228, "step": 133080 }, { "epoch": 0.83, "learning_rate": 3.4430219277717776e-05, "loss": 2.2288, "step": 133088 }, { "epoch": 0.83, "learning_rate": 3.442536961639955e-05, "loss": 2.2174, "step": 133096 }, { "epoch": 0.83, "learning_rate": 3.44205205908695e-05, "loss": 2.2319, "step": 133104 }, { "epoch": 0.83, "learning_rate": 3.441567220124817e-05, "loss": 2.2227, "step": 133112 }, { "epoch": 0.83, "learning_rate": 3.441082444765612e-05, "loss": 2.2349, "step": 133120 }, { "epoch": 0.83, "learning_rate": 3.440597733021383e-05, "loss": 2.2409, "step": 133128 }, { "epoch": 0.83, "learning_rate": 3.4401130849041805e-05, "loss": 2.24, "step": 133136 }, { "epoch": 0.83, "learning_rate": 3.439628500426054e-05, "loss": 2.2295, "step": 133144 }, { "epoch": 0.83, "learning_rate": 3.4391439795990536e-05, "loss": 2.2228, "step": 133152 }, { "epoch": 0.83, "learning_rate": 3.438659522435218e-05, "loss": 2.2192, "step": 133160 }, { "epoch": 0.83, "learning_rate": 3.438175128946596e-05, "loss": 2.2385, "step": 133168 }, { "epoch": 0.83, "learning_rate": 3.437690799145227e-05, "loss": 2.2279, "step": 133176 }, { "epoch": 0.83, "learning_rate": 3.437206533043151e-05, "loss": 2.2539, "step": 133184 }, { "epoch": 0.83, "learning_rate": 3.43672233065241e-05, "loss": 2.2224, "step": 133192 }, { "epoch": 0.83, "learning_rate": 3.4362381919850394e-05, "loss": 2.227, "step": 133200 }, { "epoch": 0.83, "learning_rate": 3.435754117053073e-05, "loss": 2.2444, "step": 133208 }, { "epoch": 0.83, "learning_rate": 3.435270105868549e-05, "loss": 2.2338, "step": 133216 }, { "epoch": 0.83, "learning_rate": 3.4347861584434956e-05, "loss": 2.2327, "step": 133224 }, { "epoch": 0.83, "learning_rate": 3.434302274789948e-05, "loss": 2.2226, "step": 133232 }, { "epoch": 0.83, "learning_rate": 3.4338184549199336e-05, "loss": 2.2302, "step": 133240 }, { "epoch": 0.83, "learning_rate": 3.433334698845479e-05, "loss": 2.2254, "step": 133248 }, { "epoch": 0.83, "learning_rate": 3.432851006578615e-05, "loss": 2.246, "step": 133256 }, { "epoch": 0.83, "learning_rate": 3.43236737813136e-05, "loss": 2.247, "step": 133264 }, { "epoch": 0.83, "learning_rate": 3.43188381351574e-05, "loss": 2.2316, "step": 133272 }, { "epoch": 0.83, "learning_rate": 3.431400312743778e-05, "loss": 2.2443, "step": 133280 }, { "epoch": 0.83, "learning_rate": 3.4309168758274925e-05, "loss": 2.2256, "step": 133288 }, { "epoch": 0.83, "learning_rate": 3.4304335027789e-05, "loss": 2.2211, "step": 133296 }, { "epoch": 0.83, "learning_rate": 3.42995019361002e-05, "loss": 2.2222, "step": 133304 }, { "epoch": 0.83, "learning_rate": 3.429466948332867e-05, "loss": 2.2294, "step": 133312 }, { "epoch": 0.83, "learning_rate": 3.428983766959454e-05, "loss": 2.2153, "step": 133320 }, { "epoch": 0.83, "learning_rate": 3.428500649501792e-05, "loss": 2.2214, "step": 133328 }, { "epoch": 0.83, "learning_rate": 3.4280175959718927e-05, "loss": 2.2141, "step": 133336 }, { "epoch": 0.83, "learning_rate": 3.427534606381766e-05, "loss": 2.2546, "step": 133344 }, { "epoch": 0.83, "learning_rate": 3.427051680743415e-05, "loss": 2.2353, "step": 133352 }, { "epoch": 0.83, "learning_rate": 3.42656881906885e-05, "loss": 2.2198, "step": 133360 }, { "epoch": 0.83, "learning_rate": 3.426086021370073e-05, "loss": 2.2451, "step": 133368 }, { "epoch": 0.83, "learning_rate": 3.425603287659084e-05, "loss": 2.2162, "step": 133376 }, { "epoch": 0.83, "learning_rate": 3.425120617947889e-05, "loss": 2.251, "step": 133384 }, { "epoch": 0.83, "learning_rate": 3.424638012248483e-05, "loss": 2.2348, "step": 133392 }, { "epoch": 0.83, "learning_rate": 3.4241554705728636e-05, "loss": 2.23, "step": 133400 }, { "epoch": 0.83, "learning_rate": 3.4236729929330306e-05, "loss": 2.2459, "step": 133408 }, { "epoch": 0.83, "learning_rate": 3.423190579340974e-05, "loss": 2.2327, "step": 133416 }, { "epoch": 0.83, "learning_rate": 3.422708229808689e-05, "loss": 2.2215, "step": 133424 }, { "epoch": 0.83, "learning_rate": 3.422225944348168e-05, "loss": 2.2285, "step": 133432 }, { "epoch": 0.83, "learning_rate": 3.4217437229713977e-05, "loss": 2.2276, "step": 133440 }, { "epoch": 0.83, "learning_rate": 3.421261565690369e-05, "loss": 2.2151, "step": 133448 }, { "epoch": 0.83, "learning_rate": 3.4207794725170675e-05, "loss": 2.2187, "step": 133456 }, { "epoch": 0.83, "learning_rate": 3.4202974434634763e-05, "loss": 2.2319, "step": 133464 }, { "epoch": 0.83, "learning_rate": 3.4198154785415815e-05, "loss": 2.2174, "step": 133472 }, { "epoch": 0.83, "learning_rate": 3.419333577763362e-05, "loss": 2.2294, "step": 133480 }, { "epoch": 0.83, "learning_rate": 3.418851741140798e-05, "loss": 2.21, "step": 133488 }, { "epoch": 0.83, "learning_rate": 3.418369968685872e-05, "loss": 2.2286, "step": 133496 }, { "epoch": 0.83, "learning_rate": 3.4178882604105575e-05, "loss": 2.2367, "step": 133504 }, { "epoch": 0.83, "learning_rate": 3.4174066163268313e-05, "loss": 2.2306, "step": 133512 }, { "epoch": 0.83, "learning_rate": 3.4169250364466644e-05, "loss": 2.2254, "step": 133520 }, { "epoch": 0.83, "learning_rate": 3.416443520782032e-05, "loss": 2.234, "step": 133528 }, { "epoch": 0.83, "learning_rate": 3.415962069344905e-05, "loss": 2.2462, "step": 133536 }, { "epoch": 0.83, "learning_rate": 3.415480682147248e-05, "loss": 2.2151, "step": 133544 }, { "epoch": 0.83, "learning_rate": 3.414999359201033e-05, "loss": 2.217, "step": 133552 }, { "epoch": 0.83, "learning_rate": 3.414518100518224e-05, "loss": 2.2356, "step": 133560 }, { "epoch": 0.83, "learning_rate": 3.4140369061107835e-05, "loss": 2.2434, "step": 133568 }, { "epoch": 0.83, "learning_rate": 3.413555775990678e-05, "loss": 2.2438, "step": 133576 }, { "epoch": 0.83, "learning_rate": 3.413074710169865e-05, "loss": 2.234, "step": 133584 }, { "epoch": 0.83, "learning_rate": 3.4125937086603047e-05, "loss": 2.2242, "step": 133592 }, { "epoch": 0.83, "learning_rate": 3.4121127714739555e-05, "loss": 2.2364, "step": 133600 }, { "epoch": 0.84, "learning_rate": 3.411631898622772e-05, "loss": 2.2288, "step": 133608 }, { "epoch": 0.84, "learning_rate": 3.4111510901187105e-05, "loss": 2.2349, "step": 133616 }, { "epoch": 0.84, "learning_rate": 3.410670345973724e-05, "loss": 2.2363, "step": 133624 }, { "epoch": 0.84, "learning_rate": 3.4101896661997626e-05, "loss": 2.2474, "step": 133632 }, { "epoch": 0.84, "learning_rate": 3.409709050808777e-05, "loss": 2.2273, "step": 133640 }, { "epoch": 0.84, "learning_rate": 3.409228499812716e-05, "loss": 2.2291, "step": 133648 }, { "epoch": 0.84, "learning_rate": 3.408748013223523e-05, "loss": 2.231, "step": 133656 }, { "epoch": 0.84, "learning_rate": 3.4082675910531466e-05, "loss": 2.2305, "step": 133664 }, { "epoch": 0.84, "learning_rate": 3.40778723331353e-05, "loss": 2.2304, "step": 133672 }, { "epoch": 0.84, "learning_rate": 3.40730694001661e-05, "loss": 2.2251, "step": 133680 }, { "epoch": 0.84, "learning_rate": 3.406826711174335e-05, "loss": 2.2058, "step": 133688 }, { "epoch": 0.84, "learning_rate": 3.4063465467986355e-05, "loss": 2.2429, "step": 133696 }, { "epoch": 0.84, "learning_rate": 3.405866446901451e-05, "loss": 2.2228, "step": 133704 }, { "epoch": 0.84, "learning_rate": 3.40538641149472e-05, "loss": 2.2185, "step": 133712 }, { "epoch": 0.84, "learning_rate": 3.404906440590374e-05, "loss": 2.2271, "step": 133720 }, { "epoch": 0.84, "learning_rate": 3.404426534200344e-05, "loss": 2.2341, "step": 133728 }, { "epoch": 0.84, "learning_rate": 3.403946692336562e-05, "loss": 2.2395, "step": 133736 }, { "epoch": 0.84, "learning_rate": 3.403466915010957e-05, "loss": 2.2397, "step": 133744 }, { "epoch": 0.84, "learning_rate": 3.402987202235455e-05, "loss": 2.2292, "step": 133752 }, { "epoch": 0.84, "learning_rate": 3.402507554021982e-05, "loss": 2.2311, "step": 133760 }, { "epoch": 0.84, "learning_rate": 3.402027970382462e-05, "loss": 2.2227, "step": 133768 }, { "epoch": 0.84, "learning_rate": 3.401548451328822e-05, "loss": 2.2309, "step": 133776 }, { "epoch": 0.84, "learning_rate": 3.401068996872975e-05, "loss": 2.2222, "step": 133784 }, { "epoch": 0.84, "learning_rate": 3.400589607026846e-05, "loss": 2.2245, "step": 133792 }, { "epoch": 0.84, "learning_rate": 3.400110281802352e-05, "loss": 2.2283, "step": 133800 }, { "epoch": 0.84, "learning_rate": 3.399631021211406e-05, "loss": 2.2386, "step": 133808 }, { "epoch": 0.84, "learning_rate": 3.399151825265926e-05, "loss": 2.2373, "step": 133816 }, { "epoch": 0.84, "learning_rate": 3.398672693977823e-05, "loss": 2.2291, "step": 133824 }, { "epoch": 0.84, "learning_rate": 3.398193627359008e-05, "loss": 2.2355, "step": 133832 }, { "epoch": 0.84, "learning_rate": 3.397714625421393e-05, "loss": 2.2402, "step": 133840 }, { "epoch": 0.84, "learning_rate": 3.397235688176882e-05, "loss": 2.2124, "step": 133848 }, { "epoch": 0.84, "learning_rate": 3.396756815637386e-05, "loss": 2.2118, "step": 133856 }, { "epoch": 0.84, "learning_rate": 3.396278007814807e-05, "loss": 2.2479, "step": 133864 }, { "epoch": 0.84, "learning_rate": 3.3957992647210476e-05, "loss": 2.2385, "step": 133872 }, { "epoch": 0.84, "learning_rate": 3.395320586368014e-05, "loss": 2.2263, "step": 133880 }, { "epoch": 0.84, "learning_rate": 3.3948419727676e-05, "loss": 2.2383, "step": 133888 }, { "epoch": 0.84, "learning_rate": 3.394363423931706e-05, "loss": 2.2242, "step": 133896 }, { "epoch": 0.84, "learning_rate": 3.393884939872234e-05, "loss": 2.2191, "step": 133904 }, { "epoch": 0.84, "learning_rate": 3.39340652060107e-05, "loss": 2.2311, "step": 133912 }, { "epoch": 0.84, "learning_rate": 3.3929281661301135e-05, "loss": 2.2281, "step": 133920 }, { "epoch": 0.84, "learning_rate": 3.3924498764712564e-05, "loss": 2.2307, "step": 133928 }, { "epoch": 0.84, "learning_rate": 3.3919716516363885e-05, "loss": 2.2407, "step": 133936 }, { "epoch": 0.84, "learning_rate": 3.3914934916373974e-05, "loss": 2.2217, "step": 133944 }, { "epoch": 0.84, "learning_rate": 3.39101539648617e-05, "loss": 2.2288, "step": 133952 }, { "epoch": 0.84, "learning_rate": 3.390537366194593e-05, "loss": 2.2256, "step": 133960 }, { "epoch": 0.84, "learning_rate": 3.39005940077455e-05, "loss": 2.2476, "step": 133968 }, { "epoch": 0.84, "learning_rate": 3.389581500237923e-05, "loss": 2.2314, "step": 133976 }, { "epoch": 0.84, "learning_rate": 3.389103664596591e-05, "loss": 2.2307, "step": 133984 }, { "epoch": 0.84, "learning_rate": 3.388625893862439e-05, "loss": 2.2164, "step": 133992 }, { "epoch": 0.84, "learning_rate": 3.3881481880473366e-05, "loss": 2.2413, "step": 134000 }, { "epoch": 0.84, "learning_rate": 3.387670547163165e-05, "loss": 2.2238, "step": 134008 }, { "epoch": 0.84, "learning_rate": 3.3871929712217966e-05, "loss": 2.2419, "step": 134016 }, { "epoch": 0.84, "learning_rate": 3.386715460235103e-05, "loss": 2.2335, "step": 134024 }, { "epoch": 0.84, "learning_rate": 3.386238014214957e-05, "loss": 2.2187, "step": 134032 }, { "epoch": 0.84, "learning_rate": 3.3857606331732284e-05, "loss": 2.2413, "step": 134040 }, { "epoch": 0.84, "learning_rate": 3.385283317121781e-05, "loss": 2.2251, "step": 134048 }, { "epoch": 0.84, "learning_rate": 3.384806066072486e-05, "loss": 2.2473, "step": 134056 }, { "epoch": 0.84, "learning_rate": 3.384328880037204e-05, "loss": 2.2322, "step": 134064 }, { "epoch": 0.84, "learning_rate": 3.3838517590278014e-05, "loss": 2.2356, "step": 134072 }, { "epoch": 0.84, "learning_rate": 3.383374703056137e-05, "loss": 2.2374, "step": 134080 }, { "epoch": 0.84, "learning_rate": 3.3828977121340696e-05, "loss": 2.2402, "step": 134088 }, { "epoch": 0.84, "learning_rate": 3.3824207862734613e-05, "loss": 2.2445, "step": 134096 }, { "epoch": 0.84, "learning_rate": 3.381943925486164e-05, "loss": 2.2373, "step": 134104 }, { "epoch": 0.84, "learning_rate": 3.381467129784034e-05, "loss": 2.2278, "step": 134112 }, { "epoch": 0.84, "learning_rate": 3.380990399178926e-05, "loss": 2.2305, "step": 134120 }, { "epoch": 0.84, "learning_rate": 3.380513733682691e-05, "loss": 2.2261, "step": 134128 }, { "epoch": 0.84, "learning_rate": 3.380037133307177e-05, "loss": 2.2268, "step": 134136 }, { "epoch": 0.84, "learning_rate": 3.379560598064235e-05, "loss": 2.2247, "step": 134144 }, { "epoch": 0.84, "learning_rate": 3.37908412796571e-05, "loss": 2.2197, "step": 134152 }, { "epoch": 0.84, "learning_rate": 3.378607723023449e-05, "loss": 2.233, "step": 134160 }, { "epoch": 0.84, "learning_rate": 3.3781313832492926e-05, "loss": 2.2258, "step": 134168 }, { "epoch": 0.84, "learning_rate": 3.377655108655085e-05, "loss": 2.2286, "step": 134176 }, { "epoch": 0.84, "learning_rate": 3.3771788992526646e-05, "loss": 2.2258, "step": 134184 }, { "epoch": 0.84, "learning_rate": 3.376702755053871e-05, "loss": 2.2346, "step": 134192 }, { "epoch": 0.84, "learning_rate": 3.3762266760705423e-05, "loss": 2.2363, "step": 134200 }, { "epoch": 0.84, "learning_rate": 3.375750662314513e-05, "loss": 2.2378, "step": 134208 }, { "epoch": 0.84, "learning_rate": 3.3752747137976146e-05, "loss": 2.2359, "step": 134216 }, { "epoch": 0.84, "learning_rate": 3.374798830531684e-05, "loss": 2.2236, "step": 134224 }, { "epoch": 0.84, "learning_rate": 3.374323012528547e-05, "loss": 2.2302, "step": 134232 }, { "epoch": 0.84, "learning_rate": 3.373847259800035e-05, "loss": 2.2248, "step": 134240 }, { "epoch": 0.84, "learning_rate": 3.373371572357976e-05, "loss": 2.2468, "step": 134248 }, { "epoch": 0.84, "learning_rate": 3.372895950214193e-05, "loss": 2.2353, "step": 134256 }, { "epoch": 0.84, "learning_rate": 3.372420393380511e-05, "loss": 2.2262, "step": 134264 }, { "epoch": 0.84, "learning_rate": 3.371944901868754e-05, "loss": 2.2186, "step": 134272 }, { "epoch": 0.84, "learning_rate": 3.37146947569074e-05, "loss": 2.2152, "step": 134280 }, { "epoch": 0.84, "learning_rate": 3.370994114858292e-05, "loss": 2.2439, "step": 134288 }, { "epoch": 0.84, "learning_rate": 3.3705188193832246e-05, "loss": 2.2252, "step": 134296 }, { "epoch": 0.84, "learning_rate": 3.370043589277354e-05, "loss": 2.2376, "step": 134304 }, { "epoch": 0.84, "learning_rate": 3.369568424552496e-05, "loss": 2.2406, "step": 134312 }, { "epoch": 0.84, "learning_rate": 3.3690933252204605e-05, "loss": 2.2205, "step": 134320 }, { "epoch": 0.84, "learning_rate": 3.36861829129306e-05, "loss": 2.2373, "step": 134328 }, { "epoch": 0.84, "learning_rate": 3.368143322782105e-05, "loss": 2.2177, "step": 134336 }, { "epoch": 0.84, "learning_rate": 3.3676684196994024e-05, "loss": 2.2221, "step": 134344 }, { "epoch": 0.84, "learning_rate": 3.3671935820567566e-05, "loss": 2.2313, "step": 134352 }, { "epoch": 0.84, "learning_rate": 3.366718809865975e-05, "loss": 2.2247, "step": 134360 }, { "epoch": 0.84, "learning_rate": 3.3662441031388605e-05, "loss": 2.2189, "step": 134368 }, { "epoch": 0.84, "learning_rate": 3.365769461887211e-05, "loss": 2.2231, "step": 134376 }, { "epoch": 0.84, "learning_rate": 3.365294886122829e-05, "loss": 2.2254, "step": 134384 }, { "epoch": 0.84, "learning_rate": 3.364820375857512e-05, "loss": 2.2289, "step": 134392 }, { "epoch": 0.84, "learning_rate": 3.3643459311030564e-05, "loss": 2.2253, "step": 134400 }, { "epoch": 0.84, "learning_rate": 3.363871551871255e-05, "loss": 2.2325, "step": 134408 }, { "epoch": 0.84, "learning_rate": 3.363397238173904e-05, "loss": 2.2288, "step": 134416 }, { "epoch": 0.84, "learning_rate": 3.3629229900227944e-05, "loss": 2.2371, "step": 134424 }, { "epoch": 0.84, "learning_rate": 3.362448807429712e-05, "loss": 2.2365, "step": 134432 }, { "epoch": 0.84, "learning_rate": 3.361974690406451e-05, "loss": 2.2269, "step": 134440 }, { "epoch": 0.84, "learning_rate": 3.361500638964795e-05, "loss": 2.2196, "step": 134448 }, { "epoch": 0.84, "learning_rate": 3.361026653116527e-05, "loss": 2.2226, "step": 134456 }, { "epoch": 0.84, "learning_rate": 3.360552732873434e-05, "loss": 2.2266, "step": 134464 }, { "epoch": 0.84, "learning_rate": 3.3600788782472956e-05, "loss": 2.2347, "step": 134472 }, { "epoch": 0.84, "learning_rate": 3.3596050892498937e-05, "loss": 2.2454, "step": 134480 }, { "epoch": 0.84, "learning_rate": 3.359131365893005e-05, "loss": 2.2528, "step": 134488 }, { "epoch": 0.84, "learning_rate": 3.358657708188406e-05, "loss": 2.2432, "step": 134496 }, { "epoch": 0.84, "learning_rate": 3.358184116147874e-05, "loss": 2.2129, "step": 134504 }, { "epoch": 0.84, "learning_rate": 3.3577105897831805e-05, "loss": 2.2317, "step": 134512 }, { "epoch": 0.84, "learning_rate": 3.3572371291060976e-05, "loss": 2.2166, "step": 134520 }, { "epoch": 0.84, "learning_rate": 3.356763734128399e-05, "loss": 2.2245, "step": 134528 }, { "epoch": 0.84, "learning_rate": 3.356290404861847e-05, "loss": 2.2312, "step": 134536 }, { "epoch": 0.84, "learning_rate": 3.3558171413182123e-05, "loss": 2.2223, "step": 134544 }, { "epoch": 0.84, "learning_rate": 3.3553439435092625e-05, "loss": 2.2209, "step": 134552 }, { "epoch": 0.84, "learning_rate": 3.354870811446759e-05, "loss": 2.2332, "step": 134560 }, { "epoch": 0.84, "learning_rate": 3.354397745142464e-05, "loss": 2.2188, "step": 134568 }, { "epoch": 0.84, "learning_rate": 3.3539247446081344e-05, "loss": 2.226, "step": 134576 }, { "epoch": 0.84, "learning_rate": 3.353451809855536e-05, "loss": 2.2203, "step": 134584 }, { "epoch": 0.84, "learning_rate": 3.352978940896422e-05, "loss": 2.2349, "step": 134592 }, { "epoch": 0.84, "learning_rate": 3.352506137742546e-05, "loss": 2.2271, "step": 134600 }, { "epoch": 0.84, "learning_rate": 3.3520334004056676e-05, "loss": 2.2331, "step": 134608 }, { "epoch": 0.84, "learning_rate": 3.3515607288975347e-05, "loss": 2.2341, "step": 134616 }, { "epoch": 0.84, "learning_rate": 3.351088123229899e-05, "loss": 2.2164, "step": 134624 }, { "epoch": 0.84, "learning_rate": 3.35061558341451e-05, "loss": 2.2248, "step": 134632 }, { "epoch": 0.84, "learning_rate": 3.350143109463116e-05, "loss": 2.2171, "step": 134640 }, { "epoch": 0.84, "learning_rate": 3.3496707013874596e-05, "loss": 2.2288, "step": 134648 }, { "epoch": 0.84, "learning_rate": 3.349198359199288e-05, "loss": 2.2264, "step": 134656 }, { "epoch": 0.84, "learning_rate": 3.3487260829103426e-05, "loss": 2.2254, "step": 134664 }, { "epoch": 0.84, "learning_rate": 3.348253872532363e-05, "loss": 2.2227, "step": 134672 }, { "epoch": 0.84, "learning_rate": 3.347781728077092e-05, "loss": 2.2285, "step": 134680 }, { "epoch": 0.84, "learning_rate": 3.3473096495562615e-05, "loss": 2.2425, "step": 134688 }, { "epoch": 0.84, "learning_rate": 3.346837636981614e-05, "loss": 2.2355, "step": 134696 }, { "epoch": 0.84, "learning_rate": 3.34636569036488e-05, "loss": 2.2353, "step": 134704 }, { "epoch": 0.84, "learning_rate": 3.3458938097177904e-05, "loss": 2.2277, "step": 134712 }, { "epoch": 0.84, "learning_rate": 3.3454219950520825e-05, "loss": 2.2162, "step": 134720 }, { "epoch": 0.84, "learning_rate": 3.344950246379478e-05, "loss": 2.229, "step": 134728 }, { "epoch": 0.84, "learning_rate": 3.344478563711709e-05, "loss": 2.2235, "step": 134736 }, { "epoch": 0.84, "learning_rate": 3.344006947060503e-05, "loss": 2.231, "step": 134744 }, { "epoch": 0.84, "learning_rate": 3.3435353964375796e-05, "loss": 2.2327, "step": 134752 }, { "epoch": 0.84, "learning_rate": 3.343063911854665e-05, "loss": 2.2291, "step": 134760 }, { "epoch": 0.84, "learning_rate": 3.34259249332348e-05, "loss": 2.2241, "step": 134768 }, { "epoch": 0.84, "learning_rate": 3.342121140855744e-05, "loss": 2.2321, "step": 134776 }, { "epoch": 0.84, "learning_rate": 3.3416498544631745e-05, "loss": 2.2177, "step": 134784 }, { "epoch": 0.84, "learning_rate": 3.341178634157487e-05, "loss": 2.2218, "step": 134792 }, { "epoch": 0.84, "learning_rate": 3.340707479950398e-05, "loss": 2.2192, "step": 134800 }, { "epoch": 0.84, "learning_rate": 3.340236391853619e-05, "loss": 2.2318, "step": 134808 }, { "epoch": 0.84, "learning_rate": 3.3397653698788614e-05, "loss": 2.2276, "step": 134816 }, { "epoch": 0.84, "learning_rate": 3.339294414037835e-05, "loss": 2.2335, "step": 134824 }, { "epoch": 0.84, "learning_rate": 3.3388235243422506e-05, "loss": 2.2309, "step": 134832 }, { "epoch": 0.84, "learning_rate": 3.338352700803808e-05, "loss": 2.2316, "step": 134840 }, { "epoch": 0.84, "learning_rate": 3.337881943434219e-05, "loss": 2.2354, "step": 134848 }, { "epoch": 0.84, "learning_rate": 3.337411252245183e-05, "loss": 2.2329, "step": 134856 }, { "epoch": 0.84, "learning_rate": 3.3369406272484e-05, "loss": 2.2272, "step": 134864 }, { "epoch": 0.84, "learning_rate": 3.336470068455574e-05, "loss": 2.2372, "step": 134872 }, { "epoch": 0.84, "learning_rate": 3.335999575878401e-05, "loss": 2.2237, "step": 134880 }, { "epoch": 0.84, "learning_rate": 3.3355291495285756e-05, "loss": 2.2308, "step": 134888 }, { "epoch": 0.84, "learning_rate": 3.335058789417796e-05, "loss": 2.2284, "step": 134896 }, { "epoch": 0.84, "learning_rate": 3.334588495557752e-05, "loss": 2.2314, "step": 134904 }, { "epoch": 0.84, "learning_rate": 3.334118267960139e-05, "loss": 2.2383, "step": 134912 }, { "epoch": 0.84, "learning_rate": 3.333648106636645e-05, "loss": 2.2332, "step": 134920 }, { "epoch": 0.84, "learning_rate": 3.333178011598957e-05, "loss": 2.232, "step": 134928 }, { "epoch": 0.84, "learning_rate": 3.332707982858765e-05, "loss": 2.2432, "step": 134936 }, { "epoch": 0.84, "learning_rate": 3.332238020427749e-05, "loss": 2.2253, "step": 134944 }, { "epoch": 0.84, "learning_rate": 3.331768124317596e-05, "loss": 2.2336, "step": 134952 }, { "epoch": 0.84, "learning_rate": 3.331298294539989e-05, "loss": 2.2171, "step": 134960 }, { "epoch": 0.84, "learning_rate": 3.330828531106603e-05, "loss": 2.2312, "step": 134968 }, { "epoch": 0.84, "learning_rate": 3.3303588340291195e-05, "loss": 2.2289, "step": 134976 }, { "epoch": 0.84, "learning_rate": 3.3298892033192164e-05, "loss": 2.2346, "step": 134984 }, { "epoch": 0.84, "learning_rate": 3.329419638988567e-05, "loss": 2.2292, "step": 134992 }, { "epoch": 0.84, "learning_rate": 3.3289501410488446e-05, "loss": 2.2298, "step": 135000 }, { "epoch": 0.84, "learning_rate": 3.328480709511721e-05, "loss": 2.2269, "step": 135008 }, { "epoch": 0.84, "learning_rate": 3.328011344388867e-05, "loss": 2.238, "step": 135016 }, { "epoch": 0.84, "learning_rate": 3.3275420456919514e-05, "loss": 2.2217, "step": 135024 }, { "epoch": 0.84, "learning_rate": 3.327072813432639e-05, "loss": 2.2321, "step": 135032 }, { "epoch": 0.84, "learning_rate": 3.3266036476225973e-05, "loss": 2.2286, "step": 135040 }, { "epoch": 0.84, "learning_rate": 3.3261345482734894e-05, "loss": 2.2414, "step": 135048 }, { "epoch": 0.84, "learning_rate": 3.325665515396975e-05, "loss": 2.2348, "step": 135056 }, { "epoch": 0.84, "learning_rate": 3.325196549004717e-05, "loss": 2.2197, "step": 135064 }, { "epoch": 0.84, "learning_rate": 3.324727649108373e-05, "loss": 2.2365, "step": 135072 }, { "epoch": 0.84, "learning_rate": 3.324258815719599e-05, "loss": 2.2372, "step": 135080 }, { "epoch": 0.84, "learning_rate": 3.323790048850052e-05, "loss": 2.2426, "step": 135088 }, { "epoch": 0.84, "learning_rate": 3.323321348511384e-05, "loss": 2.222, "step": 135096 }, { "epoch": 0.84, "learning_rate": 3.3228527147152475e-05, "loss": 2.2363, "step": 135104 }, { "epoch": 0.84, "learning_rate": 3.322384147473294e-05, "loss": 2.2267, "step": 135112 }, { "epoch": 0.84, "learning_rate": 3.32191564679717e-05, "loss": 2.2157, "step": 135120 }, { "epoch": 0.84, "learning_rate": 3.321447212698524e-05, "loss": 2.2205, "step": 135128 }, { "epoch": 0.84, "learning_rate": 3.3209788451890006e-05, "loss": 2.2367, "step": 135136 }, { "epoch": 0.84, "learning_rate": 3.320510544280243e-05, "loss": 2.233, "step": 135144 }, { "epoch": 0.84, "learning_rate": 3.3200423099838965e-05, "loss": 2.2249, "step": 135152 }, { "epoch": 0.84, "learning_rate": 3.319574142311595e-05, "loss": 2.2242, "step": 135160 }, { "epoch": 0.84, "learning_rate": 3.319106041274983e-05, "loss": 2.2145, "step": 135168 }, { "epoch": 0.84, "learning_rate": 3.318638006885696e-05, "loss": 2.2522, "step": 135176 }, { "epoch": 0.84, "learning_rate": 3.318170039155369e-05, "loss": 2.2263, "step": 135184 }, { "epoch": 0.84, "learning_rate": 3.317702138095634e-05, "loss": 2.2246, "step": 135192 }, { "epoch": 0.84, "learning_rate": 3.317234303718127e-05, "loss": 2.2236, "step": 135200 }, { "epoch": 0.85, "learning_rate": 3.316766536034476e-05, "loss": 2.2301, "step": 135208 }, { "epoch": 0.85, "learning_rate": 3.316298835056309e-05, "loss": 2.232, "step": 135216 }, { "epoch": 0.85, "learning_rate": 3.315831200795254e-05, "loss": 2.2255, "step": 135224 }, { "epoch": 0.85, "learning_rate": 3.3153636332629377e-05, "loss": 2.2197, "step": 135232 }, { "epoch": 0.85, "learning_rate": 3.314896132470982e-05, "loss": 2.2379, "step": 135240 }, { "epoch": 0.85, "learning_rate": 3.314428698431009e-05, "loss": 2.2343, "step": 135248 }, { "epoch": 0.85, "learning_rate": 3.31396133115464e-05, "loss": 2.2256, "step": 135256 }, { "epoch": 0.85, "learning_rate": 3.313494030653495e-05, "loss": 2.2333, "step": 135264 }, { "epoch": 0.85, "learning_rate": 3.3130267969391884e-05, "loss": 2.2201, "step": 135272 }, { "epoch": 0.85, "learning_rate": 3.312559630023337e-05, "loss": 2.2196, "step": 135280 }, { "epoch": 0.85, "learning_rate": 3.3120925299175566e-05, "loss": 2.2158, "step": 135288 }, { "epoch": 0.85, "learning_rate": 3.311625496633455e-05, "loss": 2.2322, "step": 135296 }, { "epoch": 0.85, "learning_rate": 3.311158530182648e-05, "loss": 2.2442, "step": 135304 }, { "epoch": 0.85, "learning_rate": 3.31069163057674e-05, "loss": 2.2326, "step": 135312 }, { "epoch": 0.85, "learning_rate": 3.310224797827338e-05, "loss": 2.232, "step": 135320 }, { "epoch": 0.85, "learning_rate": 3.309758031946052e-05, "loss": 2.2294, "step": 135328 }, { "epoch": 0.85, "learning_rate": 3.309291332944482e-05, "loss": 2.2371, "step": 135336 }, { "epoch": 0.85, "learning_rate": 3.308824700834232e-05, "loss": 2.2385, "step": 135344 }, { "epoch": 0.85, "learning_rate": 3.3083581356269014e-05, "loss": 2.2183, "step": 135352 }, { "epoch": 0.85, "learning_rate": 3.307891637334089e-05, "loss": 2.2303, "step": 135360 }, { "epoch": 0.85, "learning_rate": 3.307425205967395e-05, "loss": 2.2297, "step": 135368 }, { "epoch": 0.85, "learning_rate": 3.30695884153841e-05, "loss": 2.2271, "step": 135376 }, { "epoch": 0.85, "learning_rate": 3.30649254405873e-05, "loss": 2.2342, "step": 135384 }, { "epoch": 0.85, "learning_rate": 3.3060263135399495e-05, "loss": 2.2367, "step": 135392 }, { "epoch": 0.85, "learning_rate": 3.3055601499936564e-05, "loss": 2.2358, "step": 135400 }, { "epoch": 0.85, "learning_rate": 3.30509405343144e-05, "loss": 2.2344, "step": 135408 }, { "epoch": 0.85, "learning_rate": 3.304628023864888e-05, "loss": 2.2391, "step": 135416 }, { "epoch": 0.85, "learning_rate": 3.304162061305586e-05, "loss": 2.2252, "step": 135424 }, { "epoch": 0.85, "learning_rate": 3.3036961657651175e-05, "loss": 2.2588, "step": 135432 }, { "epoch": 0.85, "learning_rate": 3.303230337255064e-05, "loss": 2.2377, "step": 135440 }, { "epoch": 0.85, "learning_rate": 3.302764575787008e-05, "loss": 2.2395, "step": 135448 }, { "epoch": 0.85, "learning_rate": 3.3022988813725266e-05, "loss": 2.2357, "step": 135456 }, { "epoch": 0.85, "learning_rate": 3.301833254023197e-05, "loss": 2.2506, "step": 135464 }, { "epoch": 0.85, "learning_rate": 3.3013676937505966e-05, "loss": 2.2197, "step": 135472 }, { "epoch": 0.85, "learning_rate": 3.300902200566298e-05, "loss": 2.2134, "step": 135480 }, { "epoch": 0.85, "learning_rate": 3.300436774481873e-05, "loss": 2.222, "step": 135488 }, { "epoch": 0.85, "learning_rate": 3.2999714155088934e-05, "loss": 2.2365, "step": 135496 }, { "epoch": 0.85, "learning_rate": 3.299506123658928e-05, "loss": 2.2365, "step": 135504 }, { "epoch": 0.85, "learning_rate": 3.2990408989435405e-05, "loss": 2.2366, "step": 135512 }, { "epoch": 0.85, "learning_rate": 3.2985757413743015e-05, "loss": 2.2227, "step": 135520 }, { "epoch": 0.85, "learning_rate": 3.298110650962772e-05, "loss": 2.2224, "step": 135528 }, { "epoch": 0.85, "learning_rate": 3.297645627720515e-05, "loss": 2.2117, "step": 135536 }, { "epoch": 0.85, "learning_rate": 3.2971806716590915e-05, "loss": 2.2226, "step": 135544 }, { "epoch": 0.85, "learning_rate": 3.296715782790059e-05, "loss": 2.2328, "step": 135552 }, { "epoch": 0.85, "learning_rate": 3.296250961124977e-05, "loss": 2.2245, "step": 135560 }, { "epoch": 0.85, "learning_rate": 3.2957862066753976e-05, "loss": 2.2182, "step": 135568 }, { "epoch": 0.85, "learning_rate": 3.295321519452876e-05, "loss": 2.2234, "step": 135576 }, { "epoch": 0.85, "learning_rate": 3.294856899468968e-05, "loss": 2.2009, "step": 135584 }, { "epoch": 0.85, "learning_rate": 3.2943923467352175e-05, "loss": 2.2199, "step": 135592 }, { "epoch": 0.85, "learning_rate": 3.2939278612631776e-05, "loss": 2.2205, "step": 135600 }, { "epoch": 0.85, "learning_rate": 3.293463443064396e-05, "loss": 2.2274, "step": 135608 }, { "epoch": 0.85, "learning_rate": 3.292999092150416e-05, "loss": 2.2203, "step": 135616 }, { "epoch": 0.85, "learning_rate": 3.2925348085327835e-05, "loss": 2.2415, "step": 135624 }, { "epoch": 0.85, "learning_rate": 3.2920705922230376e-05, "loss": 2.2379, "step": 135632 }, { "epoch": 0.85, "learning_rate": 3.291606443232722e-05, "loss": 2.2443, "step": 135640 }, { "epoch": 0.85, "learning_rate": 3.2911423615733736e-05, "loss": 2.2115, "step": 135648 }, { "epoch": 0.85, "learning_rate": 3.2906783472565294e-05, "loss": 2.2439, "step": 135656 }, { "epoch": 0.85, "learning_rate": 3.2902144002937265e-05, "loss": 2.2246, "step": 135664 }, { "epoch": 0.85, "learning_rate": 3.2897505206964974e-05, "loss": 2.2245, "step": 135672 }, { "epoch": 0.85, "learning_rate": 3.2892867084763733e-05, "loss": 2.2242, "step": 135680 }, { "epoch": 0.85, "learning_rate": 3.2888229636448875e-05, "loss": 2.2186, "step": 135688 }, { "epoch": 0.85, "learning_rate": 3.2883592862135656e-05, "loss": 2.2303, "step": 135696 }, { "epoch": 0.85, "learning_rate": 3.287895676193936e-05, "loss": 2.2083, "step": 135704 }, { "epoch": 0.85, "learning_rate": 3.287432133597526e-05, "loss": 2.2318, "step": 135712 }, { "epoch": 0.85, "learning_rate": 3.286968658435857e-05, "loss": 2.2265, "step": 135720 }, { "epoch": 0.85, "learning_rate": 3.2865052507204495e-05, "loss": 2.2238, "step": 135728 }, { "epoch": 0.85, "learning_rate": 3.286041910462828e-05, "loss": 2.2513, "step": 135736 }, { "epoch": 0.85, "learning_rate": 3.2855786376745076e-05, "loss": 2.2288, "step": 135744 }, { "epoch": 0.85, "learning_rate": 3.285115432367008e-05, "loss": 2.2319, "step": 135752 }, { "epoch": 0.85, "learning_rate": 3.2846522945518435e-05, "loss": 2.2292, "step": 135760 }, { "epoch": 0.85, "learning_rate": 3.2841892242405264e-05, "loss": 2.2282, "step": 135768 }, { "epoch": 0.85, "learning_rate": 3.2837262214445724e-05, "loss": 2.2332, "step": 135776 }, { "epoch": 0.85, "learning_rate": 3.283263286175486e-05, "loss": 2.2451, "step": 135784 }, { "epoch": 0.85, "learning_rate": 3.28280041844478e-05, "loss": 2.2432, "step": 135792 }, { "epoch": 0.85, "learning_rate": 3.282337618263963e-05, "loss": 2.2242, "step": 135800 }, { "epoch": 0.85, "learning_rate": 3.281874885644535e-05, "loss": 2.2364, "step": 135808 }, { "epoch": 0.85, "learning_rate": 3.2814122205980024e-05, "loss": 2.2249, "step": 135816 }, { "epoch": 0.85, "learning_rate": 3.280949623135868e-05, "loss": 2.2172, "step": 135824 }, { "epoch": 0.85, "learning_rate": 3.2804870932696316e-05, "loss": 2.2431, "step": 135832 }, { "epoch": 0.85, "learning_rate": 3.280024631010791e-05, "loss": 2.2298, "step": 135840 }, { "epoch": 0.85, "learning_rate": 3.2795622363708414e-05, "loss": 2.2489, "step": 135848 }, { "epoch": 0.85, "learning_rate": 3.279099909361281e-05, "loss": 2.2193, "step": 135856 }, { "epoch": 0.85, "learning_rate": 3.278637649993603e-05, "loss": 2.2297, "step": 135864 }, { "epoch": 0.85, "learning_rate": 3.278175458279297e-05, "loss": 2.2329, "step": 135872 }, { "epoch": 0.85, "learning_rate": 3.2777133342298535e-05, "loss": 2.2245, "step": 135880 }, { "epoch": 0.85, "learning_rate": 3.277251277856765e-05, "loss": 2.2495, "step": 135888 }, { "epoch": 0.85, "learning_rate": 3.2767892891715135e-05, "loss": 2.225, "step": 135896 }, { "epoch": 0.85, "learning_rate": 3.276327368185586e-05, "loss": 2.2323, "step": 135904 }, { "epoch": 0.85, "learning_rate": 3.275865514910466e-05, "loss": 2.2237, "step": 135912 }, { "epoch": 0.85, "learning_rate": 3.275403729357634e-05, "loss": 2.2236, "step": 135920 }, { "epoch": 0.85, "learning_rate": 3.274942011538572e-05, "loss": 2.2164, "step": 135928 }, { "epoch": 0.85, "learning_rate": 3.274480361464758e-05, "loss": 2.2198, "step": 135936 }, { "epoch": 0.85, "learning_rate": 3.274018779147666e-05, "loss": 2.2172, "step": 135944 }, { "epoch": 0.85, "learning_rate": 3.273557264598774e-05, "loss": 2.2491, "step": 135952 }, { "epoch": 0.85, "learning_rate": 3.273095817829554e-05, "loss": 2.2262, "step": 135960 }, { "epoch": 0.85, "learning_rate": 3.272634438851479e-05, "loss": 2.2258, "step": 135968 }, { "epoch": 0.85, "learning_rate": 3.272173127676017e-05, "loss": 2.2409, "step": 135976 }, { "epoch": 0.85, "learning_rate": 3.2717118843146355e-05, "loss": 2.2239, "step": 135984 }, { "epoch": 0.85, "learning_rate": 3.271250708778806e-05, "loss": 2.2223, "step": 135992 }, { "epoch": 0.85, "learning_rate": 3.2707896010799875e-05, "loss": 2.2271, "step": 136000 }, { "epoch": 0.85, "learning_rate": 3.270328561229646e-05, "loss": 2.2282, "step": 136008 }, { "epoch": 0.85, "learning_rate": 3.269867589239245e-05, "loss": 2.238, "step": 136016 }, { "epoch": 0.85, "learning_rate": 3.26940668512024e-05, "loss": 2.2184, "step": 136024 }, { "epoch": 0.85, "learning_rate": 3.2689458488840906e-05, "loss": 2.2347, "step": 136032 }, { "epoch": 0.85, "learning_rate": 3.268485080542255e-05, "loss": 2.2129, "step": 136040 }, { "epoch": 0.85, "learning_rate": 3.268024380106187e-05, "loss": 2.2517, "step": 136048 }, { "epoch": 0.85, "learning_rate": 3.267563747587339e-05, "loss": 2.2432, "step": 136056 }, { "epoch": 0.85, "learning_rate": 3.267103182997162e-05, "loss": 2.2316, "step": 136064 }, { "epoch": 0.85, "learning_rate": 3.266642686347108e-05, "loss": 2.2356, "step": 136072 }, { "epoch": 0.85, "learning_rate": 3.266182257648623e-05, "loss": 2.2231, "step": 136080 }, { "epoch": 0.85, "learning_rate": 3.265721896913153e-05, "loss": 2.2135, "step": 136088 }, { "epoch": 0.85, "learning_rate": 3.2652616041521443e-05, "loss": 2.2154, "step": 136096 }, { "epoch": 0.85, "learning_rate": 3.264801379377039e-05, "loss": 2.2189, "step": 136104 }, { "epoch": 0.85, "learning_rate": 3.264341222599277e-05, "loss": 2.2229, "step": 136112 }, { "epoch": 0.85, "learning_rate": 3.263881133830301e-05, "loss": 2.2044, "step": 136120 }, { "epoch": 0.85, "learning_rate": 3.263421113081546e-05, "loss": 2.2225, "step": 136128 }, { "epoch": 0.85, "learning_rate": 3.262961160364448e-05, "loss": 2.2263, "step": 136136 }, { "epoch": 0.85, "learning_rate": 3.262501275690445e-05, "loss": 2.2298, "step": 136144 }, { "epoch": 0.85, "learning_rate": 3.2620414590709666e-05, "loss": 2.2153, "step": 136152 }, { "epoch": 0.85, "learning_rate": 3.2615817105174435e-05, "loss": 2.2334, "step": 136160 }, { "epoch": 0.85, "learning_rate": 3.261122030041308e-05, "loss": 2.2389, "step": 136168 }, { "epoch": 0.85, "learning_rate": 3.260662417653984e-05, "loss": 2.2311, "step": 136176 }, { "epoch": 0.85, "learning_rate": 3.260202873366901e-05, "loss": 2.2534, "step": 136184 }, { "epoch": 0.85, "learning_rate": 3.259743397191483e-05, "loss": 2.2443, "step": 136192 }, { "epoch": 0.85, "learning_rate": 3.259283989139149e-05, "loss": 2.2208, "step": 136200 }, { "epoch": 0.85, "learning_rate": 3.2588246492213265e-05, "loss": 2.2308, "step": 136208 }, { "epoch": 0.85, "learning_rate": 3.2583653774494275e-05, "loss": 2.2614, "step": 136216 }, { "epoch": 0.85, "learning_rate": 3.257906173834873e-05, "loss": 2.2248, "step": 136224 }, { "epoch": 0.85, "learning_rate": 3.25744703838908e-05, "loss": 2.2401, "step": 136232 }, { "epoch": 0.85, "learning_rate": 3.256987971123461e-05, "loss": 2.2286, "step": 136240 }, { "epoch": 0.85, "learning_rate": 3.256528972049428e-05, "loss": 2.2349, "step": 136248 }, { "epoch": 0.85, "learning_rate": 3.256070041178393e-05, "loss": 2.2466, "step": 136256 }, { "epoch": 0.85, "learning_rate": 3.255611178521765e-05, "loss": 2.2399, "step": 136264 }, { "epoch": 0.85, "learning_rate": 3.2551523840909514e-05, "loss": 2.2233, "step": 136272 }, { "epoch": 0.85, "learning_rate": 3.2546936578973566e-05, "loss": 2.2301, "step": 136280 }, { "epoch": 0.85, "learning_rate": 3.254234999952386e-05, "loss": 2.231, "step": 136288 }, { "epoch": 0.85, "learning_rate": 3.253776410267441e-05, "loss": 2.2268, "step": 136296 }, { "epoch": 0.85, "learning_rate": 3.253317888853922e-05, "loss": 2.2274, "step": 136304 }, { "epoch": 0.85, "learning_rate": 3.252859435723229e-05, "loss": 2.2399, "step": 136312 }, { "epoch": 0.85, "learning_rate": 3.2524010508867596e-05, "loss": 2.2143, "step": 136320 }, { "epoch": 0.85, "learning_rate": 3.251942734355907e-05, "loss": 2.2301, "step": 136328 }, { "epoch": 0.85, "learning_rate": 3.2514844861420665e-05, "loss": 2.2208, "step": 136336 }, { "epoch": 0.85, "learning_rate": 3.251026306256631e-05, "loss": 2.2178, "step": 136344 }, { "epoch": 0.85, "learning_rate": 3.250568194710989e-05, "loss": 2.2355, "step": 136352 }, { "epoch": 0.85, "learning_rate": 3.2501101515165305e-05, "loss": 2.2462, "step": 136360 }, { "epoch": 0.85, "learning_rate": 3.2496521766846426e-05, "loss": 2.2158, "step": 136368 }, { "epoch": 0.85, "learning_rate": 3.249194270226709e-05, "loss": 2.222, "step": 136376 }, { "epoch": 0.85, "learning_rate": 3.248736432154116e-05, "loss": 2.2305, "step": 136384 }, { "epoch": 0.85, "learning_rate": 3.248278662478242e-05, "loss": 2.2202, "step": 136392 }, { "epoch": 0.85, "learning_rate": 3.247820961210471e-05, "loss": 2.2398, "step": 136400 }, { "epoch": 0.85, "learning_rate": 3.24736332836218e-05, "loss": 2.2273, "step": 136408 }, { "epoch": 0.85, "learning_rate": 3.246905763944743e-05, "loss": 2.2312, "step": 136416 }, { "epoch": 0.85, "learning_rate": 3.246448267969541e-05, "loss": 2.2385, "step": 136424 }, { "epoch": 0.85, "learning_rate": 3.2459908404479414e-05, "loss": 2.2134, "step": 136432 }, { "epoch": 0.85, "learning_rate": 3.245533481391319e-05, "loss": 2.2274, "step": 136440 }, { "epoch": 0.85, "learning_rate": 3.245076190811043e-05, "loss": 2.2497, "step": 136448 }, { "epoch": 0.85, "learning_rate": 3.244618968718484e-05, "loss": 2.2388, "step": 136456 }, { "epoch": 0.85, "learning_rate": 3.244161815125005e-05, "loss": 2.2322, "step": 136464 }, { "epoch": 0.85, "learning_rate": 3.243704730041972e-05, "loss": 2.2235, "step": 136472 }, { "epoch": 0.85, "learning_rate": 3.24324771348075e-05, "loss": 2.2306, "step": 136480 }, { "epoch": 0.85, "learning_rate": 3.2427907654526984e-05, "loss": 2.2164, "step": 136488 }, { "epoch": 0.85, "learning_rate": 3.242333885969177e-05, "loss": 2.2344, "step": 136496 }, { "epoch": 0.85, "learning_rate": 3.241877075041546e-05, "loss": 2.2201, "step": 136504 }, { "epoch": 0.85, "learning_rate": 3.2414203326811596e-05, "loss": 2.2365, "step": 136512 }, { "epoch": 0.85, "learning_rate": 3.240963658899373e-05, "loss": 2.2244, "step": 136520 }, { "epoch": 0.85, "learning_rate": 3.24050705370754e-05, "loss": 2.2337, "step": 136528 }, { "epoch": 0.85, "learning_rate": 3.2400505171170115e-05, "loss": 2.2209, "step": 136536 }, { "epoch": 0.85, "learning_rate": 3.239594049139136e-05, "loss": 2.2319, "step": 136544 }, { "epoch": 0.85, "learning_rate": 3.2391376497852624e-05, "loss": 2.2064, "step": 136552 }, { "epoch": 0.85, "learning_rate": 3.238681319066737e-05, "loss": 2.2261, "step": 136560 }, { "epoch": 0.85, "learning_rate": 3.238225056994903e-05, "loss": 2.2423, "step": 136568 }, { "epoch": 0.85, "learning_rate": 3.2377688635811045e-05, "loss": 2.225, "step": 136576 }, { "epoch": 0.85, "learning_rate": 3.237312738836681e-05, "loss": 2.2025, "step": 136584 }, { "epoch": 0.85, "learning_rate": 3.236856682772974e-05, "loss": 2.2462, "step": 136592 }, { "epoch": 0.85, "learning_rate": 3.23640069540132e-05, "loss": 2.2293, "step": 136600 }, { "epoch": 0.85, "learning_rate": 3.235944776733054e-05, "loss": 2.2418, "step": 136608 }, { "epoch": 0.85, "learning_rate": 3.235488926779513e-05, "loss": 2.2201, "step": 136616 }, { "epoch": 0.85, "learning_rate": 3.2350331455520244e-05, "loss": 2.222, "step": 136624 }, { "epoch": 0.85, "learning_rate": 3.2345774330619226e-05, "loss": 2.225, "step": 136632 }, { "epoch": 0.85, "learning_rate": 3.234121789320539e-05, "loss": 2.2349, "step": 136640 }, { "epoch": 0.85, "learning_rate": 3.233666214339195e-05, "loss": 2.2218, "step": 136648 }, { "epoch": 0.85, "learning_rate": 3.233210708129219e-05, "loss": 2.2234, "step": 136656 }, { "epoch": 0.85, "learning_rate": 3.232755270701937e-05, "loss": 2.2371, "step": 136664 }, { "epoch": 0.85, "learning_rate": 3.232299902068669e-05, "loss": 2.2424, "step": 136672 }, { "epoch": 0.85, "learning_rate": 3.231844602240737e-05, "loss": 2.2264, "step": 136680 }, { "epoch": 0.85, "learning_rate": 3.2313893712294566e-05, "loss": 2.2275, "step": 136688 }, { "epoch": 0.85, "learning_rate": 3.230934209046148e-05, "loss": 2.2289, "step": 136696 }, { "epoch": 0.85, "learning_rate": 3.230479115702127e-05, "loss": 2.2274, "step": 136704 }, { "epoch": 0.85, "learning_rate": 3.230024091208703e-05, "loss": 2.2245, "step": 136712 }, { "epoch": 0.85, "learning_rate": 3.2295691355771936e-05, "loss": 2.2354, "step": 136720 }, { "epoch": 0.85, "learning_rate": 3.229114248818905e-05, "loss": 2.2305, "step": 136728 }, { "epoch": 0.85, "learning_rate": 3.228659430945147e-05, "loss": 2.2283, "step": 136736 }, { "epoch": 0.85, "learning_rate": 3.228204681967227e-05, "loss": 2.2337, "step": 136744 }, { "epoch": 0.85, "learning_rate": 3.22775000189645e-05, "loss": 2.2239, "step": 136752 }, { "epoch": 0.85, "learning_rate": 3.227295390744118e-05, "loss": 2.2501, "step": 136760 }, { "epoch": 0.85, "learning_rate": 3.226840848521534e-05, "loss": 2.223, "step": 136768 }, { "epoch": 0.85, "learning_rate": 3.226386375239998e-05, "loss": 2.2171, "step": 136776 }, { "epoch": 0.85, "learning_rate": 3.225931970910807e-05, "loss": 2.2172, "step": 136784 }, { "epoch": 0.85, "learning_rate": 3.22547763554526e-05, "loss": 2.2138, "step": 136792 }, { "epoch": 0.85, "learning_rate": 3.225023369154648e-05, "loss": 2.2266, "step": 136800 }, { "epoch": 0.86, "learning_rate": 3.224569171750268e-05, "loss": 2.2445, "step": 136808 }, { "epoch": 0.86, "learning_rate": 3.22411504334341e-05, "loss": 2.2206, "step": 136816 }, { "epoch": 0.86, "learning_rate": 3.223660983945362e-05, "loss": 2.2313, "step": 136824 }, { "epoch": 0.86, "learning_rate": 3.223206993567416e-05, "loss": 2.2266, "step": 136832 }, { "epoch": 0.86, "learning_rate": 3.222753072220854e-05, "loss": 2.2228, "step": 136840 }, { "epoch": 0.86, "learning_rate": 3.222299219916961e-05, "loss": 2.2432, "step": 136848 }, { "epoch": 0.86, "learning_rate": 3.221845436667024e-05, "loss": 2.2415, "step": 136856 }, { "epoch": 0.86, "learning_rate": 3.2213917224823185e-05, "loss": 2.2286, "step": 136864 }, { "epoch": 0.86, "learning_rate": 3.220938077374127e-05, "loss": 2.2291, "step": 136872 }, { "epoch": 0.86, "learning_rate": 3.220484501353728e-05, "loss": 2.227, "step": 136880 }, { "epoch": 0.86, "learning_rate": 3.220030994432395e-05, "loss": 2.2401, "step": 136888 }, { "epoch": 0.86, "learning_rate": 3.219577556621405e-05, "loss": 2.2203, "step": 136896 }, { "epoch": 0.86, "learning_rate": 3.219124187932027e-05, "loss": 2.2349, "step": 136904 }, { "epoch": 0.86, "learning_rate": 3.2186708883755346e-05, "loss": 2.2374, "step": 136912 }, { "epoch": 0.86, "learning_rate": 3.2182176579631963e-05, "loss": 2.227, "step": 136920 }, { "epoch": 0.86, "learning_rate": 3.2177644967062776e-05, "loss": 2.2403, "step": 136928 }, { "epoch": 0.86, "learning_rate": 3.217311404616047e-05, "loss": 2.2277, "step": 136936 }, { "epoch": 0.86, "learning_rate": 3.216858381703767e-05, "loss": 2.2277, "step": 136944 }, { "epoch": 0.86, "learning_rate": 3.2164054279806994e-05, "loss": 2.2077, "step": 136952 }, { "epoch": 0.86, "learning_rate": 3.215952543458105e-05, "loss": 2.2205, "step": 136960 }, { "epoch": 0.86, "learning_rate": 3.215499728147244e-05, "loss": 2.2099, "step": 136968 }, { "epoch": 0.86, "learning_rate": 3.215046982059371e-05, "loss": 2.2264, "step": 136976 }, { "epoch": 0.86, "learning_rate": 3.214594305205742e-05, "loss": 2.2264, "step": 136984 }, { "epoch": 0.86, "learning_rate": 3.214141697597613e-05, "loss": 2.2329, "step": 136992 }, { "epoch": 0.86, "learning_rate": 3.213689159246232e-05, "loss": 2.2378, "step": 137000 }, { "epoch": 0.86, "learning_rate": 3.213236690162853e-05, "loss": 2.2232, "step": 137008 }, { "epoch": 0.86, "learning_rate": 3.2127842903587205e-05, "loss": 2.2307, "step": 137016 }, { "epoch": 0.86, "learning_rate": 3.2123319598450844e-05, "loss": 2.2489, "step": 137024 }, { "epoch": 0.86, "learning_rate": 3.211879698633189e-05, "loss": 2.244, "step": 137032 }, { "epoch": 0.86, "learning_rate": 3.211427506734276e-05, "loss": 2.2403, "step": 137040 }, { "epoch": 0.86, "learning_rate": 3.2109753841595904e-05, "loss": 2.2144, "step": 137048 }, { "epoch": 0.86, "learning_rate": 3.210523330920367e-05, "loss": 2.2196, "step": 137056 }, { "epoch": 0.86, "learning_rate": 3.2100713470278464e-05, "loss": 2.2447, "step": 137064 }, { "epoch": 0.86, "learning_rate": 3.209619432493267e-05, "loss": 2.2285, "step": 137072 }, { "epoch": 0.86, "learning_rate": 3.209167587327861e-05, "loss": 2.2394, "step": 137080 }, { "epoch": 0.86, "learning_rate": 3.208715811542862e-05, "loss": 2.227, "step": 137088 }, { "epoch": 0.86, "learning_rate": 3.2082641051495e-05, "loss": 2.2501, "step": 137096 }, { "epoch": 0.86, "learning_rate": 3.2078124681590065e-05, "loss": 2.2443, "step": 137104 }, { "epoch": 0.86, "learning_rate": 3.207360900582609e-05, "loss": 2.2309, "step": 137112 }, { "epoch": 0.86, "learning_rate": 3.206909402431531e-05, "loss": 2.2372, "step": 137120 }, { "epoch": 0.86, "learning_rate": 3.206457973717e-05, "loss": 2.2419, "step": 137128 }, { "epoch": 0.86, "learning_rate": 3.206006614450238e-05, "loss": 2.2217, "step": 137136 }, { "epoch": 0.86, "learning_rate": 3.205555324642462e-05, "loss": 2.2065, "step": 137144 }, { "epoch": 0.86, "learning_rate": 3.2051041043048966e-05, "loss": 2.232, "step": 137152 }, { "epoch": 0.86, "learning_rate": 3.2046529534487566e-05, "loss": 2.2126, "step": 137160 }, { "epoch": 0.86, "learning_rate": 3.2042018720852575e-05, "loss": 2.234, "step": 137168 }, { "epoch": 0.86, "learning_rate": 3.203750860225614e-05, "loss": 2.2478, "step": 137176 }, { "epoch": 0.86, "learning_rate": 3.203299917881038e-05, "loss": 2.2221, "step": 137184 }, { "epoch": 0.86, "learning_rate": 3.2028490450627375e-05, "loss": 2.2274, "step": 137192 }, { "epoch": 0.86, "learning_rate": 3.202398241781926e-05, "loss": 2.2199, "step": 137200 }, { "epoch": 0.86, "learning_rate": 3.201947508049807e-05, "loss": 2.2324, "step": 137208 }, { "epoch": 0.86, "learning_rate": 3.201496843877587e-05, "loss": 2.2252, "step": 137216 }, { "epoch": 0.86, "learning_rate": 3.20104624927647e-05, "loss": 2.2434, "step": 137224 }, { "epoch": 0.86, "learning_rate": 3.2005957242576555e-05, "loss": 2.2372, "step": 137232 }, { "epoch": 0.86, "learning_rate": 3.200145268832348e-05, "loss": 2.2297, "step": 137240 }, { "epoch": 0.86, "learning_rate": 3.1996948830117425e-05, "loss": 2.2299, "step": 137248 }, { "epoch": 0.86, "learning_rate": 3.199244566807035e-05, "loss": 2.2257, "step": 137256 }, { "epoch": 0.86, "learning_rate": 3.198794320229424e-05, "loss": 2.224, "step": 137264 }, { "epoch": 0.86, "learning_rate": 3.1983441432900984e-05, "loss": 2.2436, "step": 137272 }, { "epoch": 0.86, "learning_rate": 3.197894036000252e-05, "loss": 2.2256, "step": 137280 }, { "epoch": 0.86, "learning_rate": 3.197443998371075e-05, "loss": 2.224, "step": 137288 }, { "epoch": 0.86, "learning_rate": 3.196994030413755e-05, "loss": 2.2342, "step": 137296 }, { "epoch": 0.86, "learning_rate": 3.1965441321394776e-05, "loss": 2.2381, "step": 137304 }, { "epoch": 0.86, "learning_rate": 3.196094303559427e-05, "loss": 2.2325, "step": 137312 }, { "epoch": 0.86, "learning_rate": 3.1956445446847875e-05, "loss": 2.2302, "step": 137320 }, { "epoch": 0.86, "learning_rate": 3.195194855526739e-05, "loss": 2.225, "step": 137328 }, { "epoch": 0.86, "learning_rate": 3.19474523609646e-05, "loss": 2.2359, "step": 137336 }, { "epoch": 0.86, "learning_rate": 3.1942956864051305e-05, "loss": 2.2382, "step": 137344 }, { "epoch": 0.86, "learning_rate": 3.1938462064639255e-05, "loss": 2.231, "step": 137352 }, { "epoch": 0.86, "learning_rate": 3.193396796284016e-05, "loss": 2.2291, "step": 137360 }, { "epoch": 0.86, "learning_rate": 3.192947455876579e-05, "loss": 2.2365, "step": 137368 }, { "epoch": 0.86, "learning_rate": 3.192498185252784e-05, "loss": 2.2143, "step": 137376 }, { "epoch": 0.86, "learning_rate": 3.1920489844237966e-05, "loss": 2.225, "step": 137384 }, { "epoch": 0.86, "learning_rate": 3.191599853400788e-05, "loss": 2.2208, "step": 137392 }, { "epoch": 0.86, "learning_rate": 3.191150792194924e-05, "loss": 2.2417, "step": 137400 }, { "epoch": 0.86, "learning_rate": 3.190701800817363e-05, "loss": 2.2419, "step": 137408 }, { "epoch": 0.86, "learning_rate": 3.190252879279272e-05, "loss": 2.2329, "step": 137416 }, { "epoch": 0.86, "learning_rate": 3.18980402759181e-05, "loss": 2.2378, "step": 137424 }, { "epoch": 0.86, "learning_rate": 3.1893552457661345e-05, "loss": 2.2333, "step": 137432 }, { "epoch": 0.86, "learning_rate": 3.188906533813403e-05, "loss": 2.2293, "step": 137440 }, { "epoch": 0.86, "learning_rate": 3.188457891744771e-05, "loss": 2.2464, "step": 137448 }, { "epoch": 0.86, "learning_rate": 3.188009319571392e-05, "loss": 2.2307, "step": 137456 }, { "epoch": 0.86, "learning_rate": 3.1875608173044154e-05, "loss": 2.227, "step": 137464 }, { "epoch": 0.86, "learning_rate": 3.187112384954992e-05, "loss": 2.226, "step": 137472 }, { "epoch": 0.86, "learning_rate": 3.186664022534273e-05, "loss": 2.2201, "step": 137480 }, { "epoch": 0.86, "learning_rate": 3.186215730053399e-05, "loss": 2.2197, "step": 137488 }, { "epoch": 0.86, "learning_rate": 3.185767507523518e-05, "loss": 2.223, "step": 137496 }, { "epoch": 0.86, "learning_rate": 3.185319354955774e-05, "loss": 2.2189, "step": 137504 }, { "epoch": 0.86, "learning_rate": 3.1848712723613056e-05, "loss": 2.2397, "step": 137512 }, { "epoch": 0.86, "learning_rate": 3.184423259751255e-05, "loss": 2.2377, "step": 137520 }, { "epoch": 0.86, "learning_rate": 3.1839753171367557e-05, "loss": 2.2393, "step": 137528 }, { "epoch": 0.86, "learning_rate": 3.183527444528947e-05, "loss": 2.2477, "step": 137536 }, { "epoch": 0.86, "learning_rate": 3.1830796419389617e-05, "loss": 2.2356, "step": 137544 }, { "epoch": 0.86, "learning_rate": 3.182631909377932e-05, "loss": 2.2219, "step": 137552 }, { "epoch": 0.86, "learning_rate": 3.182184246856991e-05, "loss": 2.226, "step": 137560 }, { "epoch": 0.86, "learning_rate": 3.181736654387265e-05, "loss": 2.2302, "step": 137568 }, { "epoch": 0.86, "learning_rate": 3.181289131979881e-05, "loss": 2.2142, "step": 137576 }, { "epoch": 0.86, "learning_rate": 3.180841679645966e-05, "loss": 2.2342, "step": 137584 }, { "epoch": 0.86, "learning_rate": 3.1803942973966435e-05, "loss": 2.2279, "step": 137592 }, { "epoch": 0.86, "learning_rate": 3.1799469852430344e-05, "loss": 2.2214, "step": 137600 }, { "epoch": 0.86, "learning_rate": 3.1794997431962607e-05, "loss": 2.2347, "step": 137608 }, { "epoch": 0.86, "learning_rate": 3.1790525712674394e-05, "loss": 2.2224, "step": 137616 }, { "epoch": 0.86, "learning_rate": 3.178605469467687e-05, "loss": 2.2294, "step": 137624 }, { "epoch": 0.86, "learning_rate": 3.17815843780812e-05, "loss": 2.2347, "step": 137632 }, { "epoch": 0.86, "learning_rate": 3.17771147629985e-05, "loss": 2.2361, "step": 137640 }, { "epoch": 0.86, "learning_rate": 3.17726458495399e-05, "loss": 2.2188, "step": 137648 }, { "epoch": 0.86, "learning_rate": 3.1768177637816496e-05, "loss": 2.227, "step": 137656 }, { "epoch": 0.86, "learning_rate": 3.176371012793935e-05, "loss": 2.2219, "step": 137664 }, { "epoch": 0.86, "learning_rate": 3.175924332001956e-05, "loss": 2.2379, "step": 137672 }, { "epoch": 0.86, "learning_rate": 3.175477721416813e-05, "loss": 2.2292, "step": 137680 }, { "epoch": 0.86, "learning_rate": 3.175031181049611e-05, "loss": 2.2507, "step": 137688 }, { "epoch": 0.86, "learning_rate": 3.1745847109114526e-05, "loss": 2.2528, "step": 137696 }, { "epoch": 0.86, "learning_rate": 3.174138311013433e-05, "loss": 2.2266, "step": 137704 }, { "epoch": 0.86, "learning_rate": 3.173691981366652e-05, "loss": 2.2268, "step": 137712 }, { "epoch": 0.86, "learning_rate": 3.173245721982207e-05, "loss": 2.2338, "step": 137720 }, { "epoch": 0.86, "learning_rate": 3.17279953287119e-05, "loss": 2.2317, "step": 137728 }, { "epoch": 0.86, "learning_rate": 3.172353414044694e-05, "loss": 2.239, "step": 137736 }, { "epoch": 0.86, "learning_rate": 3.171907365513808e-05, "loss": 2.2237, "step": 137744 }, { "epoch": 0.86, "learning_rate": 3.171461387289624e-05, "loss": 2.2255, "step": 137752 }, { "epoch": 0.86, "learning_rate": 3.171015479383227e-05, "loss": 2.2267, "step": 137760 }, { "epoch": 0.86, "learning_rate": 3.170569641805701e-05, "loss": 2.2438, "step": 137768 }, { "epoch": 0.86, "learning_rate": 3.1701238745681326e-05, "loss": 2.2218, "step": 137776 }, { "epoch": 0.86, "learning_rate": 3.169678177681602e-05, "loss": 2.2253, "step": 137784 }, { "epoch": 0.86, "learning_rate": 3.169232551157189e-05, "loss": 2.2209, "step": 137792 }, { "epoch": 0.86, "learning_rate": 3.168786995005973e-05, "loss": 2.2439, "step": 137800 }, { "epoch": 0.86, "learning_rate": 3.16834150923903e-05, "loss": 2.2179, "step": 137808 }, { "epoch": 0.86, "learning_rate": 3.167896093867433e-05, "loss": 2.2375, "step": 137816 }, { "epoch": 0.86, "learning_rate": 3.1674507489022596e-05, "loss": 2.2259, "step": 137824 }, { "epoch": 0.86, "learning_rate": 3.1670054743545776e-05, "loss": 2.2346, "step": 137832 }, { "epoch": 0.86, "learning_rate": 3.166560270235456e-05, "loss": 2.2283, "step": 137840 }, { "epoch": 0.86, "learning_rate": 3.166115136555965e-05, "loss": 2.2209, "step": 137848 }, { "epoch": 0.86, "learning_rate": 3.165670073327169e-05, "loss": 2.2427, "step": 137856 }, { "epoch": 0.86, "learning_rate": 3.165225080560134e-05, "loss": 2.2228, "step": 137864 }, { "epoch": 0.86, "learning_rate": 3.164780158265921e-05, "loss": 2.2118, "step": 137872 }, { "epoch": 0.86, "learning_rate": 3.1643353064555905e-05, "loss": 2.2284, "step": 137880 }, { "epoch": 0.86, "learning_rate": 3.163890525140205e-05, "loss": 2.2287, "step": 137888 }, { "epoch": 0.86, "learning_rate": 3.1634458143308165e-05, "loss": 2.2247, "step": 137896 }, { "epoch": 0.86, "learning_rate": 3.163001174038484e-05, "loss": 2.2247, "step": 137904 }, { "epoch": 0.86, "learning_rate": 3.162556604274263e-05, "loss": 2.2289, "step": 137912 }, { "epoch": 0.86, "learning_rate": 3.1621121050492e-05, "loss": 2.2344, "step": 137920 }, { "epoch": 0.86, "learning_rate": 3.1616676763743485e-05, "loss": 2.2117, "step": 137928 }, { "epoch": 0.86, "learning_rate": 3.161223318260759e-05, "loss": 2.2135, "step": 137936 }, { "epoch": 0.86, "learning_rate": 3.160779030719476e-05, "loss": 2.245, "step": 137944 }, { "epoch": 0.86, "learning_rate": 3.1603348137615445e-05, "loss": 2.2132, "step": 137952 }, { "epoch": 0.86, "learning_rate": 3.159890667398007e-05, "loss": 2.2247, "step": 137960 }, { "epoch": 0.86, "learning_rate": 3.159446591639907e-05, "loss": 2.2172, "step": 137968 }, { "epoch": 0.86, "learning_rate": 3.1590025864982845e-05, "loss": 2.2319, "step": 137976 }, { "epoch": 0.86, "learning_rate": 3.1585586519841744e-05, "loss": 2.2317, "step": 137984 }, { "epoch": 0.86, "learning_rate": 3.158114788108617e-05, "loss": 2.235, "step": 137992 }, { "epoch": 0.86, "learning_rate": 3.157670994882644e-05, "loss": 2.2323, "step": 138000 }, { "epoch": 0.86, "learning_rate": 3.1572272723172884e-05, "loss": 2.2264, "step": 138008 }, { "epoch": 0.86, "learning_rate": 3.156783620423582e-05, "loss": 2.2173, "step": 138016 }, { "epoch": 0.86, "learning_rate": 3.156340039212555e-05, "loss": 2.2307, "step": 138024 }, { "epoch": 0.86, "learning_rate": 3.1558965286952324e-05, "loss": 2.2371, "step": 138032 }, { "epoch": 0.86, "learning_rate": 3.155453088882642e-05, "loss": 2.2261, "step": 138040 }, { "epoch": 0.86, "learning_rate": 3.155009719785807e-05, "loss": 2.232, "step": 138048 }, { "epoch": 0.86, "learning_rate": 3.1545664214157475e-05, "loss": 2.2153, "step": 138056 }, { "epoch": 0.86, "learning_rate": 3.1541231937834886e-05, "loss": 2.2331, "step": 138064 }, { "epoch": 0.86, "learning_rate": 3.153680036900044e-05, "loss": 2.2282, "step": 138072 }, { "epoch": 0.86, "learning_rate": 3.1532369507764354e-05, "loss": 2.2413, "step": 138080 }, { "epoch": 0.86, "learning_rate": 3.152793935423675e-05, "loss": 2.2162, "step": 138088 }, { "epoch": 0.86, "learning_rate": 3.152350990852775e-05, "loss": 2.239, "step": 138096 }, { "epoch": 0.86, "learning_rate": 3.1519081170747526e-05, "loss": 2.2196, "step": 138104 }, { "epoch": 0.86, "learning_rate": 3.1514653141006106e-05, "loss": 2.2288, "step": 138112 }, { "epoch": 0.86, "learning_rate": 3.1510225819413605e-05, "loss": 2.2301, "step": 138120 }, { "epoch": 0.86, "learning_rate": 3.1505799206080104e-05, "loss": 2.2211, "step": 138128 }, { "epoch": 0.86, "learning_rate": 3.1501373301115634e-05, "loss": 2.2217, "step": 138136 }, { "epoch": 0.86, "learning_rate": 3.149694810463022e-05, "loss": 2.2254, "step": 138144 }, { "epoch": 0.86, "learning_rate": 3.149252361673385e-05, "loss": 2.2161, "step": 138152 }, { "epoch": 0.86, "learning_rate": 3.148809983753657e-05, "loss": 2.212, "step": 138160 }, { "epoch": 0.86, "learning_rate": 3.148367676714832e-05, "loss": 2.2304, "step": 138168 }, { "epoch": 0.86, "learning_rate": 3.147925440567905e-05, "loss": 2.2322, "step": 138176 }, { "epoch": 0.86, "learning_rate": 3.1474832753238726e-05, "loss": 2.2278, "step": 138184 }, { "epoch": 0.86, "learning_rate": 3.147041180993726e-05, "loss": 2.2219, "step": 138192 }, { "epoch": 0.86, "learning_rate": 3.146599157588455e-05, "loss": 2.228, "step": 138200 }, { "epoch": 0.86, "learning_rate": 3.1461572051190504e-05, "loss": 2.2236, "step": 138208 }, { "epoch": 0.86, "learning_rate": 3.1457153235964974e-05, "loss": 2.2334, "step": 138216 }, { "epoch": 0.86, "learning_rate": 3.1452735130317815e-05, "loss": 2.2224, "step": 138224 }, { "epoch": 0.86, "learning_rate": 3.1448317734358864e-05, "loss": 2.2239, "step": 138232 }, { "epoch": 0.86, "learning_rate": 3.1443901048197945e-05, "loss": 2.238, "step": 138240 }, { "epoch": 0.86, "learning_rate": 3.143948507194483e-05, "loss": 2.228, "step": 138248 }, { "epoch": 0.86, "learning_rate": 3.1435069805709335e-05, "loss": 2.2306, "step": 138256 }, { "epoch": 0.86, "learning_rate": 3.1430655249601217e-05, "loss": 2.2374, "step": 138264 }, { "epoch": 0.86, "learning_rate": 3.14262414037302e-05, "loss": 2.2188, "step": 138272 }, { "epoch": 0.86, "learning_rate": 3.142182826820603e-05, "loss": 2.215, "step": 138280 }, { "epoch": 0.86, "learning_rate": 3.1417415843138415e-05, "loss": 2.2345, "step": 138288 }, { "epoch": 0.86, "learning_rate": 3.141300412863706e-05, "loss": 2.2296, "step": 138296 }, { "epoch": 0.86, "learning_rate": 3.1408593124811616e-05, "loss": 2.2299, "step": 138304 }, { "epoch": 0.86, "learning_rate": 3.1404182831771755e-05, "loss": 2.2302, "step": 138312 }, { "epoch": 0.86, "learning_rate": 3.1399773249627145e-05, "loss": 2.2305, "step": 138320 }, { "epoch": 0.86, "learning_rate": 3.139536437848735e-05, "loss": 2.2212, "step": 138328 }, { "epoch": 0.86, "learning_rate": 3.1390956218462006e-05, "loss": 2.2193, "step": 138336 }, { "epoch": 0.86, "learning_rate": 3.1386548769660716e-05, "loss": 2.2295, "step": 138344 }, { "epoch": 0.86, "learning_rate": 3.138214203219303e-05, "loss": 2.2301, "step": 138352 }, { "epoch": 0.86, "learning_rate": 3.137773600616851e-05, "loss": 2.2276, "step": 138360 }, { "epoch": 0.86, "learning_rate": 3.137333069169666e-05, "loss": 2.2147, "step": 138368 }, { "epoch": 0.86, "learning_rate": 3.136892608888704e-05, "loss": 2.2047, "step": 138376 }, { "epoch": 0.86, "learning_rate": 3.136452219784913e-05, "loss": 2.2269, "step": 138384 }, { "epoch": 0.86, "learning_rate": 3.13601190186924e-05, "loss": 2.2225, "step": 138392 }, { "epoch": 0.86, "learning_rate": 3.135571655152634e-05, "loss": 2.2321, "step": 138400 }, { "epoch": 0.87, "learning_rate": 3.135131479646038e-05, "loss": 2.2323, "step": 138408 }, { "epoch": 0.87, "learning_rate": 3.134691375360393e-05, "loss": 2.2215, "step": 138416 }, { "epoch": 0.87, "learning_rate": 3.134251342306643e-05, "loss": 2.2275, "step": 138424 }, { "epoch": 0.87, "learning_rate": 3.133811380495727e-05, "loss": 2.2078, "step": 138432 }, { "epoch": 0.87, "learning_rate": 3.13337148993858e-05, "loss": 2.2343, "step": 138440 }, { "epoch": 0.87, "learning_rate": 3.13293167064614e-05, "loss": 2.2287, "step": 138448 }, { "epoch": 0.87, "learning_rate": 3.132491922629341e-05, "loss": 2.1978, "step": 138456 }, { "epoch": 0.87, "learning_rate": 3.1320522458991135e-05, "loss": 2.2234, "step": 138464 }, { "epoch": 0.87, "learning_rate": 3.1316126404663907e-05, "loss": 2.2243, "step": 138472 }, { "epoch": 0.87, "learning_rate": 3.131173106342097e-05, "loss": 2.2392, "step": 138480 }, { "epoch": 0.87, "learning_rate": 3.130733643537163e-05, "loss": 2.2194, "step": 138488 }, { "epoch": 0.87, "learning_rate": 3.130294252062513e-05, "loss": 2.2361, "step": 138496 }, { "epoch": 0.87, "learning_rate": 3.129854931929069e-05, "loss": 2.226, "step": 138504 }, { "epoch": 0.87, "learning_rate": 3.1294156831477555e-05, "loss": 2.2204, "step": 138512 }, { "epoch": 0.87, "learning_rate": 3.128976505729488e-05, "loss": 2.2214, "step": 138520 }, { "epoch": 0.87, "learning_rate": 3.128537399685186e-05, "loss": 2.2291, "step": 138528 }, { "epoch": 0.87, "learning_rate": 3.1280983650257694e-05, "loss": 2.208, "step": 138536 }, { "epoch": 0.87, "learning_rate": 3.127659401762147e-05, "loss": 2.2167, "step": 138544 }, { "epoch": 0.87, "learning_rate": 3.127220509905234e-05, "loss": 2.2215, "step": 138552 }, { "epoch": 0.87, "learning_rate": 3.126781689465944e-05, "loss": 2.2222, "step": 138560 }, { "epoch": 0.87, "learning_rate": 3.126342940455182e-05, "loss": 2.2318, "step": 138568 }, { "epoch": 0.87, "learning_rate": 3.1259042628838576e-05, "loss": 2.2245, "step": 138576 }, { "epoch": 0.87, "learning_rate": 3.125465656762874e-05, "loss": 2.2468, "step": 138584 }, { "epoch": 0.87, "learning_rate": 3.1250271221031386e-05, "loss": 2.2233, "step": 138592 }, { "epoch": 0.87, "learning_rate": 3.12458865891555e-05, "loss": 2.2208, "step": 138600 }, { "epoch": 0.87, "learning_rate": 3.124150267211011e-05, "loss": 2.2436, "step": 138608 }, { "epoch": 0.87, "learning_rate": 3.123711947000418e-05, "loss": 2.2371, "step": 138616 }, { "epoch": 0.87, "learning_rate": 3.123273698294671e-05, "loss": 2.2178, "step": 138624 }, { "epoch": 0.87, "learning_rate": 3.12283552110466e-05, "loss": 2.2105, "step": 138632 }, { "epoch": 0.87, "learning_rate": 3.122397415441282e-05, "loss": 2.2274, "step": 138640 }, { "epoch": 0.87, "learning_rate": 3.121959381315427e-05, "loss": 2.2289, "step": 138648 }, { "epoch": 0.87, "learning_rate": 3.121521418737984e-05, "loss": 2.2298, "step": 138656 }, { "epoch": 0.87, "learning_rate": 3.121083527719842e-05, "loss": 2.2262, "step": 138664 }, { "epoch": 0.87, "learning_rate": 3.1206457082718875e-05, "loss": 2.2173, "step": 138672 }, { "epoch": 0.87, "learning_rate": 3.120207960405001e-05, "loss": 2.2196, "step": 138680 }, { "epoch": 0.87, "learning_rate": 3.119770284130071e-05, "loss": 2.2174, "step": 138688 }, { "epoch": 0.87, "learning_rate": 3.119332679457972e-05, "loss": 2.2221, "step": 138696 }, { "epoch": 0.87, "learning_rate": 3.118895146399588e-05, "loss": 2.2296, "step": 138704 }, { "epoch": 0.87, "learning_rate": 3.118457684965794e-05, "loss": 2.2294, "step": 138712 }, { "epoch": 0.87, "learning_rate": 3.1180202951674634e-05, "loss": 2.2418, "step": 138720 }, { "epoch": 0.87, "learning_rate": 3.117582977015474e-05, "loss": 2.2334, "step": 138728 }, { "epoch": 0.87, "learning_rate": 3.117145730520693e-05, "loss": 2.2139, "step": 138736 }, { "epoch": 0.87, "learning_rate": 3.1167085556939925e-05, "loss": 2.2177, "step": 138744 }, { "epoch": 0.87, "learning_rate": 3.1162714525462436e-05, "loss": 2.2226, "step": 138752 }, { "epoch": 0.87, "learning_rate": 3.1158344210883065e-05, "loss": 2.2161, "step": 138760 }, { "epoch": 0.87, "learning_rate": 3.1153974613310505e-05, "loss": 2.2218, "step": 138768 }, { "epoch": 0.87, "learning_rate": 3.114960573285338e-05, "loss": 2.2369, "step": 138776 }, { "epoch": 0.87, "learning_rate": 3.114523756962029e-05, "loss": 2.2177, "step": 138784 }, { "epoch": 0.87, "learning_rate": 3.114087012371984e-05, "loss": 2.2319, "step": 138792 }, { "epoch": 0.87, "learning_rate": 3.113650339526058e-05, "loss": 2.2339, "step": 138800 }, { "epoch": 0.87, "learning_rate": 3.113213738435109e-05, "loss": 2.2315, "step": 138808 }, { "epoch": 0.87, "learning_rate": 3.112777209109991e-05, "loss": 2.231, "step": 138816 }, { "epoch": 0.87, "learning_rate": 3.1123407515615545e-05, "loss": 2.2089, "step": 138824 }, { "epoch": 0.87, "learning_rate": 3.1119043658006516e-05, "loss": 2.217, "step": 138832 }, { "epoch": 0.87, "learning_rate": 3.11146805183813e-05, "loss": 2.2187, "step": 138840 }, { "epoch": 0.87, "learning_rate": 3.111031809684836e-05, "loss": 2.2219, "step": 138848 }, { "epoch": 0.87, "learning_rate": 3.110595639351617e-05, "loss": 2.2027, "step": 138856 }, { "epoch": 0.87, "learning_rate": 3.110159540849313e-05, "loss": 2.2357, "step": 138864 }, { "epoch": 0.87, "learning_rate": 3.1097235141887675e-05, "loss": 2.2173, "step": 138872 }, { "epoch": 0.87, "learning_rate": 3.10928755938082e-05, "loss": 2.2135, "step": 138880 }, { "epoch": 0.87, "learning_rate": 3.108851676436308e-05, "loss": 2.2176, "step": 138888 }, { "epoch": 0.87, "learning_rate": 3.108415865366068e-05, "loss": 2.2216, "step": 138896 }, { "epoch": 0.87, "learning_rate": 3.1079801261809335e-05, "loss": 2.2302, "step": 138904 }, { "epoch": 0.87, "learning_rate": 3.1075444588917374e-05, "loss": 2.1962, "step": 138912 }, { "epoch": 0.87, "learning_rate": 3.1071088635093115e-05, "loss": 2.2367, "step": 138920 }, { "epoch": 0.87, "learning_rate": 3.1066733400444837e-05, "loss": 2.2049, "step": 138928 }, { "epoch": 0.87, "learning_rate": 3.10623788850808e-05, "loss": 2.2169, "step": 138936 }, { "epoch": 0.87, "learning_rate": 3.105802508910929e-05, "loss": 2.2304, "step": 138944 }, { "epoch": 0.87, "learning_rate": 3.105367201263851e-05, "loss": 2.2174, "step": 138952 }, { "epoch": 0.87, "learning_rate": 3.104931965577669e-05, "loss": 2.2107, "step": 138960 }, { "epoch": 0.87, "learning_rate": 3.104496801863205e-05, "loss": 2.2171, "step": 138968 }, { "epoch": 0.87, "learning_rate": 3.104061710131273e-05, "loss": 2.2387, "step": 138976 }, { "epoch": 0.87, "learning_rate": 3.103626690392694e-05, "loss": 2.218, "step": 138984 }, { "epoch": 0.87, "learning_rate": 3.103191742658278e-05, "loss": 2.212, "step": 138992 }, { "epoch": 0.87, "learning_rate": 3.102756866938842e-05, "loss": 2.2239, "step": 139000 }, { "epoch": 0.87, "learning_rate": 3.1023220632451956e-05, "loss": 2.23, "step": 139008 }, { "epoch": 0.87, "learning_rate": 3.101887331588146e-05, "loss": 2.2243, "step": 139016 }, { "epoch": 0.87, "learning_rate": 3.1014526719785035e-05, "loss": 2.2242, "step": 139024 }, { "epoch": 0.87, "learning_rate": 3.1010180844270734e-05, "loss": 2.2263, "step": 139032 }, { "epoch": 0.87, "learning_rate": 3.100583568944658e-05, "loss": 2.2303, "step": 139040 }, { "epoch": 0.87, "learning_rate": 3.100149125542061e-05, "loss": 2.2034, "step": 139048 }, { "epoch": 0.87, "learning_rate": 3.099714754230083e-05, "loss": 2.2174, "step": 139056 }, { "epoch": 0.87, "learning_rate": 3.0992804550195194e-05, "loss": 2.2031, "step": 139064 }, { "epoch": 0.87, "learning_rate": 3.0988462279211705e-05, "loss": 2.2166, "step": 139072 }, { "epoch": 0.87, "learning_rate": 3.09841207294583e-05, "loss": 2.219, "step": 139080 }, { "epoch": 0.87, "learning_rate": 3.09797799010429e-05, "loss": 2.2025, "step": 139088 }, { "epoch": 0.87, "learning_rate": 3.0975439794073434e-05, "loss": 2.2312, "step": 139096 }, { "epoch": 0.87, "learning_rate": 3.09711004086578e-05, "loss": 2.2304, "step": 139104 }, { "epoch": 0.87, "learning_rate": 3.096676174490385e-05, "loss": 2.2231, "step": 139112 }, { "epoch": 0.87, "learning_rate": 3.0962423802919475e-05, "loss": 2.214, "step": 139120 }, { "epoch": 0.87, "learning_rate": 3.095808658281248e-05, "loss": 2.231, "step": 139128 }, { "epoch": 0.87, "learning_rate": 3.095375008469073e-05, "loss": 2.2088, "step": 139136 }, { "epoch": 0.87, "learning_rate": 3.094941430866201e-05, "loss": 2.2199, "step": 139144 }, { "epoch": 0.87, "learning_rate": 3.09450792548341e-05, "loss": 2.2256, "step": 139152 }, { "epoch": 0.87, "learning_rate": 3.094074492331481e-05, "loss": 2.2266, "step": 139160 }, { "epoch": 0.87, "learning_rate": 3.093641131421183e-05, "loss": 2.225, "step": 139168 }, { "epoch": 0.87, "learning_rate": 3.0932078427632926e-05, "loss": 2.2125, "step": 139176 }, { "epoch": 0.87, "learning_rate": 3.092774626368583e-05, "loss": 2.2193, "step": 139184 }, { "epoch": 0.87, "learning_rate": 3.0923414822478215e-05, "loss": 2.2309, "step": 139192 }, { "epoch": 0.87, "learning_rate": 3.0919084104117774e-05, "loss": 2.218, "step": 139200 }, { "epoch": 0.87, "learning_rate": 3.091475410871216e-05, "loss": 2.2301, "step": 139208 }, { "epoch": 0.87, "learning_rate": 3.091042483636902e-05, "loss": 2.2271, "step": 139216 }, { "epoch": 0.87, "learning_rate": 3.0906096287195995e-05, "loss": 2.2301, "step": 139224 }, { "epoch": 0.87, "learning_rate": 3.0901768461300664e-05, "loss": 2.2322, "step": 139232 }, { "epoch": 0.87, "learning_rate": 3.0897441358790646e-05, "loss": 2.2384, "step": 139240 }, { "epoch": 0.87, "learning_rate": 3.0893114979773495e-05, "loss": 2.2192, "step": 139248 }, { "epoch": 0.87, "learning_rate": 3.088878932435677e-05, "loss": 2.2349, "step": 139256 }, { "epoch": 0.87, "learning_rate": 3.088446439264802e-05, "loss": 2.2119, "step": 139264 }, { "epoch": 0.87, "learning_rate": 3.0880140184754744e-05, "loss": 2.228, "step": 139272 }, { "epoch": 0.87, "learning_rate": 3.087581670078444e-05, "loss": 2.2304, "step": 139280 }, { "epoch": 0.87, "learning_rate": 3.0871493940844616e-05, "loss": 2.23, "step": 139288 }, { "epoch": 0.87, "learning_rate": 3.086717190504272e-05, "loss": 2.2373, "step": 139296 }, { "epoch": 0.87, "learning_rate": 3.0862850593486186e-05, "loss": 2.2273, "step": 139304 }, { "epoch": 0.87, "learning_rate": 3.085853000628247e-05, "loss": 2.2246, "step": 139312 }, { "epoch": 0.87, "learning_rate": 3.0854210143538956e-05, "loss": 2.2168, "step": 139320 }, { "epoch": 0.87, "learning_rate": 3.084989100536305e-05, "loss": 2.2429, "step": 139328 }, { "epoch": 0.87, "learning_rate": 3.084557259186213e-05, "loss": 2.2195, "step": 139336 }, { "epoch": 0.87, "learning_rate": 3.084125490314353e-05, "loss": 2.2152, "step": 139344 }, { "epoch": 0.87, "learning_rate": 3.083693793931464e-05, "loss": 2.2312, "step": 139352 }, { "epoch": 0.87, "learning_rate": 3.083262170048272e-05, "loss": 2.2232, "step": 139360 }, { "epoch": 0.87, "learning_rate": 3.082830618675509e-05, "loss": 2.2249, "step": 139368 }, { "epoch": 0.87, "learning_rate": 3.082399139823906e-05, "loss": 2.2265, "step": 139376 }, { "epoch": 0.87, "learning_rate": 3.0819677335041866e-05, "loss": 2.2293, "step": 139384 }, { "epoch": 0.87, "learning_rate": 3.081536399727076e-05, "loss": 2.2333, "step": 139392 }, { "epoch": 0.87, "learning_rate": 3.0811051385032995e-05, "loss": 2.2181, "step": 139400 }, { "epoch": 0.87, "learning_rate": 3.080673949843577e-05, "loss": 2.2347, "step": 139408 }, { "epoch": 0.87, "learning_rate": 3.080242833758627e-05, "loss": 2.2412, "step": 139416 }, { "epoch": 0.87, "learning_rate": 3.0798117902591674e-05, "loss": 2.2258, "step": 139424 }, { "epoch": 0.87, "learning_rate": 3.079380819355915e-05, "loss": 2.2158, "step": 139432 }, { "epoch": 0.87, "learning_rate": 3.078949921059583e-05, "loss": 2.2304, "step": 139440 }, { "epoch": 0.87, "learning_rate": 3.078519095380883e-05, "loss": 2.2314, "step": 139448 }, { "epoch": 0.87, "learning_rate": 3.078088342330526e-05, "loss": 2.2456, "step": 139456 }, { "epoch": 0.87, "learning_rate": 3.077657661919222e-05, "loss": 2.2398, "step": 139464 }, { "epoch": 0.87, "learning_rate": 3.077227054157674e-05, "loss": 2.2402, "step": 139472 }, { "epoch": 0.87, "learning_rate": 3.076796519056592e-05, "loss": 2.2215, "step": 139480 }, { "epoch": 0.87, "learning_rate": 3.0763660566266755e-05, "loss": 2.2304, "step": 139488 }, { "epoch": 0.87, "learning_rate": 3.075935666878626e-05, "loss": 2.2345, "step": 139496 }, { "epoch": 0.87, "learning_rate": 3.0755053498231445e-05, "loss": 2.2181, "step": 139504 }, { "epoch": 0.87, "learning_rate": 3.0750751054709285e-05, "loss": 2.2316, "step": 139512 }, { "epoch": 0.87, "learning_rate": 3.074644933832673e-05, "loss": 2.231, "step": 139520 }, { "epoch": 0.87, "learning_rate": 3.074214834919074e-05, "loss": 2.2537, "step": 139528 }, { "epoch": 0.87, "learning_rate": 3.0737848087408197e-05, "loss": 2.2423, "step": 139536 }, { "epoch": 0.87, "learning_rate": 3.073354855308606e-05, "loss": 2.2456, "step": 139544 }, { "epoch": 0.87, "learning_rate": 3.072924974633118e-05, "loss": 2.2117, "step": 139552 }, { "epoch": 0.87, "learning_rate": 3.072495166725043e-05, "loss": 2.2248, "step": 139560 }, { "epoch": 0.87, "learning_rate": 3.072065431595069e-05, "loss": 2.2402, "step": 139568 }, { "epoch": 0.87, "learning_rate": 3.071635769253874e-05, "loss": 2.2295, "step": 139576 }, { "epoch": 0.87, "learning_rate": 3.071206179712143e-05, "loss": 2.2335, "step": 139584 }, { "epoch": 0.87, "learning_rate": 3.0707766629805566e-05, "loss": 2.2225, "step": 139592 }, { "epoch": 0.87, "learning_rate": 3.070347219069789e-05, "loss": 2.2297, "step": 139600 }, { "epoch": 0.87, "learning_rate": 3.069917847990518e-05, "loss": 2.2457, "step": 139608 }, { "epoch": 0.87, "learning_rate": 3.06948854975342e-05, "loss": 2.226, "step": 139616 }, { "epoch": 0.87, "learning_rate": 3.0690593243691645e-05, "loss": 2.2405, "step": 139624 }, { "epoch": 0.87, "learning_rate": 3.068630171848423e-05, "loss": 2.2295, "step": 139632 }, { "epoch": 0.87, "learning_rate": 3.068201092201864e-05, "loss": 2.2315, "step": 139640 }, { "epoch": 0.87, "learning_rate": 3.067772085440156e-05, "loss": 2.2237, "step": 139648 }, { "epoch": 0.87, "learning_rate": 3.067343151573963e-05, "loss": 2.2263, "step": 139656 }, { "epoch": 0.87, "learning_rate": 3.066914290613946e-05, "loss": 2.2215, "step": 139664 }, { "epoch": 0.87, "learning_rate": 3.06648550257077e-05, "loss": 2.2176, "step": 139672 }, { "epoch": 0.87, "learning_rate": 3.066056787455095e-05, "loss": 2.2226, "step": 139680 }, { "epoch": 0.87, "learning_rate": 3.065628145277575e-05, "loss": 2.2289, "step": 139688 }, { "epoch": 0.87, "learning_rate": 3.065199576048871e-05, "loss": 2.2134, "step": 139696 }, { "epoch": 0.87, "learning_rate": 3.0647710797796334e-05, "loss": 2.2165, "step": 139704 }, { "epoch": 0.87, "learning_rate": 3.064342656480516e-05, "loss": 2.215, "step": 139712 }, { "epoch": 0.87, "learning_rate": 3.06391430616217e-05, "loss": 2.2343, "step": 139720 }, { "epoch": 0.87, "learning_rate": 3.0634860288352435e-05, "loss": 2.2387, "step": 139728 }, { "epoch": 0.87, "learning_rate": 3.063057824510383e-05, "loss": 2.2374, "step": 139736 }, { "epoch": 0.87, "learning_rate": 3.0626296931982353e-05, "loss": 2.2174, "step": 139744 }, { "epoch": 0.87, "learning_rate": 3.062201634909443e-05, "loss": 2.2335, "step": 139752 }, { "epoch": 0.87, "learning_rate": 3.061773649654648e-05, "loss": 2.2285, "step": 139760 }, { "epoch": 0.87, "learning_rate": 3.06134573744449e-05, "loss": 2.2326, "step": 139768 }, { "epoch": 0.87, "learning_rate": 3.0609178982896054e-05, "loss": 2.2317, "step": 139776 }, { "epoch": 0.87, "learning_rate": 3.0604901322006336e-05, "loss": 2.2388, "step": 139784 }, { "epoch": 0.87, "learning_rate": 3.060062439188205e-05, "loss": 2.2403, "step": 139792 }, { "epoch": 0.87, "learning_rate": 3.059634819262954e-05, "loss": 2.2415, "step": 139800 }, { "epoch": 0.87, "learning_rate": 3.059207272435514e-05, "loss": 2.2397, "step": 139808 }, { "epoch": 0.87, "learning_rate": 3.058779798716508e-05, "loss": 2.2236, "step": 139816 }, { "epoch": 0.87, "learning_rate": 3.0583523981165675e-05, "loss": 2.2386, "step": 139824 }, { "epoch": 0.87, "learning_rate": 3.057925070646315e-05, "loss": 2.221, "step": 139832 }, { "epoch": 0.87, "learning_rate": 3.057497816316378e-05, "loss": 2.2285, "step": 139840 }, { "epoch": 0.87, "learning_rate": 3.057070635137374e-05, "loss": 2.2217, "step": 139848 }, { "epoch": 0.87, "learning_rate": 3.0566435271199236e-05, "loss": 2.2261, "step": 139856 }, { "epoch": 0.87, "learning_rate": 3.056216492274646e-05, "loss": 2.2275, "step": 139864 }, { "epoch": 0.87, "learning_rate": 3.055789530612157e-05, "loss": 2.2216, "step": 139872 }, { "epoch": 0.87, "learning_rate": 3.0553626421430695e-05, "loss": 2.2138, "step": 139880 }, { "epoch": 0.87, "learning_rate": 3.054935826877998e-05, "loss": 2.2354, "step": 139888 }, { "epoch": 0.87, "learning_rate": 3.0545090848275524e-05, "loss": 2.2096, "step": 139896 }, { "epoch": 0.87, "learning_rate": 3.054082416002341e-05, "loss": 2.2214, "step": 139904 }, { "epoch": 0.87, "learning_rate": 3.0536558204129716e-05, "loss": 2.2271, "step": 139912 }, { "epoch": 0.87, "learning_rate": 3.0532292980700496e-05, "loss": 2.222, "step": 139920 }, { "epoch": 0.87, "learning_rate": 3.052802848984176e-05, "loss": 2.2279, "step": 139928 }, { "epoch": 0.87, "learning_rate": 3.052376473165957e-05, "loss": 2.2312, "step": 139936 }, { "epoch": 0.87, "learning_rate": 3.051950170625988e-05, "loss": 2.2296, "step": 139944 }, { "epoch": 0.87, "learning_rate": 3.0515239413748675e-05, "loss": 2.2182, "step": 139952 }, { "epoch": 0.87, "learning_rate": 3.0510977854231938e-05, "loss": 2.2334, "step": 139960 }, { "epoch": 0.87, "learning_rate": 3.0506717027815597e-05, "loss": 2.2179, "step": 139968 }, { "epoch": 0.87, "learning_rate": 3.0502456934605584e-05, "loss": 2.208, "step": 139976 }, { "epoch": 0.87, "learning_rate": 3.04981975747078e-05, "loss": 2.2405, "step": 139984 }, { "epoch": 0.87, "learning_rate": 3.0493938948228123e-05, "loss": 2.229, "step": 139992 }, { "epoch": 0.88, "learning_rate": 3.0489681055272463e-05, "loss": 2.2147, "step": 140000 }, { "epoch": 0.88, "learning_rate": 3.0485423895946617e-05, "loss": 2.2272, "step": 140008 }, { "epoch": 0.88, "learning_rate": 3.0481167470356442e-05, "loss": 2.2274, "step": 140016 }, { "epoch": 0.88, "learning_rate": 3.0476911778607786e-05, "loss": 2.225, "step": 140024 }, { "epoch": 0.88, "learning_rate": 3.0472656820806385e-05, "loss": 2.2303, "step": 140032 }, { "epoch": 0.88, "learning_rate": 3.046840259705806e-05, "loss": 2.217, "step": 140040 }, { "epoch": 0.88, "learning_rate": 3.0464149107468555e-05, "loss": 2.2246, "step": 140048 }, { "epoch": 0.88, "learning_rate": 3.045989635214362e-05, "loss": 2.242, "step": 140056 }, { "epoch": 0.88, "learning_rate": 3.0455644331188982e-05, "loss": 2.2471, "step": 140064 }, { "epoch": 0.88, "learning_rate": 3.0451393044710324e-05, "loss": 2.2236, "step": 140072 }, { "epoch": 0.88, "learning_rate": 3.0447142492813367e-05, "loss": 2.2304, "step": 140080 }, { "epoch": 0.88, "learning_rate": 3.0442892675603763e-05, "loss": 2.2241, "step": 140088 }, { "epoch": 0.88, "learning_rate": 3.043864359318715e-05, "loss": 2.2426, "step": 140096 }, { "epoch": 0.88, "learning_rate": 3.0434395245669185e-05, "loss": 2.2261, "step": 140104 }, { "epoch": 0.88, "learning_rate": 3.0430147633155472e-05, "loss": 2.2396, "step": 140112 }, { "epoch": 0.88, "learning_rate": 3.0425900755751598e-05, "loss": 2.2387, "step": 140120 }, { "epoch": 0.88, "learning_rate": 3.0421654613563157e-05, "loss": 2.2272, "step": 140128 }, { "epoch": 0.88, "learning_rate": 3.0417409206695703e-05, "loss": 2.239, "step": 140136 }, { "epoch": 0.88, "learning_rate": 3.0413164535254756e-05, "loss": 2.221, "step": 140144 }, { "epoch": 0.88, "learning_rate": 3.040892059934588e-05, "loss": 2.2128, "step": 140152 }, { "epoch": 0.88, "learning_rate": 3.0404677399074556e-05, "loss": 2.2335, "step": 140160 }, { "epoch": 0.88, "learning_rate": 3.0400434934546258e-05, "loss": 2.2268, "step": 140168 }, { "epoch": 0.88, "learning_rate": 3.0396193205866485e-05, "loss": 2.2162, "step": 140176 }, { "epoch": 0.88, "learning_rate": 3.039195221314065e-05, "loss": 2.2317, "step": 140184 }, { "epoch": 0.88, "learning_rate": 3.0387711956474236e-05, "loss": 2.2241, "step": 140192 }, { "epoch": 0.88, "learning_rate": 3.03834724359726e-05, "loss": 2.2257, "step": 140200 }, { "epoch": 0.88, "learning_rate": 3.0379233651741155e-05, "loss": 2.2368, "step": 140208 }, { "epoch": 0.88, "learning_rate": 3.037499560388532e-05, "loss": 2.2182, "step": 140216 }, { "epoch": 0.88, "learning_rate": 3.0370758292510386e-05, "loss": 2.2298, "step": 140224 }, { "epoch": 0.88, "learning_rate": 3.036652171772173e-05, "loss": 2.2126, "step": 140232 }, { "epoch": 0.88, "learning_rate": 3.036228587962468e-05, "loss": 2.2431, "step": 140240 }, { "epoch": 0.88, "learning_rate": 3.0358050778324524e-05, "loss": 2.2205, "step": 140248 }, { "epoch": 0.88, "learning_rate": 3.035381641392656e-05, "loss": 2.2266, "step": 140256 }, { "epoch": 0.88, "learning_rate": 3.034958278653603e-05, "loss": 2.2336, "step": 140264 }, { "epoch": 0.88, "learning_rate": 3.0345349896258206e-05, "loss": 2.2491, "step": 140272 }, { "epoch": 0.88, "learning_rate": 3.0341117743198315e-05, "loss": 2.2188, "step": 140280 }, { "epoch": 0.88, "learning_rate": 3.033688632746155e-05, "loss": 2.2375, "step": 140288 }, { "epoch": 0.88, "learning_rate": 3.0332655649153134e-05, "loss": 2.2291, "step": 140296 }, { "epoch": 0.88, "learning_rate": 3.032842570837823e-05, "loss": 2.2257, "step": 140304 }, { "epoch": 0.88, "learning_rate": 3.0324196505241976e-05, "loss": 2.2291, "step": 140312 }, { "epoch": 0.88, "learning_rate": 3.0319968039849533e-05, "loss": 2.2271, "step": 140320 }, { "epoch": 0.88, "learning_rate": 3.0315740312306023e-05, "loss": 2.2278, "step": 140328 }, { "epoch": 0.88, "learning_rate": 3.031151332271653e-05, "loss": 2.2225, "step": 140336 }, { "epoch": 0.88, "learning_rate": 3.030728707118615e-05, "loss": 2.23, "step": 140344 }, { "epoch": 0.88, "learning_rate": 3.0303061557819945e-05, "loss": 2.2169, "step": 140352 }, { "epoch": 0.88, "learning_rate": 3.0298836782722957e-05, "loss": 2.2268, "step": 140360 }, { "epoch": 0.88, "learning_rate": 3.029461274600023e-05, "loss": 2.2278, "step": 140368 }, { "epoch": 0.88, "learning_rate": 3.029038944775675e-05, "loss": 2.2284, "step": 140376 }, { "epoch": 0.88, "learning_rate": 3.0286166888097523e-05, "loss": 2.2379, "step": 140384 }, { "epoch": 0.88, "learning_rate": 3.0281945067127532e-05, "loss": 2.2126, "step": 140392 }, { "epoch": 0.88, "learning_rate": 3.0277723984951706e-05, "loss": 2.2323, "step": 140400 }, { "epoch": 0.88, "learning_rate": 3.0273503641675022e-05, "loss": 2.2489, "step": 140408 }, { "epoch": 0.88, "learning_rate": 3.0269284037402347e-05, "loss": 2.2501, "step": 140416 }, { "epoch": 0.88, "learning_rate": 3.0265065172238604e-05, "loss": 2.2213, "step": 140424 }, { "epoch": 0.88, "learning_rate": 3.026084704628871e-05, "loss": 2.2394, "step": 140432 }, { "epoch": 0.88, "learning_rate": 3.025662965965746e-05, "loss": 2.2238, "step": 140440 }, { "epoch": 0.88, "learning_rate": 3.0252413012449742e-05, "loss": 2.2246, "step": 140448 }, { "epoch": 0.88, "learning_rate": 3.024819710477038e-05, "loss": 2.2137, "step": 140456 }, { "epoch": 0.88, "learning_rate": 3.024398193672418e-05, "loss": 2.2492, "step": 140464 }, { "epoch": 0.88, "learning_rate": 3.023976750841593e-05, "loss": 2.2342, "step": 140472 }, { "epoch": 0.88, "learning_rate": 3.023555381995038e-05, "loss": 2.2309, "step": 140480 }, { "epoch": 0.88, "learning_rate": 3.0231340871432317e-05, "loss": 2.2286, "step": 140488 }, { "epoch": 0.88, "learning_rate": 3.0227128662966464e-05, "loss": 2.2186, "step": 140496 }, { "epoch": 0.88, "learning_rate": 3.0222917194657514e-05, "loss": 2.2333, "step": 140504 }, { "epoch": 0.88, "learning_rate": 3.0218706466610202e-05, "loss": 2.2196, "step": 140512 }, { "epoch": 0.88, "learning_rate": 3.0214496478929182e-05, "loss": 2.2301, "step": 140520 }, { "epoch": 0.88, "learning_rate": 3.0210287231719116e-05, "loss": 2.2245, "step": 140528 }, { "epoch": 0.88, "learning_rate": 3.0206078725084657e-05, "loss": 2.2209, "step": 140536 }, { "epoch": 0.88, "learning_rate": 3.020187095913043e-05, "loss": 2.2381, "step": 140544 }, { "epoch": 0.88, "learning_rate": 3.0197663933961017e-05, "loss": 2.2278, "step": 140552 }, { "epoch": 0.88, "learning_rate": 3.0193457649681034e-05, "loss": 2.2269, "step": 140560 }, { "epoch": 0.88, "learning_rate": 3.0189252106395044e-05, "loss": 2.2286, "step": 140568 }, { "epoch": 0.88, "learning_rate": 3.0185047304207575e-05, "loss": 2.2401, "step": 140576 }, { "epoch": 0.88, "learning_rate": 3.018084324322319e-05, "loss": 2.2268, "step": 140584 }, { "epoch": 0.88, "learning_rate": 3.0176639923546374e-05, "loss": 2.2148, "step": 140592 }, { "epoch": 0.88, "learning_rate": 3.0172437345281645e-05, "loss": 2.2275, "step": 140600 }, { "epoch": 0.88, "learning_rate": 3.016823550853347e-05, "loss": 2.2335, "step": 140608 }, { "epoch": 0.88, "learning_rate": 3.01640344134063e-05, "loss": 2.2298, "step": 140616 }, { "epoch": 0.88, "learning_rate": 3.0159834060004605e-05, "loss": 2.2301, "step": 140624 }, { "epoch": 0.88, "learning_rate": 3.0155634448432757e-05, "loss": 2.226, "step": 140632 }, { "epoch": 0.88, "learning_rate": 3.0151435578795183e-05, "loss": 2.2284, "step": 140640 }, { "epoch": 0.88, "learning_rate": 3.0147237451196297e-05, "loss": 2.2394, "step": 140648 }, { "epoch": 0.88, "learning_rate": 3.0143040065740418e-05, "loss": 2.2288, "step": 140656 }, { "epoch": 0.88, "learning_rate": 3.0138843422531904e-05, "loss": 2.2315, "step": 140664 }, { "epoch": 0.88, "learning_rate": 3.0134647521675113e-05, "loss": 2.2412, "step": 140672 }, { "epoch": 0.88, "learning_rate": 3.013045236327433e-05, "loss": 2.2335, "step": 140680 }, { "epoch": 0.88, "learning_rate": 3.0126257947433852e-05, "loss": 2.2357, "step": 140688 }, { "epoch": 0.88, "learning_rate": 3.0122064274257944e-05, "loss": 2.2186, "step": 140696 }, { "epoch": 0.88, "learning_rate": 3.0117871343850883e-05, "loss": 2.2191, "step": 140704 }, { "epoch": 0.88, "learning_rate": 3.0113679156316886e-05, "loss": 2.226, "step": 140712 }, { "epoch": 0.88, "learning_rate": 3.0109487711760174e-05, "loss": 2.2213, "step": 140720 }, { "epoch": 0.88, "learning_rate": 3.0105297010284962e-05, "loss": 2.2283, "step": 140728 }, { "epoch": 0.88, "learning_rate": 3.010110705199542e-05, "loss": 2.2326, "step": 140736 }, { "epoch": 0.88, "learning_rate": 3.0096917836995698e-05, "loss": 2.2158, "step": 140744 }, { "epoch": 0.88, "learning_rate": 3.0092729365389966e-05, "loss": 2.225, "step": 140752 }, { "epoch": 0.88, "learning_rate": 3.008854163728234e-05, "loss": 2.2275, "step": 140760 }, { "epoch": 0.88, "learning_rate": 3.008435465277691e-05, "loss": 2.2287, "step": 140768 }, { "epoch": 0.88, "learning_rate": 3.0080168411977794e-05, "loss": 2.2438, "step": 140776 }, { "epoch": 0.88, "learning_rate": 3.0075982914989044e-05, "loss": 2.225, "step": 140784 }, { "epoch": 0.88, "learning_rate": 3.0071798161914705e-05, "loss": 2.2188, "step": 140792 }, { "epoch": 0.88, "learning_rate": 3.0067614152858837e-05, "loss": 2.2229, "step": 140800 }, { "epoch": 0.88, "learning_rate": 3.0063430887925424e-05, "loss": 2.2417, "step": 140808 }, { "epoch": 0.88, "learning_rate": 3.0059248367218496e-05, "loss": 2.2229, "step": 140816 }, { "epoch": 0.88, "learning_rate": 3.0055066590842008e-05, "loss": 2.2201, "step": 140824 }, { "epoch": 0.88, "learning_rate": 3.005088555889991e-05, "loss": 2.2287, "step": 140832 }, { "epoch": 0.88, "learning_rate": 3.0046705271496183e-05, "loss": 2.2254, "step": 140840 }, { "epoch": 0.88, "learning_rate": 3.0042525728734704e-05, "loss": 2.2323, "step": 140848 }, { "epoch": 0.88, "learning_rate": 3.003834693071939e-05, "loss": 2.2199, "step": 140856 }, { "epoch": 0.88, "learning_rate": 3.0034168877554164e-05, "loss": 2.2148, "step": 140864 }, { "epoch": 0.88, "learning_rate": 3.0029991569342836e-05, "loss": 2.2259, "step": 140872 }, { "epoch": 0.88, "learning_rate": 3.002581500618929e-05, "loss": 2.2208, "step": 140880 }, { "epoch": 0.88, "learning_rate": 3.002163918819734e-05, "loss": 2.2316, "step": 140888 }, { "epoch": 0.88, "learning_rate": 3.00174641154708e-05, "loss": 2.2225, "step": 140896 }, { "epoch": 0.88, "learning_rate": 3.001328978811348e-05, "loss": 2.2193, "step": 140904 }, { "epoch": 0.88, "learning_rate": 3.0009116206229125e-05, "loss": 2.2134, "step": 140912 }, { "epoch": 0.88, "learning_rate": 3.0004943369921517e-05, "loss": 2.2219, "step": 140920 }, { "epoch": 0.88, "learning_rate": 3.0000771279294383e-05, "loss": 2.2152, "step": 140928 }, { "epoch": 0.88, "learning_rate": 2.9996599934451424e-05, "loss": 2.2361, "step": 140936 }, { "epoch": 0.88, "learning_rate": 2.9992429335496374e-05, "loss": 2.2226, "step": 140944 }, { "epoch": 0.88, "learning_rate": 2.9988259482532898e-05, "loss": 2.2443, "step": 140952 }, { "epoch": 0.88, "learning_rate": 2.998409037566464e-05, "loss": 2.2104, "step": 140960 }, { "epoch": 0.88, "learning_rate": 2.9979922014995286e-05, "loss": 2.2123, "step": 140968 }, { "epoch": 0.88, "learning_rate": 2.997575440062843e-05, "loss": 2.2197, "step": 140976 }, { "epoch": 0.88, "learning_rate": 2.9971587532667678e-05, "loss": 2.207, "step": 140984 }, { "epoch": 0.88, "learning_rate": 2.9967421411216645e-05, "loss": 2.2362, "step": 140992 }, { "epoch": 0.88, "learning_rate": 2.9963256036378884e-05, "loss": 2.2154, "step": 141000 }, { "epoch": 0.88, "learning_rate": 2.9959091408257932e-05, "loss": 2.2261, "step": 141008 }, { "epoch": 0.88, "learning_rate": 2.995492752695735e-05, "loss": 2.2209, "step": 141016 }, { "epoch": 0.88, "learning_rate": 2.995076439258063e-05, "loss": 2.2214, "step": 141024 }, { "epoch": 0.88, "learning_rate": 2.9946602005231307e-05, "loss": 2.2259, "step": 141032 }, { "epoch": 0.88, "learning_rate": 2.99424403650128e-05, "loss": 2.2139, "step": 141040 }, { "epoch": 0.88, "learning_rate": 2.993827947202861e-05, "loss": 2.2159, "step": 141048 }, { "epoch": 0.88, "learning_rate": 2.993411932638217e-05, "loss": 2.2275, "step": 141056 }, { "epoch": 0.88, "learning_rate": 2.992995992817689e-05, "loss": 2.2359, "step": 141064 }, { "epoch": 0.88, "learning_rate": 2.992580127751617e-05, "loss": 2.2282, "step": 141072 }, { "epoch": 0.88, "learning_rate": 2.9921643374503433e-05, "loss": 2.2315, "step": 141080 }, { "epoch": 0.88, "learning_rate": 2.991748621924199e-05, "loss": 2.2243, "step": 141088 }, { "epoch": 0.88, "learning_rate": 2.9913329811835228e-05, "loss": 2.2328, "step": 141096 }, { "epoch": 0.88, "learning_rate": 2.9909174152386456e-05, "loss": 2.2206, "step": 141104 }, { "epoch": 0.88, "learning_rate": 2.9905019240998994e-05, "loss": 2.2215, "step": 141112 }, { "epoch": 0.88, "learning_rate": 2.9900865077776132e-05, "loss": 2.2172, "step": 141120 }, { "epoch": 0.88, "learning_rate": 2.989671166282113e-05, "loss": 2.2204, "step": 141128 }, { "epoch": 0.88, "learning_rate": 2.9892558996237263e-05, "loss": 2.2088, "step": 141136 }, { "epoch": 0.88, "learning_rate": 2.988840707812776e-05, "loss": 2.227, "step": 141144 }, { "epoch": 0.88, "learning_rate": 2.9884255908595825e-05, "loss": 2.2053, "step": 141152 }, { "epoch": 0.88, "learning_rate": 2.988010548774468e-05, "loss": 2.2323, "step": 141160 }, { "epoch": 0.88, "learning_rate": 2.9875955815677485e-05, "loss": 2.2134, "step": 141168 }, { "epoch": 0.88, "learning_rate": 2.98718068924974e-05, "loss": 2.2202, "step": 141176 }, { "epoch": 0.88, "learning_rate": 2.986765871830759e-05, "loss": 2.2348, "step": 141184 }, { "epoch": 0.88, "learning_rate": 2.9863511293211168e-05, "loss": 2.2147, "step": 141192 }, { "epoch": 0.88, "learning_rate": 2.985936461731122e-05, "loss": 2.2371, "step": 141200 }, { "epoch": 0.88, "learning_rate": 2.9855218690710863e-05, "loss": 2.2387, "step": 141208 }, { "epoch": 0.88, "learning_rate": 2.985107351351315e-05, "loss": 2.2271, "step": 141216 }, { "epoch": 0.88, "learning_rate": 2.9846929085821117e-05, "loss": 2.2227, "step": 141224 }, { "epoch": 0.88, "learning_rate": 2.984278540773783e-05, "loss": 2.2245, "step": 141232 }, { "epoch": 0.88, "learning_rate": 2.9838642479366263e-05, "loss": 2.225, "step": 141240 }, { "epoch": 0.88, "learning_rate": 2.9834500300809454e-05, "loss": 2.2064, "step": 141248 }, { "epoch": 0.88, "learning_rate": 2.9830358872170327e-05, "loss": 2.2212, "step": 141256 }, { "epoch": 0.88, "learning_rate": 2.982621819355187e-05, "loss": 2.2276, "step": 141264 }, { "epoch": 0.88, "learning_rate": 2.982207826505703e-05, "loss": 2.2302, "step": 141272 }, { "epoch": 0.88, "learning_rate": 2.9817939086788688e-05, "loss": 2.2176, "step": 141280 }, { "epoch": 0.88, "learning_rate": 2.9813800658849768e-05, "loss": 2.2317, "step": 141288 }, { "epoch": 0.88, "learning_rate": 2.9809662981343156e-05, "loss": 2.2179, "step": 141296 }, { "epoch": 0.88, "learning_rate": 2.9805526054371718e-05, "loss": 2.2341, "step": 141304 }, { "epoch": 0.88, "learning_rate": 2.980138987803829e-05, "loss": 2.22, "step": 141312 }, { "epoch": 0.88, "learning_rate": 2.979725445244568e-05, "loss": 2.2367, "step": 141320 }, { "epoch": 0.88, "learning_rate": 2.979311977769673e-05, "loss": 2.2309, "step": 141328 }, { "epoch": 0.88, "learning_rate": 2.9788985853894207e-05, "loss": 2.2344, "step": 141336 }, { "epoch": 0.88, "learning_rate": 2.978485268114088e-05, "loss": 2.217, "step": 141344 }, { "epoch": 0.88, "learning_rate": 2.9780720259539513e-05, "loss": 2.2247, "step": 141352 }, { "epoch": 0.88, "learning_rate": 2.9776588589192834e-05, "loss": 2.2344, "step": 141360 }, { "epoch": 0.88, "learning_rate": 2.9772457670203536e-05, "loss": 2.2485, "step": 141368 }, { "epoch": 0.88, "learning_rate": 2.9768327502674347e-05, "loss": 2.2236, "step": 141376 }, { "epoch": 0.88, "learning_rate": 2.9764198086707927e-05, "loss": 2.2434, "step": 141384 }, { "epoch": 0.88, "learning_rate": 2.9760069422406923e-05, "loss": 2.2142, "step": 141392 }, { "epoch": 0.88, "learning_rate": 2.9755941509873996e-05, "loss": 2.2362, "step": 141400 }, { "epoch": 0.88, "learning_rate": 2.9751814349211766e-05, "loss": 2.2236, "step": 141408 }, { "epoch": 0.88, "learning_rate": 2.9747687940522807e-05, "loss": 2.2152, "step": 141416 }, { "epoch": 0.88, "learning_rate": 2.974356228390973e-05, "loss": 2.2352, "step": 141424 }, { "epoch": 0.88, "learning_rate": 2.9739437379475077e-05, "loss": 2.2326, "step": 141432 }, { "epoch": 0.88, "learning_rate": 2.9735313227321415e-05, "loss": 2.2272, "step": 141440 }, { "epoch": 0.88, "learning_rate": 2.973118982755127e-05, "loss": 2.2317, "step": 141448 }, { "epoch": 0.88, "learning_rate": 2.9727067180267126e-05, "loss": 2.2295, "step": 141456 }, { "epoch": 0.88, "learning_rate": 2.9722945285571513e-05, "loss": 2.2257, "step": 141464 }, { "epoch": 0.88, "learning_rate": 2.9718824143566853e-05, "loss": 2.2339, "step": 141472 }, { "epoch": 0.88, "learning_rate": 2.9714703754355627e-05, "loss": 2.2162, "step": 141480 }, { "epoch": 0.88, "learning_rate": 2.971058411804028e-05, "loss": 2.2433, "step": 141488 }, { "epoch": 0.88, "learning_rate": 2.9706465234723192e-05, "loss": 2.2254, "step": 141496 }, { "epoch": 0.88, "learning_rate": 2.9702347104506773e-05, "loss": 2.2463, "step": 141504 }, { "epoch": 0.88, "learning_rate": 2.9698229727493416e-05, "loss": 2.2277, "step": 141512 }, { "epoch": 0.88, "learning_rate": 2.969411310378547e-05, "loss": 2.2284, "step": 141520 }, { "epoch": 0.88, "learning_rate": 2.9689997233485266e-05, "loss": 2.2437, "step": 141528 }, { "epoch": 0.88, "learning_rate": 2.968588211669513e-05, "loss": 2.2187, "step": 141536 }, { "epoch": 0.88, "learning_rate": 2.9681767753517377e-05, "loss": 2.2401, "step": 141544 }, { "epoch": 0.88, "learning_rate": 2.9677654144054273e-05, "loss": 2.2359, "step": 141552 }, { "epoch": 0.88, "learning_rate": 2.967354128840808e-05, "loss": 2.2183, "step": 141560 }, { "epoch": 0.88, "learning_rate": 2.9669429186681064e-05, "loss": 2.2463, "step": 141568 }, { "epoch": 0.88, "learning_rate": 2.9665317838975436e-05, "loss": 2.248, "step": 141576 }, { "epoch": 0.88, "learning_rate": 2.9661207245393406e-05, "loss": 2.2318, "step": 141584 }, { "epoch": 0.88, "learning_rate": 2.9657097406037183e-05, "loss": 2.222, "step": 141592 }, { "epoch": 0.89, "learning_rate": 2.965298832100891e-05, "loss": 2.2225, "step": 141600 }, { "epoch": 0.89, "learning_rate": 2.9648879990410756e-05, "loss": 2.2398, "step": 141608 }, { "epoch": 0.89, "learning_rate": 2.9644772414344853e-05, "loss": 2.2368, "step": 141616 }, { "epoch": 0.89, "learning_rate": 2.964066559291332e-05, "loss": 2.2155, "step": 141624 }, { "epoch": 0.89, "learning_rate": 2.963655952621822e-05, "loss": 2.2078, "step": 141632 }, { "epoch": 0.89, "learning_rate": 2.9632454214361683e-05, "loss": 2.2293, "step": 141640 }, { "epoch": 0.89, "learning_rate": 2.9628349657445726e-05, "loss": 2.2157, "step": 141648 }, { "epoch": 0.89, "learning_rate": 2.9624245855572418e-05, "loss": 2.216, "step": 141656 }, { "epoch": 0.89, "learning_rate": 2.9620142808843758e-05, "loss": 2.2182, "step": 141664 }, { "epoch": 0.89, "learning_rate": 2.9616040517361753e-05, "loss": 2.2298, "step": 141672 }, { "epoch": 0.89, "learning_rate": 2.961193898122841e-05, "loss": 2.226, "step": 141680 }, { "epoch": 0.89, "learning_rate": 2.960783820054565e-05, "loss": 2.2199, "step": 141688 }, { "epoch": 0.89, "learning_rate": 2.960373817541544e-05, "loss": 2.2419, "step": 141696 }, { "epoch": 0.89, "learning_rate": 2.9599638905939736e-05, "loss": 2.2349, "step": 141704 }, { "epoch": 0.89, "learning_rate": 2.95955403922204e-05, "loss": 2.2359, "step": 141712 }, { "epoch": 0.89, "learning_rate": 2.9591442634359347e-05, "loss": 2.2104, "step": 141720 }, { "epoch": 0.89, "learning_rate": 2.958734563245843e-05, "loss": 2.2089, "step": 141728 }, { "epoch": 0.89, "learning_rate": 2.9583249386619528e-05, "loss": 2.233, "step": 141736 }, { "epoch": 0.89, "learning_rate": 2.9579153896944456e-05, "loss": 2.2301, "step": 141744 }, { "epoch": 0.89, "learning_rate": 2.9575059163535023e-05, "loss": 2.2385, "step": 141752 }, { "epoch": 0.89, "learning_rate": 2.957096518649304e-05, "loss": 2.2106, "step": 141760 }, { "epoch": 0.89, "learning_rate": 2.956687196592028e-05, "loss": 2.2533, "step": 141768 }, { "epoch": 0.89, "learning_rate": 2.956277950191848e-05, "loss": 2.2298, "step": 141776 }, { "epoch": 0.89, "learning_rate": 2.9558687794589414e-05, "loss": 2.2313, "step": 141784 }, { "epoch": 0.89, "learning_rate": 2.955459684403479e-05, "loss": 2.2206, "step": 141792 }, { "epoch": 0.89, "learning_rate": 2.955050665035628e-05, "loss": 2.2103, "step": 141800 }, { "epoch": 0.89, "learning_rate": 2.954641721365561e-05, "loss": 2.2365, "step": 141808 }, { "epoch": 0.89, "learning_rate": 2.9542328534034426e-05, "loss": 2.2195, "step": 141816 }, { "epoch": 0.89, "learning_rate": 2.953824061159436e-05, "loss": 2.2096, "step": 141824 }, { "epoch": 0.89, "learning_rate": 2.9534153446437057e-05, "loss": 2.2198, "step": 141832 }, { "epoch": 0.89, "learning_rate": 2.9530067038664123e-05, "loss": 2.2437, "step": 141840 }, { "epoch": 0.89, "learning_rate": 2.952598138837712e-05, "loss": 2.2112, "step": 141848 }, { "epoch": 0.89, "learning_rate": 2.952189649567766e-05, "loss": 2.2234, "step": 141856 }, { "epoch": 0.89, "learning_rate": 2.9517812360667256e-05, "loss": 2.221, "step": 141864 }, { "epoch": 0.89, "learning_rate": 2.9513728983447486e-05, "loss": 2.2361, "step": 141872 }, { "epoch": 0.89, "learning_rate": 2.95096463641198e-05, "loss": 2.239, "step": 141880 }, { "epoch": 0.89, "learning_rate": 2.9505564502785736e-05, "loss": 2.2287, "step": 141888 }, { "epoch": 0.89, "learning_rate": 2.9501483399546782e-05, "loss": 2.2179, "step": 141896 }, { "epoch": 0.89, "learning_rate": 2.9497403054504346e-05, "loss": 2.2263, "step": 141904 }, { "epoch": 0.89, "learning_rate": 2.94933234677599e-05, "loss": 2.235, "step": 141912 }, { "epoch": 0.89, "learning_rate": 2.948924463941487e-05, "loss": 2.2391, "step": 141920 }, { "epoch": 0.89, "learning_rate": 2.9485166569570623e-05, "loss": 2.2209, "step": 141928 }, { "epoch": 0.89, "learning_rate": 2.9481089258328564e-05, "loss": 2.2287, "step": 141936 }, { "epoch": 0.89, "learning_rate": 2.9477012705790043e-05, "loss": 2.2149, "step": 141944 }, { "epoch": 0.89, "learning_rate": 2.9472936912056426e-05, "loss": 2.2342, "step": 141952 }, { "epoch": 0.89, "learning_rate": 2.9468861877229016e-05, "loss": 2.2258, "step": 141960 }, { "epoch": 0.89, "learning_rate": 2.9464787601409118e-05, "loss": 2.2175, "step": 141968 }, { "epoch": 0.89, "learning_rate": 2.946071408469804e-05, "loss": 2.2248, "step": 141976 }, { "epoch": 0.89, "learning_rate": 2.945664132719703e-05, "loss": 2.2315, "step": 141984 }, { "epoch": 0.89, "learning_rate": 2.9452569329007328e-05, "loss": 2.2324, "step": 141992 }, { "epoch": 0.89, "learning_rate": 2.9448498090230204e-05, "loss": 2.2219, "step": 142000 }, { "epoch": 0.89, "learning_rate": 2.944442761096684e-05, "loss": 2.217, "step": 142008 }, { "epoch": 0.89, "learning_rate": 2.944035789131842e-05, "loss": 2.2117, "step": 142016 }, { "epoch": 0.89, "learning_rate": 2.9436288931386148e-05, "loss": 2.209, "step": 142024 }, { "epoch": 0.89, "learning_rate": 2.9432220731271154e-05, "loss": 2.2288, "step": 142032 }, { "epoch": 0.89, "learning_rate": 2.9428153291074577e-05, "loss": 2.2238, "step": 142040 }, { "epoch": 0.89, "learning_rate": 2.942408661089755e-05, "loss": 2.2056, "step": 142048 }, { "epoch": 0.89, "learning_rate": 2.9420020690841154e-05, "loss": 2.2336, "step": 142056 }, { "epoch": 0.89, "learning_rate": 2.9415955531006474e-05, "loss": 2.222, "step": 142064 }, { "epoch": 0.89, "learning_rate": 2.9411891131494578e-05, "loss": 2.2292, "step": 142072 }, { "epoch": 0.89, "learning_rate": 2.9407827492406487e-05, "loss": 2.229, "step": 142080 }, { "epoch": 0.89, "learning_rate": 2.940376461384326e-05, "loss": 2.2366, "step": 142088 }, { "epoch": 0.89, "learning_rate": 2.9399702495905855e-05, "loss": 2.2392, "step": 142096 }, { "epoch": 0.89, "learning_rate": 2.9395641138695285e-05, "loss": 2.2186, "step": 142104 }, { "epoch": 0.89, "learning_rate": 2.9391580542312526e-05, "loss": 2.2334, "step": 142112 }, { "epoch": 0.89, "learning_rate": 2.9387520706858485e-05, "loss": 2.2461, "step": 142120 }, { "epoch": 0.89, "learning_rate": 2.938346163243412e-05, "loss": 2.2413, "step": 142128 }, { "epoch": 0.89, "learning_rate": 2.937940331914034e-05, "loss": 2.2312, "step": 142136 }, { "epoch": 0.89, "learning_rate": 2.9375345767078034e-05, "loss": 2.2225, "step": 142144 }, { "epoch": 0.89, "learning_rate": 2.9371288976348066e-05, "loss": 2.2294, "step": 142152 }, { "epoch": 0.89, "learning_rate": 2.9367232947051275e-05, "loss": 2.2299, "step": 142160 }, { "epoch": 0.89, "learning_rate": 2.936317767928853e-05, "loss": 2.2222, "step": 142168 }, { "epoch": 0.89, "learning_rate": 2.9359123173160613e-05, "loss": 2.2264, "step": 142176 }, { "epoch": 0.89, "learning_rate": 2.9355069428768333e-05, "loss": 2.2435, "step": 142184 }, { "epoch": 0.89, "learning_rate": 2.9351016446212472e-05, "loss": 2.2328, "step": 142192 }, { "epoch": 0.89, "learning_rate": 2.9346964225593775e-05, "loss": 2.2435, "step": 142200 }, { "epoch": 0.89, "learning_rate": 2.9342912767012982e-05, "loss": 2.2292, "step": 142208 }, { "epoch": 0.89, "learning_rate": 2.933886207057083e-05, "loss": 2.233, "step": 142216 }, { "epoch": 0.89, "learning_rate": 2.9334812136368e-05, "loss": 2.2254, "step": 142224 }, { "epoch": 0.89, "learning_rate": 2.933076296450517e-05, "loss": 2.2159, "step": 142232 }, { "epoch": 0.89, "learning_rate": 2.9326714555083035e-05, "loss": 2.225, "step": 142240 }, { "epoch": 0.89, "learning_rate": 2.9322666908202207e-05, "loss": 2.218, "step": 142248 }, { "epoch": 0.89, "learning_rate": 2.9318620023963316e-05, "loss": 2.226, "step": 142256 }, { "epoch": 0.89, "learning_rate": 2.9314573902466986e-05, "loss": 2.2165, "step": 142264 }, { "epoch": 0.89, "learning_rate": 2.9310528543813787e-05, "loss": 2.2277, "step": 142272 }, { "epoch": 0.89, "learning_rate": 2.930648394810428e-05, "loss": 2.2388, "step": 142280 }, { "epoch": 0.89, "learning_rate": 2.930244011543904e-05, "loss": 2.2292, "step": 142288 }, { "epoch": 0.89, "learning_rate": 2.929839704591857e-05, "loss": 2.2381, "step": 142296 }, { "epoch": 0.89, "learning_rate": 2.929435473964342e-05, "loss": 2.2368, "step": 142304 }, { "epoch": 0.89, "learning_rate": 2.9290313196714032e-05, "loss": 2.229, "step": 142312 }, { "epoch": 0.89, "learning_rate": 2.9286272417230897e-05, "loss": 2.2365, "step": 142320 }, { "epoch": 0.89, "learning_rate": 2.9282232401294506e-05, "loss": 2.2308, "step": 142328 }, { "epoch": 0.89, "learning_rate": 2.927819314900524e-05, "loss": 2.2285, "step": 142336 }, { "epoch": 0.89, "learning_rate": 2.927415466046354e-05, "loss": 2.229, "step": 142344 }, { "epoch": 0.89, "learning_rate": 2.9270116935769816e-05, "loss": 2.2274, "step": 142352 }, { "epoch": 0.89, "learning_rate": 2.926607997502443e-05, "loss": 2.2471, "step": 142360 }, { "epoch": 0.89, "learning_rate": 2.926204377832774e-05, "loss": 2.2321, "step": 142368 }, { "epoch": 0.89, "learning_rate": 2.9258008345780084e-05, "loss": 2.2278, "step": 142376 }, { "epoch": 0.89, "learning_rate": 2.92539736774818e-05, "loss": 2.2329, "step": 142384 }, { "epoch": 0.89, "learning_rate": 2.924993977353318e-05, "loss": 2.2153, "step": 142392 }, { "epoch": 0.89, "learning_rate": 2.92459066340345e-05, "loss": 2.2432, "step": 142400 }, { "epoch": 0.89, "learning_rate": 2.9241874259086034e-05, "loss": 2.2143, "step": 142408 }, { "epoch": 0.89, "learning_rate": 2.9237842648788028e-05, "loss": 2.2372, "step": 142416 }, { "epoch": 0.89, "learning_rate": 2.9233811803240695e-05, "loss": 2.2237, "step": 142424 }, { "epoch": 0.89, "learning_rate": 2.9229781722544268e-05, "loss": 2.2183, "step": 142432 }, { "epoch": 0.89, "learning_rate": 2.9225752406798912e-05, "loss": 2.2409, "step": 142440 }, { "epoch": 0.89, "learning_rate": 2.92217238561048e-05, "loss": 2.231, "step": 142448 }, { "epoch": 0.89, "learning_rate": 2.921769607056209e-05, "loss": 2.2376, "step": 142456 }, { "epoch": 0.89, "learning_rate": 2.9213669050270914e-05, "loss": 2.243, "step": 142464 }, { "epoch": 0.89, "learning_rate": 2.9209642795331365e-05, "loss": 2.2359, "step": 142472 }, { "epoch": 0.89, "learning_rate": 2.920561730584357e-05, "loss": 2.2247, "step": 142480 }, { "epoch": 0.89, "learning_rate": 2.9201592581907565e-05, "loss": 2.2232, "step": 142488 }, { "epoch": 0.89, "learning_rate": 2.919756862362344e-05, "loss": 2.2291, "step": 142496 }, { "epoch": 0.89, "learning_rate": 2.919354543109121e-05, "loss": 2.2293, "step": 142504 }, { "epoch": 0.89, "learning_rate": 2.918952300441089e-05, "loss": 2.2306, "step": 142512 }, { "epoch": 0.89, "learning_rate": 2.9185501343682503e-05, "loss": 2.2214, "step": 142520 }, { "epoch": 0.89, "learning_rate": 2.9181480449005992e-05, "loss": 2.2444, "step": 142528 }, { "epoch": 0.89, "learning_rate": 2.917746032048133e-05, "loss": 2.229, "step": 142536 }, { "epoch": 0.89, "learning_rate": 2.9173440958208485e-05, "loss": 2.2358, "step": 142544 }, { "epoch": 0.89, "learning_rate": 2.9169422362287348e-05, "loss": 2.2142, "step": 142552 }, { "epoch": 0.89, "learning_rate": 2.9165404532817823e-05, "loss": 2.2207, "step": 142560 }, { "epoch": 0.89, "learning_rate": 2.9161387469899797e-05, "loss": 2.2247, "step": 142568 }, { "epoch": 0.89, "learning_rate": 2.9157371173633152e-05, "loss": 2.2258, "step": 142576 }, { "epoch": 0.89, "learning_rate": 2.915335564411772e-05, "loss": 2.2229, "step": 142584 }, { "epoch": 0.89, "learning_rate": 2.9149340881453312e-05, "loss": 2.2322, "step": 142592 }, { "epoch": 0.89, "learning_rate": 2.9145326885739766e-05, "loss": 2.2446, "step": 142600 }, { "epoch": 0.89, "learning_rate": 2.914131365707685e-05, "loss": 2.2409, "step": 142608 }, { "epoch": 0.89, "learning_rate": 2.913730119556433e-05, "loss": 2.2134, "step": 142616 }, { "epoch": 0.89, "learning_rate": 2.9133289501301987e-05, "loss": 2.2258, "step": 142624 }, { "epoch": 0.89, "learning_rate": 2.9129278574389517e-05, "loss": 2.2168, "step": 142632 }, { "epoch": 0.89, "learning_rate": 2.9125268414926638e-05, "loss": 2.2133, "step": 142640 }, { "epoch": 0.89, "learning_rate": 2.9121259023013058e-05, "loss": 2.2285, "step": 142648 }, { "epoch": 0.89, "learning_rate": 2.9117250398748447e-05, "loss": 2.2103, "step": 142656 }, { "epoch": 0.89, "learning_rate": 2.9113242542232443e-05, "loss": 2.229, "step": 142664 }, { "epoch": 0.89, "learning_rate": 2.9109235453564708e-05, "loss": 2.223, "step": 142672 }, { "epoch": 0.89, "learning_rate": 2.9105229132844846e-05, "loss": 2.2192, "step": 142680 }, { "epoch": 0.89, "learning_rate": 2.9101223580172444e-05, "loss": 2.2155, "step": 142688 }, { "epoch": 0.89, "learning_rate": 2.9097218795647103e-05, "loss": 2.2113, "step": 142696 }, { "epoch": 0.89, "learning_rate": 2.909321477936835e-05, "loss": 2.2179, "step": 142704 }, { "epoch": 0.89, "learning_rate": 2.908921153143577e-05, "loss": 2.2139, "step": 142712 }, { "epoch": 0.89, "learning_rate": 2.9085209051948848e-05, "loss": 2.2323, "step": 142720 }, { "epoch": 0.89, "learning_rate": 2.9081207341007087e-05, "loss": 2.218, "step": 142728 }, { "epoch": 0.89, "learning_rate": 2.9077206398710012e-05, "loss": 2.2325, "step": 142736 }, { "epoch": 0.89, "learning_rate": 2.9073206225157025e-05, "loss": 2.2345, "step": 142744 }, { "epoch": 0.89, "learning_rate": 2.9069206820447604e-05, "loss": 2.2239, "step": 142752 }, { "epoch": 0.89, "learning_rate": 2.906520818468119e-05, "loss": 2.2275, "step": 142760 }, { "epoch": 0.89, "learning_rate": 2.906121031795715e-05, "loss": 2.21, "step": 142768 }, { "epoch": 0.89, "learning_rate": 2.9057213220374906e-05, "loss": 2.2132, "step": 142776 }, { "epoch": 0.89, "learning_rate": 2.90532168920338e-05, "loss": 2.2358, "step": 142784 }, { "epoch": 0.89, "learning_rate": 2.9049221333033206e-05, "loss": 2.2361, "step": 142792 }, { "epoch": 0.89, "learning_rate": 2.9045226543472448e-05, "loss": 2.22, "step": 142800 }, { "epoch": 0.89, "learning_rate": 2.9041232523450813e-05, "loss": 2.2225, "step": 142808 }, { "epoch": 0.89, "learning_rate": 2.903723927306763e-05, "loss": 2.2326, "step": 142816 }, { "epoch": 0.89, "learning_rate": 2.9033246792422142e-05, "loss": 2.2153, "step": 142824 }, { "epoch": 0.89, "learning_rate": 2.902925508161361e-05, "loss": 2.2113, "step": 142832 }, { "epoch": 0.89, "learning_rate": 2.9025264140741276e-05, "loss": 2.208, "step": 142840 }, { "epoch": 0.89, "learning_rate": 2.9021273969904355e-05, "loss": 2.2208, "step": 142848 }, { "epoch": 0.89, "learning_rate": 2.901728456920203e-05, "loss": 2.2333, "step": 142856 }, { "epoch": 0.89, "learning_rate": 2.90132959387335e-05, "loss": 2.2198, "step": 142864 }, { "epoch": 0.89, "learning_rate": 2.9009308078597897e-05, "loss": 2.2072, "step": 142872 }, { "epoch": 0.89, "learning_rate": 2.900532098889437e-05, "loss": 2.222, "step": 142880 }, { "epoch": 0.89, "learning_rate": 2.9001334669722052e-05, "loss": 2.2304, "step": 142888 }, { "epoch": 0.89, "learning_rate": 2.8997349121180035e-05, "loss": 2.2328, "step": 142896 }, { "epoch": 0.89, "learning_rate": 2.899336434336738e-05, "loss": 2.239, "step": 142904 }, { "epoch": 0.89, "learning_rate": 2.8989380336383183e-05, "loss": 2.2204, "step": 142912 }, { "epoch": 0.89, "learning_rate": 2.898539710032645e-05, "loss": 2.2116, "step": 142920 }, { "epoch": 0.89, "learning_rate": 2.8981414635296257e-05, "loss": 2.2309, "step": 142928 }, { "epoch": 0.89, "learning_rate": 2.8977432941391546e-05, "loss": 2.2246, "step": 142936 }, { "epoch": 0.89, "learning_rate": 2.897345201871134e-05, "loss": 2.2302, "step": 142944 }, { "epoch": 0.89, "learning_rate": 2.8969471867354614e-05, "loss": 2.2362, "step": 142952 }, { "epoch": 0.89, "learning_rate": 2.8965492487420282e-05, "loss": 2.2203, "step": 142960 }, { "epoch": 0.89, "learning_rate": 2.8961513879007285e-05, "loss": 2.2118, "step": 142968 }, { "epoch": 0.89, "learning_rate": 2.895753604221456e-05, "loss": 2.2307, "step": 142976 }, { "epoch": 0.89, "learning_rate": 2.895355897714095e-05, "loss": 2.2164, "step": 142984 }, { "epoch": 0.89, "learning_rate": 2.894958268388535e-05, "loss": 2.208, "step": 142992 }, { "epoch": 0.89, "learning_rate": 2.8945607162546607e-05, "loss": 2.2041, "step": 143000 }, { "epoch": 0.89, "learning_rate": 2.894163241322356e-05, "loss": 2.2479, "step": 143008 }, { "epoch": 0.89, "learning_rate": 2.8937658436015018e-05, "loss": 2.2336, "step": 143016 }, { "epoch": 0.89, "learning_rate": 2.8933685231019762e-05, "loss": 2.2132, "step": 143024 }, { "epoch": 0.89, "learning_rate": 2.8929712798336587e-05, "loss": 2.2363, "step": 143032 }, { "epoch": 0.89, "learning_rate": 2.8925741138064238e-05, "loss": 2.2336, "step": 143040 }, { "epoch": 0.89, "learning_rate": 2.8921770250301444e-05, "loss": 2.2313, "step": 143048 }, { "epoch": 0.89, "learning_rate": 2.8917800135146932e-05, "loss": 2.2378, "step": 143056 }, { "epoch": 0.89, "learning_rate": 2.8913830792699402e-05, "loss": 2.2302, "step": 143064 }, { "epoch": 0.89, "learning_rate": 2.8909862223057516e-05, "loss": 2.2015, "step": 143072 }, { "epoch": 0.89, "learning_rate": 2.8905894426319947e-05, "loss": 2.2182, "step": 143080 }, { "epoch": 0.89, "learning_rate": 2.8901927402585333e-05, "loss": 2.2177, "step": 143088 }, { "epoch": 0.89, "learning_rate": 2.889796115195229e-05, "loss": 2.2277, "step": 143096 }, { "epoch": 0.89, "learning_rate": 2.8893995674519425e-05, "loss": 2.2342, "step": 143104 }, { "epoch": 0.89, "learning_rate": 2.8890030970385317e-05, "loss": 2.2117, "step": 143112 }, { "epoch": 0.89, "learning_rate": 2.8886067039648522e-05, "loss": 2.2307, "step": 143120 }, { "epoch": 0.89, "learning_rate": 2.8882103882407602e-05, "loss": 2.2163, "step": 143128 }, { "epoch": 0.89, "learning_rate": 2.8878141498761063e-05, "loss": 2.2238, "step": 143136 }, { "epoch": 0.89, "learning_rate": 2.8874179888807435e-05, "loss": 2.228, "step": 143144 }, { "epoch": 0.89, "learning_rate": 2.887021905264517e-05, "loss": 2.2154, "step": 143152 }, { "epoch": 0.89, "learning_rate": 2.8866258990372745e-05, "loss": 2.229, "step": 143160 }, { "epoch": 0.89, "learning_rate": 2.8862299702088646e-05, "loss": 2.212, "step": 143168 }, { "epoch": 0.89, "learning_rate": 2.8858341187891237e-05, "loss": 2.2236, "step": 143176 }, { "epoch": 0.89, "learning_rate": 2.885438344787897e-05, "loss": 2.2187, "step": 143184 }, { "epoch": 0.89, "learning_rate": 2.8850426482150234e-05, "loss": 2.2305, "step": 143192 }, { "epoch": 0.9, "learning_rate": 2.8846470290803386e-05, "loss": 2.2206, "step": 143200 }, { "epoch": 0.9, "learning_rate": 2.884251487393679e-05, "loss": 2.2244, "step": 143208 }, { "epoch": 0.9, "learning_rate": 2.8838560231648748e-05, "loss": 2.2356, "step": 143216 }, { "epoch": 0.9, "learning_rate": 2.883460636403761e-05, "loss": 2.2346, "step": 143224 }, { "epoch": 0.9, "learning_rate": 2.8830653271201657e-05, "loss": 2.2143, "step": 143232 }, { "epoch": 0.9, "learning_rate": 2.8826700953239145e-05, "loss": 2.2213, "step": 143240 }, { "epoch": 0.9, "learning_rate": 2.882274941024836e-05, "loss": 2.2138, "step": 143248 }, { "epoch": 0.9, "learning_rate": 2.8818798642327527e-05, "loss": 2.2121, "step": 143256 }, { "epoch": 0.9, "learning_rate": 2.8814848649574838e-05, "loss": 2.2248, "step": 143264 }, { "epoch": 0.9, "learning_rate": 2.8810899432088524e-05, "loss": 2.2138, "step": 143272 }, { "epoch": 0.9, "learning_rate": 2.8806950989966752e-05, "loss": 2.2356, "step": 143280 }, { "epoch": 0.9, "learning_rate": 2.880300332330767e-05, "loss": 2.2175, "step": 143288 }, { "epoch": 0.9, "learning_rate": 2.879905643220943e-05, "loss": 2.2318, "step": 143296 }, { "epoch": 0.9, "learning_rate": 2.879511031677015e-05, "loss": 2.2371, "step": 143304 }, { "epoch": 0.9, "learning_rate": 2.879116497708792e-05, "loss": 2.2197, "step": 143312 }, { "epoch": 0.9, "learning_rate": 2.8787220413260842e-05, "loss": 2.2288, "step": 143320 }, { "epoch": 0.9, "learning_rate": 2.8783276625386963e-05, "loss": 2.222, "step": 143328 }, { "epoch": 0.9, "learning_rate": 2.877933361356432e-05, "loss": 2.2299, "step": 143336 }, { "epoch": 0.9, "learning_rate": 2.877539137789096e-05, "loss": 2.2053, "step": 143344 }, { "epoch": 0.9, "learning_rate": 2.8771449918464853e-05, "loss": 2.2276, "step": 143352 }, { "epoch": 0.9, "learning_rate": 2.876750923538404e-05, "loss": 2.2261, "step": 143360 }, { "epoch": 0.9, "learning_rate": 2.876356932874642e-05, "loss": 2.2273, "step": 143368 }, { "epoch": 0.9, "learning_rate": 2.875963019864998e-05, "loss": 2.2128, "step": 143376 }, { "epoch": 0.9, "learning_rate": 2.8755691845192645e-05, "loss": 2.2218, "step": 143384 }, { "epoch": 0.9, "learning_rate": 2.875175426847231e-05, "loss": 2.2393, "step": 143392 }, { "epoch": 0.9, "learning_rate": 2.8747817468586872e-05, "loss": 2.2408, "step": 143400 }, { "epoch": 0.9, "learning_rate": 2.874388144563419e-05, "loss": 2.2209, "step": 143408 }, { "epoch": 0.9, "learning_rate": 2.8739946199712136e-05, "loss": 2.2148, "step": 143416 }, { "epoch": 0.9, "learning_rate": 2.873601173091852e-05, "loss": 2.2272, "step": 143424 }, { "epoch": 0.9, "learning_rate": 2.8732078039351157e-05, "loss": 2.2393, "step": 143432 }, { "epoch": 0.9, "learning_rate": 2.8728145125107847e-05, "loss": 2.2293, "step": 143440 }, { "epoch": 0.9, "learning_rate": 2.872421298828636e-05, "loss": 2.2333, "step": 143448 }, { "epoch": 0.9, "learning_rate": 2.8720281628984435e-05, "loss": 2.2281, "step": 143456 }, { "epoch": 0.9, "learning_rate": 2.8716351047299832e-05, "loss": 2.2315, "step": 143464 }, { "epoch": 0.9, "learning_rate": 2.8712421243330245e-05, "loss": 2.2367, "step": 143472 }, { "epoch": 0.9, "learning_rate": 2.870849221717338e-05, "loss": 2.2313, "step": 143480 }, { "epoch": 0.9, "learning_rate": 2.8704563968926906e-05, "loss": 2.2104, "step": 143488 }, { "epoch": 0.9, "learning_rate": 2.870063649868849e-05, "loss": 2.2325, "step": 143496 }, { "epoch": 0.9, "learning_rate": 2.8696709806555744e-05, "loss": 2.2161, "step": 143504 }, { "epoch": 0.9, "learning_rate": 2.8692783892626323e-05, "loss": 2.2196, "step": 143512 }, { "epoch": 0.9, "learning_rate": 2.8688858756997805e-05, "loss": 2.2258, "step": 143520 }, { "epoch": 0.9, "learning_rate": 2.868493439976776e-05, "loss": 2.2221, "step": 143528 }, { "epoch": 0.9, "learning_rate": 2.8681010821033772e-05, "loss": 2.2247, "step": 143536 }, { "epoch": 0.9, "learning_rate": 2.867708802089335e-05, "loss": 2.2241, "step": 143544 }, { "epoch": 0.9, "learning_rate": 2.867316599944405e-05, "loss": 2.2211, "step": 143552 }, { "epoch": 0.9, "learning_rate": 2.8669244756783366e-05, "loss": 2.2008, "step": 143560 }, { "epoch": 0.9, "learning_rate": 2.8665324293008755e-05, "loss": 2.2302, "step": 143568 }, { "epoch": 0.9, "learning_rate": 2.8661404608217717e-05, "loss": 2.2273, "step": 143576 }, { "epoch": 0.9, "learning_rate": 2.865748570250766e-05, "loss": 2.2208, "step": 143584 }, { "epoch": 0.9, "learning_rate": 2.865356757597602e-05, "loss": 2.1996, "step": 143592 }, { "epoch": 0.9, "learning_rate": 2.8649650228720232e-05, "loss": 2.2326, "step": 143600 }, { "epoch": 0.9, "learning_rate": 2.8645733660837632e-05, "loss": 2.2282, "step": 143608 }, { "epoch": 0.9, "learning_rate": 2.8641817872425623e-05, "loss": 2.2269, "step": 143616 }, { "epoch": 0.9, "learning_rate": 2.8637902863581533e-05, "loss": 2.2095, "step": 143624 }, { "epoch": 0.9, "learning_rate": 2.8633988634402705e-05, "loss": 2.2395, "step": 143632 }, { "epoch": 0.9, "learning_rate": 2.8630075184986436e-05, "loss": 2.2184, "step": 143640 }, { "epoch": 0.9, "learning_rate": 2.862616251543001e-05, "loss": 2.2392, "step": 143648 }, { "epoch": 0.9, "learning_rate": 2.8622250625830715e-05, "loss": 2.2219, "step": 143656 }, { "epoch": 0.9, "learning_rate": 2.8618339516285785e-05, "loss": 2.2169, "step": 143664 }, { "epoch": 0.9, "learning_rate": 2.8614429186892454e-05, "loss": 2.2282, "step": 143672 }, { "epoch": 0.9, "learning_rate": 2.861051963774794e-05, "loss": 2.2143, "step": 143680 }, { "epoch": 0.9, "learning_rate": 2.860661086894943e-05, "loss": 2.2233, "step": 143688 }, { "epoch": 0.9, "learning_rate": 2.8602702880594085e-05, "loss": 2.2201, "step": 143696 }, { "epoch": 0.9, "learning_rate": 2.8598795672779077e-05, "loss": 2.2194, "step": 143704 }, { "epoch": 0.9, "learning_rate": 2.8594889245601543e-05, "loss": 2.214, "step": 143712 }, { "epoch": 0.9, "learning_rate": 2.8590983599158562e-05, "loss": 2.2203, "step": 143720 }, { "epoch": 0.9, "learning_rate": 2.858707873354727e-05, "loss": 2.2286, "step": 143728 }, { "epoch": 0.9, "learning_rate": 2.8583174648864724e-05, "loss": 2.2328, "step": 143736 }, { "epoch": 0.9, "learning_rate": 2.857927134520797e-05, "loss": 2.2247, "step": 143744 }, { "epoch": 0.9, "learning_rate": 2.8575368822674065e-05, "loss": 2.2144, "step": 143752 }, { "epoch": 0.9, "learning_rate": 2.8571467081360004e-05, "loss": 2.2322, "step": 143760 }, { "epoch": 0.9, "learning_rate": 2.856756612136282e-05, "loss": 2.2205, "step": 143768 }, { "epoch": 0.9, "learning_rate": 2.8563665942779454e-05, "loss": 2.2082, "step": 143776 }, { "epoch": 0.9, "learning_rate": 2.8559766545706873e-05, "loss": 2.2083, "step": 143784 }, { "epoch": 0.9, "learning_rate": 2.8555867930242054e-05, "loss": 2.2179, "step": 143792 }, { "epoch": 0.9, "learning_rate": 2.8551970096481852e-05, "loss": 2.2466, "step": 143800 }, { "epoch": 0.9, "learning_rate": 2.854807304452321e-05, "loss": 2.2098, "step": 143808 }, { "epoch": 0.9, "learning_rate": 2.854417677446302e-05, "loss": 2.2249, "step": 143816 }, { "epoch": 0.9, "learning_rate": 2.8540281286398102e-05, "loss": 2.2175, "step": 143824 }, { "epoch": 0.9, "learning_rate": 2.8536386580425334e-05, "loss": 2.2185, "step": 143832 }, { "epoch": 0.9, "learning_rate": 2.8532492656641513e-05, "loss": 2.2297, "step": 143840 }, { "epoch": 0.9, "learning_rate": 2.8528599515143467e-05, "loss": 2.222, "step": 143848 }, { "epoch": 0.9, "learning_rate": 2.8524707156027976e-05, "loss": 2.2134, "step": 143856 }, { "epoch": 0.9, "learning_rate": 2.852081557939177e-05, "loss": 2.2222, "step": 143864 }, { "epoch": 0.9, "learning_rate": 2.851692478533164e-05, "loss": 2.2141, "step": 143872 }, { "epoch": 0.9, "learning_rate": 2.8513034773944293e-05, "loss": 2.2289, "step": 143880 }, { "epoch": 0.9, "learning_rate": 2.8509145545326423e-05, "loss": 2.2233, "step": 143888 }, { "epoch": 0.9, "learning_rate": 2.850525709957474e-05, "loss": 2.2184, "step": 143896 }, { "epoch": 0.9, "learning_rate": 2.8501369436785895e-05, "loss": 2.2218, "step": 143904 }, { "epoch": 0.9, "learning_rate": 2.849748255705653e-05, "loss": 2.2303, "step": 143912 }, { "epoch": 0.9, "learning_rate": 2.8493596460483296e-05, "loss": 2.2377, "step": 143920 }, { "epoch": 0.9, "learning_rate": 2.848971114716279e-05, "loss": 2.2244, "step": 143928 }, { "epoch": 0.9, "learning_rate": 2.8485826617191586e-05, "loss": 2.2122, "step": 143936 }, { "epoch": 0.9, "learning_rate": 2.848194287066628e-05, "loss": 2.2261, "step": 143944 }, { "epoch": 0.9, "learning_rate": 2.847805990768341e-05, "loss": 2.2184, "step": 143952 }, { "epoch": 0.9, "learning_rate": 2.8474177728339497e-05, "loss": 2.2128, "step": 143960 }, { "epoch": 0.9, "learning_rate": 2.8470296332731072e-05, "loss": 2.2284, "step": 143968 }, { "epoch": 0.9, "learning_rate": 2.846641572095461e-05, "loss": 2.2142, "step": 143976 }, { "epoch": 0.9, "learning_rate": 2.8462535893106613e-05, "loss": 2.236, "step": 143984 }, { "epoch": 0.9, "learning_rate": 2.845865684928349e-05, "loss": 2.2169, "step": 143992 }, { "epoch": 0.9, "learning_rate": 2.8454778589581695e-05, "loss": 2.2187, "step": 144000 }, { "epoch": 0.9, "learning_rate": 2.8450901114097667e-05, "loss": 2.2323, "step": 144008 }, { "epoch": 0.9, "learning_rate": 2.8447024422927748e-05, "loss": 2.2261, "step": 144016 }, { "epoch": 0.9, "learning_rate": 2.844314851616835e-05, "loss": 2.2076, "step": 144024 }, { "epoch": 0.9, "learning_rate": 2.8439273393915843e-05, "loss": 2.2237, "step": 144032 }, { "epoch": 0.9, "learning_rate": 2.8435399056266514e-05, "loss": 2.2179, "step": 144040 }, { "epoch": 0.9, "learning_rate": 2.843152550331672e-05, "loss": 2.2303, "step": 144048 }, { "epoch": 0.9, "learning_rate": 2.842765273516273e-05, "loss": 2.2405, "step": 144056 }, { "epoch": 0.9, "learning_rate": 2.8423780751900853e-05, "loss": 2.2319, "step": 144064 }, { "epoch": 0.9, "learning_rate": 2.841990955362732e-05, "loss": 2.2238, "step": 144072 }, { "epoch": 0.9, "learning_rate": 2.8416039140438378e-05, "loss": 2.2284, "step": 144080 }, { "epoch": 0.9, "learning_rate": 2.8412169512430248e-05, "loss": 2.2072, "step": 144088 }, { "epoch": 0.9, "learning_rate": 2.840830066969913e-05, "loss": 2.2342, "step": 144096 }, { "epoch": 0.9, "learning_rate": 2.8404432612341198e-05, "loss": 2.2207, "step": 144104 }, { "epoch": 0.9, "learning_rate": 2.8400565340452616e-05, "loss": 2.2148, "step": 144112 }, { "epoch": 0.9, "learning_rate": 2.839669885412953e-05, "loss": 2.2242, "step": 144120 }, { "epoch": 0.9, "learning_rate": 2.8392833153468052e-05, "loss": 2.239, "step": 144128 }, { "epoch": 0.9, "learning_rate": 2.8388968238564297e-05, "loss": 2.2163, "step": 144136 }, { "epoch": 0.9, "learning_rate": 2.838510410951433e-05, "loss": 2.215, "step": 144144 }, { "epoch": 0.9, "learning_rate": 2.838124076641422e-05, "loss": 2.2352, "step": 144152 }, { "epoch": 0.9, "learning_rate": 2.8377378209360016e-05, "loss": 2.2261, "step": 144160 }, { "epoch": 0.9, "learning_rate": 2.837351643844774e-05, "loss": 2.2042, "step": 144168 }, { "epoch": 0.9, "learning_rate": 2.836965545377338e-05, "loss": 2.2233, "step": 144176 }, { "epoch": 0.9, "learning_rate": 2.8365795255432948e-05, "loss": 2.2326, "step": 144184 }, { "epoch": 0.9, "learning_rate": 2.8361935843522385e-05, "loss": 2.2243, "step": 144192 }, { "epoch": 0.9, "learning_rate": 2.8358077218137668e-05, "loss": 2.214, "step": 144200 }, { "epoch": 0.9, "learning_rate": 2.835421937937468e-05, "loss": 2.228, "step": 144208 }, { "epoch": 0.9, "learning_rate": 2.835036232732935e-05, "loss": 2.2348, "step": 144216 }, { "epoch": 0.9, "learning_rate": 2.8346506062097588e-05, "loss": 2.2103, "step": 144224 }, { "epoch": 0.9, "learning_rate": 2.834265058377521e-05, "loss": 2.2253, "step": 144232 }, { "epoch": 0.9, "learning_rate": 2.833879589245809e-05, "loss": 2.2418, "step": 144240 }, { "epoch": 0.9, "learning_rate": 2.8334941988242068e-05, "loss": 2.2345, "step": 144248 }, { "epoch": 0.9, "learning_rate": 2.8331088871222945e-05, "loss": 2.2394, "step": 144256 }, { "epoch": 0.9, "learning_rate": 2.83272365414965e-05, "loss": 2.206, "step": 144264 }, { "epoch": 0.9, "learning_rate": 2.8323384999158496e-05, "loss": 2.2406, "step": 144272 }, { "epoch": 0.9, "learning_rate": 2.8319534244304714e-05, "loss": 2.226, "step": 144280 }, { "epoch": 0.9, "learning_rate": 2.8315684277030864e-05, "loss": 2.2459, "step": 144288 }, { "epoch": 0.9, "learning_rate": 2.8311835097432643e-05, "loss": 2.2492, "step": 144296 }, { "epoch": 0.9, "learning_rate": 2.8307986705605766e-05, "loss": 2.2203, "step": 144304 }, { "epoch": 0.9, "learning_rate": 2.8304139101645897e-05, "loss": 2.2317, "step": 144312 }, { "epoch": 0.9, "learning_rate": 2.8300292285648677e-05, "loss": 2.2163, "step": 144320 }, { "epoch": 0.9, "learning_rate": 2.829644625770976e-05, "loss": 2.2401, "step": 144328 }, { "epoch": 0.9, "learning_rate": 2.8292601017924742e-05, "loss": 2.2264, "step": 144336 }, { "epoch": 0.9, "learning_rate": 2.8288756566389206e-05, "loss": 2.2364, "step": 144344 }, { "epoch": 0.9, "learning_rate": 2.8284912903198757e-05, "loss": 2.2225, "step": 144352 }, { "epoch": 0.9, "learning_rate": 2.828107002844893e-05, "loss": 2.227, "step": 144360 }, { "epoch": 0.9, "learning_rate": 2.827722794223525e-05, "loss": 2.2298, "step": 144368 }, { "epoch": 0.9, "learning_rate": 2.8273386644653253e-05, "loss": 2.2429, "step": 144376 }, { "epoch": 0.9, "learning_rate": 2.8269546135798426e-05, "loss": 2.2207, "step": 144384 }, { "epoch": 0.9, "learning_rate": 2.8265706415766223e-05, "loss": 2.2186, "step": 144392 }, { "epoch": 0.9, "learning_rate": 2.8261867484652138e-05, "loss": 2.2341, "step": 144400 }, { "epoch": 0.9, "learning_rate": 2.8258029342551578e-05, "loss": 2.2376, "step": 144408 }, { "epoch": 0.9, "learning_rate": 2.8254191989559993e-05, "loss": 2.2249, "step": 144416 }, { "epoch": 0.9, "learning_rate": 2.825035542577273e-05, "loss": 2.2199, "step": 144424 }, { "epoch": 0.9, "learning_rate": 2.82465196512852e-05, "loss": 2.2229, "step": 144432 }, { "epoch": 0.9, "learning_rate": 2.8242684666192764e-05, "loss": 2.2199, "step": 144440 }, { "epoch": 0.9, "learning_rate": 2.8238850470590738e-05, "loss": 2.224, "step": 144448 }, { "epoch": 0.9, "learning_rate": 2.823501706457446e-05, "loss": 2.2381, "step": 144456 }, { "epoch": 0.9, "learning_rate": 2.8231184448239212e-05, "loss": 2.2397, "step": 144464 }, { "epoch": 0.9, "learning_rate": 2.822735262168029e-05, "loss": 2.2292, "step": 144472 }, { "epoch": 0.9, "learning_rate": 2.822352158499295e-05, "loss": 2.2273, "step": 144480 }, { "epoch": 0.9, "learning_rate": 2.8219691338272425e-05, "loss": 2.2346, "step": 144488 }, { "epoch": 0.9, "learning_rate": 2.8215861881613937e-05, "loss": 2.2383, "step": 144496 }, { "epoch": 0.9, "learning_rate": 2.8212033215112698e-05, "loss": 2.2358, "step": 144504 }, { "epoch": 0.9, "learning_rate": 2.8208205338863864e-05, "loss": 2.225, "step": 144512 }, { "epoch": 0.9, "learning_rate": 2.8204378252962626e-05, "loss": 2.2253, "step": 144520 }, { "epoch": 0.9, "learning_rate": 2.8200551957504107e-05, "loss": 2.2288, "step": 144528 }, { "epoch": 0.9, "learning_rate": 2.8196726452583427e-05, "loss": 2.2378, "step": 144536 }, { "epoch": 0.9, "learning_rate": 2.8192901738295708e-05, "loss": 2.2396, "step": 144544 }, { "epoch": 0.9, "learning_rate": 2.818907781473602e-05, "loss": 2.2169, "step": 144552 }, { "epoch": 0.9, "learning_rate": 2.8185254681999416e-05, "loss": 2.2238, "step": 144560 }, { "epoch": 0.9, "learning_rate": 2.818143234018096e-05, "loss": 2.2359, "step": 144568 }, { "epoch": 0.9, "learning_rate": 2.8177610789375662e-05, "loss": 2.229, "step": 144576 }, { "epoch": 0.9, "learning_rate": 2.8173790029678527e-05, "loss": 2.2296, "step": 144584 }, { "epoch": 0.9, "learning_rate": 2.816997006118455e-05, "loss": 2.2334, "step": 144592 }, { "epoch": 0.9, "learning_rate": 2.8166150883988678e-05, "loss": 2.2254, "step": 144600 }, { "epoch": 0.9, "learning_rate": 2.8162332498185888e-05, "loss": 2.2362, "step": 144608 }, { "epoch": 0.9, "learning_rate": 2.8158514903871057e-05, "loss": 2.2421, "step": 144616 }, { "epoch": 0.9, "learning_rate": 2.8154698101139127e-05, "loss": 2.2439, "step": 144624 }, { "epoch": 0.9, "learning_rate": 2.815088209008499e-05, "loss": 2.2219, "step": 144632 }, { "epoch": 0.9, "learning_rate": 2.8147066870803484e-05, "loss": 2.2452, "step": 144640 }, { "epoch": 0.9, "learning_rate": 2.8143252443389467e-05, "loss": 2.2233, "step": 144648 }, { "epoch": 0.9, "learning_rate": 2.8139438807937783e-05, "loss": 2.2308, "step": 144656 }, { "epoch": 0.9, "learning_rate": 2.813562596454321e-05, "loss": 2.2297, "step": 144664 }, { "epoch": 0.9, "learning_rate": 2.813181391330056e-05, "loss": 2.2447, "step": 144672 }, { "epoch": 0.9, "learning_rate": 2.8128002654304574e-05, "loss": 2.2251, "step": 144680 }, { "epoch": 0.9, "learning_rate": 2.8124192187650038e-05, "loss": 2.226, "step": 144688 }, { "epoch": 0.9, "learning_rate": 2.812038251343166e-05, "loss": 2.2196, "step": 144696 }, { "epoch": 0.9, "learning_rate": 2.8116573631744135e-05, "loss": 2.225, "step": 144704 }, { "epoch": 0.9, "learning_rate": 2.811276554268218e-05, "loss": 2.2297, "step": 144712 }, { "epoch": 0.9, "learning_rate": 2.810895824634045e-05, "loss": 2.2325, "step": 144720 }, { "epoch": 0.9, "learning_rate": 2.8105151742813586e-05, "loss": 2.2336, "step": 144728 }, { "epoch": 0.9, "learning_rate": 2.810134603219624e-05, "loss": 2.2385, "step": 144736 }, { "epoch": 0.9, "learning_rate": 2.8097541114583004e-05, "loss": 2.2199, "step": 144744 }, { "epoch": 0.9, "learning_rate": 2.8093736990068474e-05, "loss": 2.2232, "step": 144752 }, { "epoch": 0.9, "learning_rate": 2.808993365874723e-05, "loss": 2.2293, "step": 144760 }, { "epoch": 0.9, "learning_rate": 2.808613112071381e-05, "loss": 2.2282, "step": 144768 }, { "epoch": 0.9, "learning_rate": 2.8082329376062743e-05, "loss": 2.2074, "step": 144776 }, { "epoch": 0.9, "learning_rate": 2.807852842488856e-05, "loss": 2.2361, "step": 144784 }, { "epoch": 0.9, "learning_rate": 2.8074728267285743e-05, "loss": 2.2148, "step": 144792 }, { "epoch": 0.91, "learning_rate": 2.807092890334876e-05, "loss": 2.2451, "step": 144800 }, { "epoch": 0.91, "learning_rate": 2.806713033317207e-05, "loss": 2.2267, "step": 144808 }, { "epoch": 0.91, "learning_rate": 2.8063332556850092e-05, "loss": 2.2271, "step": 144816 }, { "epoch": 0.91, "learning_rate": 2.8059535574477268e-05, "loss": 2.223, "step": 144824 }, { "epoch": 0.91, "learning_rate": 2.8055739386147955e-05, "loss": 2.2488, "step": 144832 }, { "epoch": 0.91, "learning_rate": 2.8051943991956543e-05, "loss": 2.2144, "step": 144840 }, { "epoch": 0.91, "learning_rate": 2.8048149391997413e-05, "loss": 2.2254, "step": 144848 }, { "epoch": 0.91, "learning_rate": 2.8044355586364852e-05, "loss": 2.2366, "step": 144856 }, { "epoch": 0.91, "learning_rate": 2.8040562575153196e-05, "loss": 2.238, "step": 144864 }, { "epoch": 0.91, "learning_rate": 2.803677035845676e-05, "loss": 2.2164, "step": 144872 }, { "epoch": 0.91, "learning_rate": 2.803297893636978e-05, "loss": 2.2172, "step": 144880 }, { "epoch": 0.91, "learning_rate": 2.8029188308986536e-05, "loss": 2.2191, "step": 144888 }, { "epoch": 0.91, "learning_rate": 2.8025398476401256e-05, "loss": 2.2278, "step": 144896 }, { "epoch": 0.91, "learning_rate": 2.8021609438708156e-05, "loss": 2.2406, "step": 144904 }, { "epoch": 0.91, "learning_rate": 2.8017821196001444e-05, "loss": 2.2303, "step": 144912 }, { "epoch": 0.91, "learning_rate": 2.801403374837527e-05, "loss": 2.201, "step": 144920 }, { "epoch": 0.91, "learning_rate": 2.8010247095923815e-05, "loss": 2.224, "step": 144928 }, { "epoch": 0.91, "learning_rate": 2.800646123874121e-05, "loss": 2.2179, "step": 144936 }, { "epoch": 0.91, "learning_rate": 2.800267617692156e-05, "loss": 2.2353, "step": 144944 }, { "epoch": 0.91, "learning_rate": 2.7998891910558978e-05, "loss": 2.2214, "step": 144952 }, { "epoch": 0.91, "learning_rate": 2.799510843974753e-05, "loss": 2.237, "step": 144960 }, { "epoch": 0.91, "learning_rate": 2.7991325764581265e-05, "loss": 2.2173, "step": 144968 }, { "epoch": 0.91, "learning_rate": 2.7987543885154248e-05, "loss": 2.195, "step": 144976 }, { "epoch": 0.91, "learning_rate": 2.7983762801560482e-05, "loss": 2.2114, "step": 144984 }, { "epoch": 0.91, "learning_rate": 2.7979982513893955e-05, "loss": 2.2317, "step": 144992 }, { "epoch": 0.91, "learning_rate": 2.797620302224866e-05, "loss": 2.1975, "step": 145000 }, { "epoch": 0.91, "learning_rate": 2.797242432671856e-05, "loss": 2.2209, "step": 145008 }, { "epoch": 0.91, "learning_rate": 2.7968646427397566e-05, "loss": 2.2203, "step": 145016 }, { "epoch": 0.91, "learning_rate": 2.7964869324379628e-05, "loss": 2.216, "step": 145024 }, { "epoch": 0.91, "learning_rate": 2.796109301775862e-05, "loss": 2.2169, "step": 145032 }, { "epoch": 0.91, "learning_rate": 2.7957317507628465e-05, "loss": 2.2488, "step": 145040 }, { "epoch": 0.91, "learning_rate": 2.7953542794082964e-05, "loss": 2.2352, "step": 145048 }, { "epoch": 0.91, "learning_rate": 2.7949768877215988e-05, "loss": 2.2122, "step": 145056 }, { "epoch": 0.91, "learning_rate": 2.7945995757121375e-05, "loss": 2.2184, "step": 145064 }, { "epoch": 0.91, "learning_rate": 2.794222343389288e-05, "loss": 2.2153, "step": 145072 }, { "epoch": 0.91, "learning_rate": 2.7938451907624303e-05, "loss": 2.2365, "step": 145080 }, { "epoch": 0.91, "learning_rate": 2.793468117840943e-05, "loss": 2.2115, "step": 145088 }, { "epoch": 0.91, "learning_rate": 2.7930911246341966e-05, "loss": 2.2155, "step": 145096 }, { "epoch": 0.91, "learning_rate": 2.792714211151566e-05, "loss": 2.2285, "step": 145104 }, { "epoch": 0.91, "learning_rate": 2.792337377402418e-05, "loss": 2.2374, "step": 145112 }, { "epoch": 0.91, "learning_rate": 2.7919606233961243e-05, "loss": 2.2169, "step": 145120 }, { "epoch": 0.91, "learning_rate": 2.791583949142049e-05, "loss": 2.2246, "step": 145128 }, { "epoch": 0.91, "learning_rate": 2.7912073546495564e-05, "loss": 2.2235, "step": 145136 }, { "epoch": 0.91, "learning_rate": 2.7908308399280093e-05, "loss": 2.2111, "step": 145144 }, { "epoch": 0.91, "learning_rate": 2.7904544049867676e-05, "loss": 2.2167, "step": 145152 }, { "epoch": 0.91, "learning_rate": 2.7900780498351886e-05, "loss": 2.2403, "step": 145160 }, { "epoch": 0.91, "learning_rate": 2.789701774482631e-05, "loss": 2.2305, "step": 145168 }, { "epoch": 0.91, "learning_rate": 2.7893255789384464e-05, "loss": 2.217, "step": 145176 }, { "epoch": 0.91, "learning_rate": 2.7889494632119877e-05, "loss": 2.2179, "step": 145184 }, { "epoch": 0.91, "learning_rate": 2.7885734273126068e-05, "loss": 2.2098, "step": 145192 }, { "epoch": 0.91, "learning_rate": 2.7881974712496513e-05, "loss": 2.2121, "step": 145200 }, { "epoch": 0.91, "learning_rate": 2.787821595032465e-05, "loss": 2.2178, "step": 145208 }, { "epoch": 0.91, "learning_rate": 2.7874457986703962e-05, "loss": 2.2133, "step": 145216 }, { "epoch": 0.91, "learning_rate": 2.7870700821727845e-05, "loss": 2.221, "step": 145224 }, { "epoch": 0.91, "learning_rate": 2.7866944455489697e-05, "loss": 2.2378, "step": 145232 }, { "epoch": 0.91, "learning_rate": 2.7863188888082937e-05, "loss": 2.2112, "step": 145240 }, { "epoch": 0.91, "learning_rate": 2.7859434119600885e-05, "loss": 2.2113, "step": 145248 }, { "epoch": 0.91, "learning_rate": 2.7855680150136932e-05, "loss": 2.2272, "step": 145256 }, { "epoch": 0.91, "learning_rate": 2.785192697978436e-05, "loss": 2.2019, "step": 145264 }, { "epoch": 0.91, "learning_rate": 2.784817460863649e-05, "loss": 2.2268, "step": 145272 }, { "epoch": 0.91, "learning_rate": 2.7844423036786628e-05, "loss": 2.2266, "step": 145280 }, { "epoch": 0.91, "learning_rate": 2.7840672264327988e-05, "loss": 2.221, "step": 145288 }, { "epoch": 0.91, "learning_rate": 2.7836922291353863e-05, "loss": 2.2165, "step": 145296 }, { "epoch": 0.91, "learning_rate": 2.7833173117957438e-05, "loss": 2.2108, "step": 145304 }, { "epoch": 0.91, "learning_rate": 2.7829424744231957e-05, "loss": 2.2249, "step": 145312 }, { "epoch": 0.91, "learning_rate": 2.7825677170270587e-05, "loss": 2.2242, "step": 145320 }, { "epoch": 0.91, "learning_rate": 2.782193039616648e-05, "loss": 2.2312, "step": 145328 }, { "epoch": 0.91, "learning_rate": 2.7818184422012804e-05, "loss": 2.2266, "step": 145336 }, { "epoch": 0.91, "learning_rate": 2.7814439247902673e-05, "loss": 2.2022, "step": 145344 }, { "epoch": 0.91, "learning_rate": 2.7810694873929182e-05, "loss": 2.2277, "step": 145352 }, { "epoch": 0.91, "learning_rate": 2.780695130018544e-05, "loss": 2.2282, "step": 145360 }, { "epoch": 0.91, "learning_rate": 2.78032085267645e-05, "loss": 2.2143, "step": 145368 }, { "epoch": 0.91, "learning_rate": 2.77994665537594e-05, "loss": 2.2318, "step": 145376 }, { "epoch": 0.91, "learning_rate": 2.779572538126318e-05, "loss": 2.2323, "step": 145384 }, { "epoch": 0.91, "learning_rate": 2.779198500936885e-05, "loss": 2.2203, "step": 145392 }, { "epoch": 0.91, "learning_rate": 2.7788245438169363e-05, "loss": 2.2265, "step": 145400 }, { "epoch": 0.91, "learning_rate": 2.778450666775773e-05, "loss": 2.2368, "step": 145408 }, { "epoch": 0.91, "learning_rate": 2.7780768698226872e-05, "loss": 2.2152, "step": 145416 }, { "epoch": 0.91, "learning_rate": 2.7777031529669705e-05, "loss": 2.2139, "step": 145424 }, { "epoch": 0.91, "learning_rate": 2.7773295162179162e-05, "loss": 2.2234, "step": 145432 }, { "epoch": 0.91, "learning_rate": 2.776955959584811e-05, "loss": 2.225, "step": 145440 }, { "epoch": 0.91, "learning_rate": 2.7765824830769434e-05, "loss": 2.229, "step": 145448 }, { "epoch": 0.91, "learning_rate": 2.776209086703596e-05, "loss": 2.2064, "step": 145456 }, { "epoch": 0.91, "learning_rate": 2.7758357704740524e-05, "loss": 2.2007, "step": 145464 }, { "epoch": 0.91, "learning_rate": 2.775462534397595e-05, "loss": 2.2326, "step": 145472 }, { "epoch": 0.91, "learning_rate": 2.775089378483498e-05, "loss": 2.2288, "step": 145480 }, { "epoch": 0.91, "learning_rate": 2.7747163027410416e-05, "loss": 2.2126, "step": 145488 }, { "epoch": 0.91, "learning_rate": 2.7743433071795017e-05, "loss": 2.2338, "step": 145496 }, { "epoch": 0.91, "learning_rate": 2.773970391808147e-05, "loss": 2.2341, "step": 145504 }, { "epoch": 0.91, "learning_rate": 2.7735975566362514e-05, "loss": 2.2333, "step": 145512 }, { "epoch": 0.91, "learning_rate": 2.773224801673082e-05, "loss": 2.2267, "step": 145520 }, { "epoch": 0.91, "learning_rate": 2.7728521269279067e-05, "loss": 2.2307, "step": 145528 }, { "epoch": 0.91, "learning_rate": 2.7724795324099894e-05, "loss": 2.2236, "step": 145536 }, { "epoch": 0.91, "learning_rate": 2.7721070181285917e-05, "loss": 2.2259, "step": 145544 }, { "epoch": 0.91, "learning_rate": 2.7717345840929776e-05, "loss": 2.2302, "step": 145552 }, { "epoch": 0.91, "learning_rate": 2.7713622303124037e-05, "loss": 2.2217, "step": 145560 }, { "epoch": 0.91, "learning_rate": 2.7709899567961257e-05, "loss": 2.2181, "step": 145568 }, { "epoch": 0.91, "learning_rate": 2.7706177635534004e-05, "loss": 2.23, "step": 145576 }, { "epoch": 0.91, "learning_rate": 2.7702456505934803e-05, "loss": 2.2137, "step": 145584 }, { "epoch": 0.91, "learning_rate": 2.7698736179256148e-05, "loss": 2.2394, "step": 145592 }, { "epoch": 0.91, "learning_rate": 2.7695016655590544e-05, "loss": 2.2096, "step": 145600 }, { "epoch": 0.91, "learning_rate": 2.7691297935030447e-05, "loss": 2.2266, "step": 145608 }, { "epoch": 0.91, "learning_rate": 2.7687580017668302e-05, "loss": 2.2238, "step": 145616 }, { "epoch": 0.91, "learning_rate": 2.768386290359655e-05, "loss": 2.2422, "step": 145624 }, { "epoch": 0.91, "learning_rate": 2.76801465929076e-05, "loss": 2.2321, "step": 145632 }, { "epoch": 0.91, "learning_rate": 2.7676431085693815e-05, "loss": 2.2289, "step": 145640 }, { "epoch": 0.91, "learning_rate": 2.767271638204759e-05, "loss": 2.2241, "step": 145648 }, { "epoch": 0.91, "learning_rate": 2.7669002482061257e-05, "loss": 2.221, "step": 145656 }, { "epoch": 0.91, "learning_rate": 2.7665289385827164e-05, "loss": 2.2232, "step": 145664 }, { "epoch": 0.91, "learning_rate": 2.766157709343759e-05, "loss": 2.2269, "step": 145672 }, { "epoch": 0.91, "learning_rate": 2.7657865604984835e-05, "loss": 2.2201, "step": 145680 }, { "epoch": 0.91, "learning_rate": 2.765415492056119e-05, "loss": 2.215, "step": 145688 }, { "epoch": 0.91, "learning_rate": 2.7650445040258865e-05, "loss": 2.2272, "step": 145696 }, { "epoch": 0.91, "learning_rate": 2.7646735964170102e-05, "loss": 2.2226, "step": 145704 }, { "epoch": 0.91, "learning_rate": 2.7643027692387137e-05, "loss": 2.2232, "step": 145712 }, { "epoch": 0.91, "learning_rate": 2.7639320225002108e-05, "loss": 2.2296, "step": 145720 }, { "epoch": 0.91, "learning_rate": 2.763561356210722e-05, "loss": 2.214, "step": 145728 }, { "epoch": 0.91, "learning_rate": 2.7631907703794602e-05, "loss": 2.236, "step": 145736 }, { "epoch": 0.91, "learning_rate": 2.7628202650156405e-05, "loss": 2.2137, "step": 145744 }, { "epoch": 0.91, "learning_rate": 2.7624498401284716e-05, "loss": 2.2076, "step": 145752 }, { "epoch": 0.91, "learning_rate": 2.7620794957271624e-05, "loss": 2.2263, "step": 145760 }, { "epoch": 0.91, "learning_rate": 2.761709231820921e-05, "loss": 2.2162, "step": 145768 }, { "epoch": 0.91, "learning_rate": 2.7613390484189516e-05, "loss": 2.2128, "step": 145776 }, { "epoch": 0.91, "learning_rate": 2.7609689455304554e-05, "loss": 2.2234, "step": 145784 }, { "epoch": 0.91, "learning_rate": 2.7605989231646356e-05, "loss": 2.2379, "step": 145792 }, { "epoch": 0.91, "learning_rate": 2.7602289813306902e-05, "loss": 2.2185, "step": 145800 }, { "epoch": 0.91, "learning_rate": 2.7598591200378148e-05, "loss": 2.2083, "step": 145808 }, { "epoch": 0.91, "learning_rate": 2.7594893392952065e-05, "loss": 2.2112, "step": 145816 }, { "epoch": 0.91, "learning_rate": 2.7591196391120567e-05, "loss": 2.2342, "step": 145824 }, { "epoch": 0.91, "learning_rate": 2.7587500194975553e-05, "loss": 2.2143, "step": 145832 }, { "epoch": 0.91, "learning_rate": 2.7583804804608925e-05, "loss": 2.222, "step": 145840 }, { "epoch": 0.91, "learning_rate": 2.7580110220112554e-05, "loss": 2.2223, "step": 145848 }, { "epoch": 0.91, "learning_rate": 2.757641644157827e-05, "loss": 2.2256, "step": 145856 }, { "epoch": 0.91, "learning_rate": 2.7572723469097916e-05, "loss": 2.2329, "step": 145864 }, { "epoch": 0.91, "learning_rate": 2.756903130276329e-05, "loss": 2.2404, "step": 145872 }, { "epoch": 0.91, "learning_rate": 2.7565339942666198e-05, "loss": 2.2283, "step": 145880 }, { "epoch": 0.91, "learning_rate": 2.756164938889838e-05, "loss": 2.2443, "step": 145888 }, { "epoch": 0.91, "learning_rate": 2.755795964155159e-05, "loss": 2.2198, "step": 145896 }, { "epoch": 0.91, "learning_rate": 2.7554270700717593e-05, "loss": 2.206, "step": 145904 }, { "epoch": 0.91, "learning_rate": 2.7550582566488043e-05, "loss": 2.2204, "step": 145912 }, { "epoch": 0.91, "learning_rate": 2.754689523895465e-05, "loss": 2.2317, "step": 145920 }, { "epoch": 0.91, "learning_rate": 2.75432087182091e-05, "loss": 2.2313, "step": 145928 }, { "epoch": 0.91, "learning_rate": 2.7539523004343008e-05, "loss": 2.2184, "step": 145936 }, { "epoch": 0.91, "learning_rate": 2.7535838097448026e-05, "loss": 2.2115, "step": 145944 }, { "epoch": 0.91, "learning_rate": 2.753215399761574e-05, "loss": 2.2208, "step": 145952 }, { "epoch": 0.91, "learning_rate": 2.752847070493776e-05, "loss": 2.2275, "step": 145960 }, { "epoch": 0.91, "learning_rate": 2.752478821950564e-05, "loss": 2.219, "step": 145968 }, { "epoch": 0.91, "learning_rate": 2.7521106541410913e-05, "loss": 2.2237, "step": 145976 }, { "epoch": 0.91, "learning_rate": 2.751742567074514e-05, "loss": 2.2341, "step": 145984 }, { "epoch": 0.91, "learning_rate": 2.7513745607599807e-05, "loss": 2.2306, "step": 145992 }, { "epoch": 0.91, "learning_rate": 2.7510066352066388e-05, "loss": 2.2276, "step": 146000 }, { "epoch": 0.91, "learning_rate": 2.750638790423638e-05, "loss": 2.2282, "step": 146008 }, { "epoch": 0.91, "learning_rate": 2.7502710264201215e-05, "loss": 2.2194, "step": 146016 }, { "epoch": 0.91, "learning_rate": 2.7499033432052308e-05, "loss": 2.221, "step": 146024 }, { "epoch": 0.91, "learning_rate": 2.7495357407881082e-05, "loss": 2.2328, "step": 146032 }, { "epoch": 0.91, "learning_rate": 2.7491682191778922e-05, "loss": 2.2323, "step": 146040 }, { "epoch": 0.91, "learning_rate": 2.748800778383718e-05, "loss": 2.2244, "step": 146048 }, { "epoch": 0.91, "learning_rate": 2.748433418414722e-05, "loss": 2.2145, "step": 146056 }, { "epoch": 0.91, "learning_rate": 2.7480661392800368e-05, "loss": 2.2148, "step": 146064 }, { "epoch": 0.91, "learning_rate": 2.7476989409887898e-05, "loss": 2.2204, "step": 146072 }, { "epoch": 0.91, "learning_rate": 2.7473318235501146e-05, "loss": 2.2242, "step": 146080 }, { "epoch": 0.91, "learning_rate": 2.746964786973133e-05, "loss": 2.246, "step": 146088 }, { "epoch": 0.91, "learning_rate": 2.7465978312669745e-05, "loss": 2.2226, "step": 146096 }, { "epoch": 0.91, "learning_rate": 2.746230956440756e-05, "loss": 2.2384, "step": 146104 }, { "epoch": 0.91, "learning_rate": 2.745864162503602e-05, "loss": 2.2258, "step": 146112 }, { "epoch": 0.91, "learning_rate": 2.745497449464632e-05, "loss": 2.2215, "step": 146120 }, { "epoch": 0.91, "learning_rate": 2.7451308173329583e-05, "loss": 2.209, "step": 146128 }, { "epoch": 0.91, "learning_rate": 2.7447642661176988e-05, "loss": 2.216, "step": 146136 }, { "epoch": 0.91, "learning_rate": 2.7443977958279633e-05, "loss": 2.2154, "step": 146144 }, { "epoch": 0.91, "learning_rate": 2.744031406472865e-05, "loss": 2.2397, "step": 146152 }, { "epoch": 0.91, "learning_rate": 2.743665098061512e-05, "loss": 2.2232, "step": 146160 }, { "epoch": 0.91, "learning_rate": 2.7432988706030083e-05, "loss": 2.2233, "step": 146168 }, { "epoch": 0.91, "learning_rate": 2.7429327241064614e-05, "loss": 2.2448, "step": 146176 }, { "epoch": 0.91, "learning_rate": 2.742566658580972e-05, "loss": 2.2319, "step": 146184 }, { "epoch": 0.91, "learning_rate": 2.7422006740356404e-05, "loss": 2.2209, "step": 146192 }, { "epoch": 0.91, "learning_rate": 2.7418347704795665e-05, "loss": 2.2204, "step": 146200 }, { "epoch": 0.91, "learning_rate": 2.7414689479218458e-05, "loss": 2.2342, "step": 146208 }, { "epoch": 0.91, "learning_rate": 2.7411032063715712e-05, "loss": 2.2258, "step": 146216 }, { "epoch": 0.91, "learning_rate": 2.740737545837838e-05, "loss": 2.2252, "step": 146224 }, { "epoch": 0.91, "learning_rate": 2.740371966329735e-05, "loss": 2.2271, "step": 146232 }, { "epoch": 0.91, "learning_rate": 2.74000646785635e-05, "loss": 2.2207, "step": 146240 }, { "epoch": 0.91, "learning_rate": 2.73964105042677e-05, "loss": 2.2254, "step": 146248 }, { "epoch": 0.91, "learning_rate": 2.7392757140500803e-05, "loss": 2.2264, "step": 146256 }, { "epoch": 0.91, "learning_rate": 2.7389104587353604e-05, "loss": 2.2343, "step": 146264 }, { "epoch": 0.91, "learning_rate": 2.7385452844916936e-05, "loss": 2.2444, "step": 146272 }, { "epoch": 0.91, "learning_rate": 2.7381801913281575e-05, "loss": 2.2301, "step": 146280 }, { "epoch": 0.91, "learning_rate": 2.7378151792538264e-05, "loss": 2.2268, "step": 146288 }, { "epoch": 0.91, "learning_rate": 2.737450248277777e-05, "loss": 2.2186, "step": 146296 }, { "epoch": 0.91, "learning_rate": 2.7370853984090793e-05, "loss": 2.2344, "step": 146304 }, { "epoch": 0.91, "learning_rate": 2.7367206296568065e-05, "loss": 2.2101, "step": 146312 }, { "epoch": 0.91, "learning_rate": 2.736355942030024e-05, "loss": 2.2301, "step": 146320 }, { "epoch": 0.91, "learning_rate": 2.7359913355377976e-05, "loss": 2.2187, "step": 146328 }, { "epoch": 0.91, "learning_rate": 2.7356268101891958e-05, "loss": 2.2245, "step": 146336 }, { "epoch": 0.91, "learning_rate": 2.7352623659932754e-05, "loss": 2.2402, "step": 146344 }, { "epoch": 0.91, "learning_rate": 2.7348980029590998e-05, "loss": 2.2344, "step": 146352 }, { "epoch": 0.91, "learning_rate": 2.734533721095725e-05, "loss": 2.2154, "step": 146360 }, { "epoch": 0.91, "learning_rate": 2.73416952041221e-05, "loss": 2.2081, "step": 146368 }, { "epoch": 0.91, "learning_rate": 2.7338054009176066e-05, "loss": 2.2405, "step": 146376 }, { "epoch": 0.91, "learning_rate": 2.7334413626209665e-05, "loss": 2.2271, "step": 146384 }, { "epoch": 0.91, "learning_rate": 2.733077405531341e-05, "loss": 2.2213, "step": 146392 }, { "epoch": 0.92, "learning_rate": 2.732713529657779e-05, "loss": 2.2337, "step": 146400 }, { "epoch": 0.92, "learning_rate": 2.7323497350093237e-05, "loss": 2.2213, "step": 146408 }, { "epoch": 0.92, "learning_rate": 2.731986021595021e-05, "loss": 2.2085, "step": 146416 }, { "epoch": 0.92, "learning_rate": 2.7316223894239134e-05, "loss": 2.2161, "step": 146424 }, { "epoch": 0.92, "learning_rate": 2.7312588385050387e-05, "loss": 2.2242, "step": 146432 }, { "epoch": 0.92, "learning_rate": 2.730895368847437e-05, "loss": 2.2289, "step": 146440 }, { "epoch": 0.92, "learning_rate": 2.7305319804601424e-05, "loss": 2.2137, "step": 146448 }, { "epoch": 0.92, "learning_rate": 2.730168673352189e-05, "loss": 2.2095, "step": 146456 }, { "epoch": 0.92, "learning_rate": 2.7298054475326107e-05, "loss": 2.214, "step": 146464 }, { "epoch": 0.92, "learning_rate": 2.729442303010436e-05, "loss": 2.2222, "step": 146472 }, { "epoch": 0.92, "learning_rate": 2.729079239794691e-05, "loss": 2.2378, "step": 146480 }, { "epoch": 0.92, "learning_rate": 2.7287162578944043e-05, "loss": 2.223, "step": 146488 }, { "epoch": 0.92, "learning_rate": 2.7283533573185977e-05, "loss": 2.209, "step": 146496 }, { "epoch": 0.92, "learning_rate": 2.7279905380762953e-05, "loss": 2.2268, "step": 146504 }, { "epoch": 0.92, "learning_rate": 2.7276278001765134e-05, "loss": 2.2205, "step": 146512 }, { "epoch": 0.92, "learning_rate": 2.7272651436282714e-05, "loss": 2.2053, "step": 146520 }, { "epoch": 0.92, "learning_rate": 2.726902568440588e-05, "loss": 2.2086, "step": 146528 }, { "epoch": 0.92, "learning_rate": 2.7265400746224705e-05, "loss": 2.2233, "step": 146536 }, { "epoch": 0.92, "learning_rate": 2.7261776621829348e-05, "loss": 2.2247, "step": 146544 }, { "epoch": 0.92, "learning_rate": 2.7258153311309918e-05, "loss": 2.2476, "step": 146552 }, { "epoch": 0.92, "learning_rate": 2.7254530814756452e-05, "loss": 2.207, "step": 146560 }, { "epoch": 0.92, "learning_rate": 2.725090913225903e-05, "loss": 2.2034, "step": 146568 }, { "epoch": 0.92, "learning_rate": 2.7247288263907677e-05, "loss": 2.2278, "step": 146576 }, { "epoch": 0.92, "learning_rate": 2.7243668209792416e-05, "loss": 2.2295, "step": 146584 }, { "epoch": 0.92, "learning_rate": 2.724004897000324e-05, "loss": 2.2248, "step": 146592 }, { "epoch": 0.92, "learning_rate": 2.7236430544630114e-05, "loss": 2.2206, "step": 146600 }, { "epoch": 0.92, "learning_rate": 2.7232812933763006e-05, "loss": 2.2106, "step": 146608 }, { "epoch": 0.92, "learning_rate": 2.722919613749185e-05, "loss": 2.2152, "step": 146616 }, { "epoch": 0.92, "learning_rate": 2.722558015590655e-05, "loss": 2.2175, "step": 146624 }, { "epoch": 0.92, "learning_rate": 2.7221964989097004e-05, "loss": 2.2177, "step": 146632 }, { "epoch": 0.92, "learning_rate": 2.721835063715309e-05, "loss": 2.2157, "step": 146640 }, { "epoch": 0.92, "learning_rate": 2.7214737100164645e-05, "loss": 2.2175, "step": 146648 }, { "epoch": 0.92, "learning_rate": 2.7211124378221533e-05, "loss": 2.209, "step": 146656 }, { "epoch": 0.92, "learning_rate": 2.7207512471413533e-05, "loss": 2.2198, "step": 146664 }, { "epoch": 0.92, "learning_rate": 2.7203901379830453e-05, "loss": 2.214, "step": 146672 }, { "epoch": 0.92, "learning_rate": 2.720029110356207e-05, "loss": 2.2309, "step": 146680 }, { "epoch": 0.92, "learning_rate": 2.719668164269813e-05, "loss": 2.2063, "step": 146688 }, { "epoch": 0.92, "learning_rate": 2.719307299732836e-05, "loss": 2.2335, "step": 146696 }, { "epoch": 0.92, "learning_rate": 2.7189465167542482e-05, "loss": 2.2124, "step": 146704 }, { "epoch": 0.92, "learning_rate": 2.718585815343017e-05, "loss": 2.2242, "step": 146712 }, { "epoch": 0.92, "learning_rate": 2.718225195508113e-05, "loss": 2.2318, "step": 146720 }, { "epoch": 0.92, "learning_rate": 2.7178646572584965e-05, "loss": 2.2176, "step": 146728 }, { "epoch": 0.92, "learning_rate": 2.717504200603133e-05, "loss": 2.2259, "step": 146736 }, { "epoch": 0.92, "learning_rate": 2.7171438255509856e-05, "loss": 2.2071, "step": 146744 }, { "epoch": 0.92, "learning_rate": 2.7167835321110092e-05, "loss": 2.2342, "step": 146752 }, { "epoch": 0.92, "learning_rate": 2.716423320292162e-05, "loss": 2.2144, "step": 146760 }, { "epoch": 0.92, "learning_rate": 2.716063190103402e-05, "loss": 2.2354, "step": 146768 }, { "epoch": 0.92, "learning_rate": 2.7157031415536765e-05, "loss": 2.2267, "step": 146776 }, { "epoch": 0.92, "learning_rate": 2.7153431746519408e-05, "loss": 2.2229, "step": 146784 }, { "epoch": 0.92, "learning_rate": 2.714983289407142e-05, "loss": 2.2415, "step": 146792 }, { "epoch": 0.92, "learning_rate": 2.7146234858282277e-05, "loss": 2.2145, "step": 146800 }, { "epoch": 0.92, "learning_rate": 2.7142637639241425e-05, "loss": 2.2136, "step": 146808 }, { "epoch": 0.92, "learning_rate": 2.7139041237038275e-05, "loss": 2.221, "step": 146816 }, { "epoch": 0.92, "learning_rate": 2.7135445651762255e-05, "loss": 2.2087, "step": 146824 }, { "epoch": 0.92, "learning_rate": 2.713185088350274e-05, "loss": 2.2119, "step": 146832 }, { "epoch": 0.92, "learning_rate": 2.71282569323491e-05, "loss": 2.2158, "step": 146840 }, { "epoch": 0.92, "learning_rate": 2.7124663798390688e-05, "loss": 2.2249, "step": 146848 }, { "epoch": 0.92, "learning_rate": 2.7121071481716813e-05, "loss": 2.2473, "step": 146856 }, { "epoch": 0.92, "learning_rate": 2.7117479982416793e-05, "loss": 2.2138, "step": 146864 }, { "epoch": 0.92, "learning_rate": 2.7113889300579915e-05, "loss": 2.2246, "step": 146872 }, { "epoch": 0.92, "learning_rate": 2.711029943629544e-05, "loss": 2.2153, "step": 146880 }, { "epoch": 0.92, "learning_rate": 2.7106710389652594e-05, "loss": 2.2168, "step": 146888 }, { "epoch": 0.92, "learning_rate": 2.7103122160740634e-05, "loss": 2.2233, "step": 146896 }, { "epoch": 0.92, "learning_rate": 2.7099534749648746e-05, "loss": 2.239, "step": 146904 }, { "epoch": 0.92, "learning_rate": 2.7095948156466105e-05, "loss": 2.2125, "step": 146912 }, { "epoch": 0.92, "learning_rate": 2.70923623812819e-05, "loss": 2.2219, "step": 146920 }, { "epoch": 0.92, "learning_rate": 2.7088777424185248e-05, "loss": 2.2099, "step": 146928 }, { "epoch": 0.92, "learning_rate": 2.7085193285265298e-05, "loss": 2.2139, "step": 146936 }, { "epoch": 0.92, "learning_rate": 2.7081609964611108e-05, "loss": 2.2315, "step": 146944 }, { "epoch": 0.92, "learning_rate": 2.7078027462311807e-05, "loss": 2.2306, "step": 146952 }, { "epoch": 0.92, "learning_rate": 2.707444577845644e-05, "loss": 2.2148, "step": 146960 }, { "epoch": 0.92, "learning_rate": 2.7070864913134037e-05, "loss": 2.2317, "step": 146968 }, { "epoch": 0.92, "learning_rate": 2.7067284866433627e-05, "loss": 2.2429, "step": 146976 }, { "epoch": 0.92, "learning_rate": 2.7063705638444213e-05, "loss": 2.2289, "step": 146984 }, { "epoch": 0.92, "learning_rate": 2.7060127229254765e-05, "loss": 2.2175, "step": 146992 }, { "epoch": 0.92, "learning_rate": 2.705654963895426e-05, "loss": 2.2305, "step": 147000 }, { "epoch": 0.92, "learning_rate": 2.7052972867631616e-05, "loss": 2.21, "step": 147008 }, { "epoch": 0.92, "learning_rate": 2.7049396915375775e-05, "loss": 2.2046, "step": 147016 }, { "epoch": 0.92, "learning_rate": 2.7045821782275617e-05, "loss": 2.2417, "step": 147024 }, { "epoch": 0.92, "learning_rate": 2.7042247468420023e-05, "loss": 2.2248, "step": 147032 }, { "epoch": 0.92, "learning_rate": 2.703867397389786e-05, "loss": 2.2212, "step": 147040 }, { "epoch": 0.92, "learning_rate": 2.7035101298797964e-05, "loss": 2.2166, "step": 147048 }, { "epoch": 0.92, "learning_rate": 2.7031529443209142e-05, "loss": 2.2227, "step": 147056 }, { "epoch": 0.92, "learning_rate": 2.70279584072202e-05, "loss": 2.1995, "step": 147064 }, { "epoch": 0.92, "learning_rate": 2.7024388190919914e-05, "loss": 2.2211, "step": 147072 }, { "epoch": 0.92, "learning_rate": 2.7020818794397022e-05, "loss": 2.2317, "step": 147080 }, { "epoch": 0.92, "learning_rate": 2.701725021774029e-05, "loss": 2.2267, "step": 147088 }, { "epoch": 0.92, "learning_rate": 2.7013682461038427e-05, "loss": 2.2147, "step": 147096 }, { "epoch": 0.92, "learning_rate": 2.70101155243801e-05, "loss": 2.2179, "step": 147104 }, { "epoch": 0.92, "learning_rate": 2.7006549407854008e-05, "loss": 2.2276, "step": 147112 }, { "epoch": 0.92, "learning_rate": 2.7002984111548806e-05, "loss": 2.2143, "step": 147120 }, { "epoch": 0.92, "learning_rate": 2.699941963555311e-05, "loss": 2.2236, "step": 147128 }, { "epoch": 0.92, "learning_rate": 2.6995855979955555e-05, "loss": 2.2424, "step": 147136 }, { "epoch": 0.92, "learning_rate": 2.699229314484471e-05, "loss": 2.2099, "step": 147144 }, { "epoch": 0.92, "learning_rate": 2.6988731130309184e-05, "loss": 2.2235, "step": 147152 }, { "epoch": 0.92, "learning_rate": 2.6985169936437487e-05, "loss": 2.2189, "step": 147160 }, { "epoch": 0.92, "learning_rate": 2.6981609563318168e-05, "loss": 2.243, "step": 147168 }, { "epoch": 0.92, "learning_rate": 2.6978050011039758e-05, "loss": 2.2292, "step": 147176 }, { "epoch": 0.92, "learning_rate": 2.6974491279690712e-05, "loss": 2.2149, "step": 147184 }, { "epoch": 0.92, "learning_rate": 2.6970933369359525e-05, "loss": 2.224, "step": 147192 }, { "epoch": 0.92, "learning_rate": 2.696737628013464e-05, "loss": 2.2149, "step": 147200 }, { "epoch": 0.92, "learning_rate": 2.6963820012104486e-05, "loss": 2.2377, "step": 147208 }, { "epoch": 0.92, "learning_rate": 2.6960264565357475e-05, "loss": 2.2164, "step": 147216 }, { "epoch": 0.92, "learning_rate": 2.6956709939981983e-05, "loss": 2.2225, "step": 147224 }, { "epoch": 0.92, "learning_rate": 2.6953156136066405e-05, "loss": 2.2243, "step": 147232 }, { "epoch": 0.92, "learning_rate": 2.6949603153699067e-05, "loss": 2.2139, "step": 147240 }, { "epoch": 0.92, "learning_rate": 2.6946050992968297e-05, "loss": 2.2182, "step": 147248 }, { "epoch": 0.92, "learning_rate": 2.6942499653962418e-05, "loss": 2.2411, "step": 147256 }, { "epoch": 0.92, "learning_rate": 2.6938949136769703e-05, "loss": 2.2102, "step": 147264 }, { "epoch": 0.92, "learning_rate": 2.6935399441478414e-05, "loss": 2.2246, "step": 147272 }, { "epoch": 0.92, "learning_rate": 2.6931850568176815e-05, "loss": 2.2127, "step": 147280 }, { "epoch": 0.92, "learning_rate": 2.6928302516953118e-05, "loss": 2.2331, "step": 147288 }, { "epoch": 0.92, "learning_rate": 2.6924755287895525e-05, "loss": 2.2351, "step": 147296 }, { "epoch": 0.92, "learning_rate": 2.6921208881092234e-05, "loss": 2.2346, "step": 147304 }, { "epoch": 0.92, "learning_rate": 2.6917663296631406e-05, "loss": 2.2189, "step": 147312 }, { "epoch": 0.92, "learning_rate": 2.6914118534601168e-05, "loss": 2.2111, "step": 147320 }, { "epoch": 0.92, "learning_rate": 2.691057459508966e-05, "loss": 2.2195, "step": 147328 }, { "epoch": 0.92, "learning_rate": 2.6907031478184986e-05, "loss": 2.2132, "step": 147336 }, { "epoch": 0.92, "learning_rate": 2.690348918397522e-05, "loss": 2.2127, "step": 147344 }, { "epoch": 0.92, "learning_rate": 2.6899947712548423e-05, "loss": 2.2208, "step": 147352 }, { "epoch": 0.92, "learning_rate": 2.6896407063992636e-05, "loss": 2.2245, "step": 147360 }, { "epoch": 0.92, "learning_rate": 2.6892867238395896e-05, "loss": 2.2231, "step": 147368 }, { "epoch": 0.92, "learning_rate": 2.6889328235846177e-05, "loss": 2.2092, "step": 147376 }, { "epoch": 0.92, "learning_rate": 2.688579005643147e-05, "loss": 2.2249, "step": 147384 }, { "epoch": 0.92, "learning_rate": 2.6882252700239763e-05, "loss": 2.2201, "step": 147392 }, { "epoch": 0.92, "learning_rate": 2.6878716167358946e-05, "loss": 2.2104, "step": 147400 }, { "epoch": 0.92, "learning_rate": 2.687518045787697e-05, "loss": 2.2267, "step": 147408 }, { "epoch": 0.92, "learning_rate": 2.6871645571881716e-05, "loss": 2.2267, "step": 147416 }, { "epoch": 0.92, "learning_rate": 2.686811150946108e-05, "loss": 2.2202, "step": 147424 }, { "epoch": 0.92, "learning_rate": 2.686457827070291e-05, "loss": 2.2255, "step": 147432 }, { "epoch": 0.92, "learning_rate": 2.6861045855695034e-05, "loss": 2.2155, "step": 147440 }, { "epoch": 0.92, "learning_rate": 2.685751426452528e-05, "loss": 2.2238, "step": 147448 }, { "epoch": 0.92, "learning_rate": 2.6853983497281443e-05, "loss": 2.2179, "step": 147456 }, { "epoch": 0.92, "learning_rate": 2.6850453554051286e-05, "loss": 2.2303, "step": 147464 }, { "epoch": 0.92, "learning_rate": 2.6846924434922583e-05, "loss": 2.2303, "step": 147472 }, { "epoch": 0.92, "learning_rate": 2.6843396139983057e-05, "loss": 2.2341, "step": 147480 }, { "epoch": 0.92, "learning_rate": 2.6839868669320417e-05, "loss": 2.2397, "step": 147488 }, { "epoch": 0.92, "learning_rate": 2.6836342023022366e-05, "loss": 2.2157, "step": 147496 }, { "epoch": 0.92, "learning_rate": 2.6832816201176575e-05, "loss": 2.2214, "step": 147504 }, { "epoch": 0.92, "learning_rate": 2.682929120387069e-05, "loss": 2.2341, "step": 147512 }, { "epoch": 0.92, "learning_rate": 2.682576703119235e-05, "loss": 2.2137, "step": 147520 }, { "epoch": 0.92, "learning_rate": 2.6822243683229165e-05, "loss": 2.2261, "step": 147528 }, { "epoch": 0.92, "learning_rate": 2.6818721160068717e-05, "loss": 2.2151, "step": 147536 }, { "epoch": 0.92, "learning_rate": 2.6815199461798596e-05, "loss": 2.2137, "step": 147544 }, { "epoch": 0.92, "learning_rate": 2.6811678588506328e-05, "loss": 2.2355, "step": 147552 }, { "epoch": 0.92, "learning_rate": 2.680815854027947e-05, "loss": 2.227, "step": 147560 }, { "epoch": 0.92, "learning_rate": 2.6804639317205495e-05, "loss": 2.2329, "step": 147568 }, { "epoch": 0.92, "learning_rate": 2.680112091937192e-05, "loss": 2.229, "step": 147576 }, { "epoch": 0.92, "learning_rate": 2.6797603346866213e-05, "loss": 2.2239, "step": 147584 }, { "epoch": 0.92, "learning_rate": 2.6794086599775797e-05, "loss": 2.208, "step": 147592 }, { "epoch": 0.92, "learning_rate": 2.679057067818811e-05, "loss": 2.2414, "step": 147600 }, { "epoch": 0.92, "learning_rate": 2.678705558219059e-05, "loss": 2.2283, "step": 147608 }, { "epoch": 0.92, "learning_rate": 2.678354131187057e-05, "loss": 2.2205, "step": 147616 }, { "epoch": 0.92, "learning_rate": 2.6780027867315444e-05, "loss": 2.228, "step": 147624 }, { "epoch": 0.92, "learning_rate": 2.6776515248612554e-05, "loss": 2.2033, "step": 147632 }, { "epoch": 0.92, "learning_rate": 2.6773003455849223e-05, "loss": 2.2161, "step": 147640 }, { "epoch": 0.92, "learning_rate": 2.6769492489112758e-05, "loss": 2.2373, "step": 147648 }, { "epoch": 0.92, "learning_rate": 2.6765982348490427e-05, "loss": 2.2213, "step": 147656 }, { "epoch": 0.92, "learning_rate": 2.6762473034069515e-05, "loss": 2.2215, "step": 147664 }, { "epoch": 0.92, "learning_rate": 2.6758964545937248e-05, "loss": 2.2208, "step": 147672 }, { "epoch": 0.92, "learning_rate": 2.6755456884180846e-05, "loss": 2.2177, "step": 147680 }, { "epoch": 0.92, "learning_rate": 2.675195004888753e-05, "loss": 2.2258, "step": 147688 }, { "epoch": 0.92, "learning_rate": 2.674844404014446e-05, "loss": 2.2347, "step": 147696 }, { "epoch": 0.92, "learning_rate": 2.674493885803879e-05, "loss": 2.2162, "step": 147704 }, { "epoch": 0.92, "learning_rate": 2.6741434502657693e-05, "loss": 2.2322, "step": 147712 }, { "epoch": 0.92, "learning_rate": 2.6737930974088254e-05, "loss": 2.2213, "step": 147720 }, { "epoch": 0.92, "learning_rate": 2.6734428272417572e-05, "loss": 2.2242, "step": 147728 }, { "epoch": 0.92, "learning_rate": 2.6730926397732753e-05, "loss": 2.2407, "step": 147736 }, { "epoch": 0.92, "learning_rate": 2.6727425350120834e-05, "loss": 2.2248, "step": 147744 }, { "epoch": 0.92, "learning_rate": 2.6723925129668844e-05, "loss": 2.2462, "step": 147752 }, { "epoch": 0.92, "learning_rate": 2.6720425736463815e-05, "loss": 2.231, "step": 147760 }, { "epoch": 0.92, "learning_rate": 2.6716927170592733e-05, "loss": 2.2268, "step": 147768 }, { "epoch": 0.92, "learning_rate": 2.671342943214259e-05, "loss": 2.1959, "step": 147776 }, { "epoch": 0.92, "learning_rate": 2.670993252120031e-05, "loss": 2.2202, "step": 147784 }, { "epoch": 0.92, "learning_rate": 2.670643643785284e-05, "loss": 2.2096, "step": 147792 }, { "epoch": 0.92, "learning_rate": 2.6702941182187114e-05, "loss": 2.2203, "step": 147800 }, { "epoch": 0.92, "learning_rate": 2.669944675428999e-05, "loss": 2.2047, "step": 147808 }, { "epoch": 0.92, "learning_rate": 2.6695953154248353e-05, "loss": 2.2169, "step": 147816 }, { "epoch": 0.92, "learning_rate": 2.6692460382149075e-05, "loss": 2.2421, "step": 147824 }, { "epoch": 0.92, "learning_rate": 2.6688968438078953e-05, "loss": 2.1969, "step": 147832 }, { "epoch": 0.92, "learning_rate": 2.6685477322124825e-05, "loss": 2.2235, "step": 147840 }, { "epoch": 0.92, "learning_rate": 2.668198703437346e-05, "loss": 2.2201, "step": 147848 }, { "epoch": 0.92, "learning_rate": 2.6678497574911636e-05, "loss": 2.2339, "step": 147856 }, { "epoch": 0.92, "learning_rate": 2.667500894382611e-05, "loss": 2.2172, "step": 147864 }, { "epoch": 0.92, "learning_rate": 2.667152114120359e-05, "loss": 2.2296, "step": 147872 }, { "epoch": 0.92, "learning_rate": 2.6668034167130794e-05, "loss": 2.2291, "step": 147880 }, { "epoch": 0.92, "learning_rate": 2.6664548021694418e-05, "loss": 2.2215, "step": 147888 }, { "epoch": 0.92, "learning_rate": 2.6661062704981105e-05, "loss": 2.2122, "step": 147896 }, { "epoch": 0.92, "learning_rate": 2.6657578217077523e-05, "loss": 2.2318, "step": 147904 }, { "epoch": 0.92, "learning_rate": 2.6654094558070286e-05, "loss": 2.2093, "step": 147912 }, { "epoch": 0.92, "learning_rate": 2.6650611728045993e-05, "loss": 2.2354, "step": 147920 }, { "epoch": 0.92, "learning_rate": 2.6647129727091246e-05, "loss": 2.2268, "step": 147928 }, { "epoch": 0.92, "learning_rate": 2.6643648555292593e-05, "loss": 2.2308, "step": 147936 }, { "epoch": 0.92, "learning_rate": 2.6640168212736572e-05, "loss": 2.224, "step": 147944 }, { "epoch": 0.92, "learning_rate": 2.663668869950972e-05, "loss": 2.2302, "step": 147952 }, { "epoch": 0.92, "learning_rate": 2.6633210015698528e-05, "loss": 2.2111, "step": 147960 }, { "epoch": 0.92, "learning_rate": 2.662973216138947e-05, "loss": 2.2175, "step": 147968 }, { "epoch": 0.92, "learning_rate": 2.662625513666903e-05, "loss": 2.2446, "step": 147976 }, { "epoch": 0.92, "learning_rate": 2.6622778941623615e-05, "loss": 2.2235, "step": 147984 }, { "epoch": 0.92, "learning_rate": 2.6619303576339682e-05, "loss": 2.2134, "step": 147992 }, { "epoch": 0.93, "learning_rate": 2.661582904090359e-05, "loss": 2.2253, "step": 148000 }, { "epoch": 0.93, "learning_rate": 2.661235533540173e-05, "loss": 2.2265, "step": 148008 }, { "epoch": 0.93, "learning_rate": 2.6608882459920482e-05, "loss": 2.2337, "step": 148016 }, { "epoch": 0.93, "learning_rate": 2.6605410414546146e-05, "loss": 2.1978, "step": 148024 }, { "epoch": 0.93, "learning_rate": 2.6601939199365068e-05, "loss": 2.2044, "step": 148032 }, { "epoch": 0.93, "learning_rate": 2.6598468814463516e-05, "loss": 2.2166, "step": 148040 }, { "epoch": 0.93, "learning_rate": 2.6594999259927777e-05, "loss": 2.2185, "step": 148048 }, { "epoch": 0.93, "learning_rate": 2.659153053584411e-05, "loss": 2.2293, "step": 148056 }, { "epoch": 0.93, "learning_rate": 2.6588062642298738e-05, "loss": 2.2307, "step": 148064 }, { "epoch": 0.93, "learning_rate": 2.658459557937788e-05, "loss": 2.2214, "step": 148072 }, { "epoch": 0.93, "learning_rate": 2.6581129347167727e-05, "loss": 2.221, "step": 148080 }, { "epoch": 0.93, "learning_rate": 2.6577663945754437e-05, "loss": 2.2186, "step": 148088 }, { "epoch": 0.93, "learning_rate": 2.6574199375224185e-05, "loss": 2.2062, "step": 148096 }, { "epoch": 0.93, "learning_rate": 2.6570735635663084e-05, "loss": 2.2357, "step": 148104 }, { "epoch": 0.93, "learning_rate": 2.656727272715724e-05, "loss": 2.2093, "step": 148112 }, { "epoch": 0.93, "learning_rate": 2.6563810649792752e-05, "loss": 2.2058, "step": 148120 }, { "epoch": 0.93, "learning_rate": 2.6560349403655683e-05, "loss": 2.2334, "step": 148128 }, { "epoch": 0.93, "learning_rate": 2.6556888988832074e-05, "loss": 2.2101, "step": 148136 }, { "epoch": 0.93, "learning_rate": 2.6553429405407965e-05, "loss": 2.2258, "step": 148144 }, { "epoch": 0.93, "learning_rate": 2.6549970653469354e-05, "loss": 2.2218, "step": 148152 }, { "epoch": 0.93, "learning_rate": 2.6546512733102215e-05, "loss": 2.2139, "step": 148160 }, { "epoch": 0.93, "learning_rate": 2.654305564439253e-05, "loss": 2.2227, "step": 148168 }, { "epoch": 0.93, "learning_rate": 2.653959938742624e-05, "loss": 2.2119, "step": 148176 }, { "epoch": 0.93, "learning_rate": 2.6536143962289255e-05, "loss": 2.2266, "step": 148184 }, { "epoch": 0.93, "learning_rate": 2.6532689369067486e-05, "loss": 2.2209, "step": 148192 }, { "epoch": 0.93, "learning_rate": 2.6529235607846814e-05, "loss": 2.2226, "step": 148200 }, { "epoch": 0.93, "learning_rate": 2.652578267871311e-05, "loss": 2.221, "step": 148208 }, { "epoch": 0.93, "learning_rate": 2.6522330581752197e-05, "loss": 2.2333, "step": 148216 }, { "epoch": 0.93, "learning_rate": 2.6518879317049894e-05, "loss": 2.23, "step": 148224 }, { "epoch": 0.93, "learning_rate": 2.651542888469203e-05, "loss": 2.2136, "step": 148232 }, { "epoch": 0.93, "learning_rate": 2.6511979284764337e-05, "loss": 2.2135, "step": 148240 }, { "epoch": 0.93, "learning_rate": 2.650853051735261e-05, "loss": 2.234, "step": 148248 }, { "epoch": 0.93, "learning_rate": 2.650508258254256e-05, "loss": 2.2287, "step": 148256 }, { "epoch": 0.93, "learning_rate": 2.650163548041993e-05, "loss": 2.2358, "step": 148264 }, { "epoch": 0.93, "learning_rate": 2.649818921107039e-05, "loss": 2.2141, "step": 148272 }, { "epoch": 0.93, "learning_rate": 2.649474377457963e-05, "loss": 2.2188, "step": 148280 }, { "epoch": 0.93, "learning_rate": 2.6491299171033295e-05, "loss": 2.2019, "step": 148288 }, { "epoch": 0.93, "learning_rate": 2.648785540051703e-05, "loss": 2.2262, "step": 148296 }, { "epoch": 0.93, "learning_rate": 2.6484412463116426e-05, "loss": 2.2297, "step": 148304 }, { "epoch": 0.93, "learning_rate": 2.64809703589171e-05, "loss": 2.217, "step": 148312 }, { "epoch": 0.93, "learning_rate": 2.647752908800461e-05, "loss": 2.2226, "step": 148320 }, { "epoch": 0.93, "learning_rate": 2.64740886504645e-05, "loss": 2.2117, "step": 148328 }, { "epoch": 0.93, "learning_rate": 2.6470649046382322e-05, "loss": 2.2153, "step": 148336 }, { "epoch": 0.93, "learning_rate": 2.6467210275843564e-05, "loss": 2.2243, "step": 148344 }, { "epoch": 0.93, "learning_rate": 2.646377233893371e-05, "loss": 2.2125, "step": 148352 }, { "epoch": 0.93, "learning_rate": 2.6460335235738255e-05, "loss": 2.2088, "step": 148360 }, { "epoch": 0.93, "learning_rate": 2.6456898966342625e-05, "loss": 2.2192, "step": 148368 }, { "epoch": 0.93, "learning_rate": 2.6453463530832247e-05, "loss": 2.2168, "step": 148376 }, { "epoch": 0.93, "learning_rate": 2.6450028929292524e-05, "loss": 2.2125, "step": 148384 }, { "epoch": 0.93, "learning_rate": 2.6446595161808858e-05, "loss": 2.2223, "step": 148392 }, { "epoch": 0.93, "learning_rate": 2.64431622284666e-05, "loss": 2.2228, "step": 148400 }, { "epoch": 0.93, "learning_rate": 2.643973012935108e-05, "loss": 2.219, "step": 148408 }, { "epoch": 0.93, "learning_rate": 2.6436298864547638e-05, "loss": 2.2159, "step": 148416 }, { "epoch": 0.93, "learning_rate": 2.643286843414159e-05, "loss": 2.2293, "step": 148424 }, { "epoch": 0.93, "learning_rate": 2.642943883821818e-05, "loss": 2.2409, "step": 148432 }, { "epoch": 0.93, "learning_rate": 2.6426010076862685e-05, "loss": 2.217, "step": 148440 }, { "epoch": 0.93, "learning_rate": 2.642258215016037e-05, "loss": 2.2205, "step": 148448 }, { "epoch": 0.93, "learning_rate": 2.641915505819641e-05, "loss": 2.2084, "step": 148456 }, { "epoch": 0.93, "learning_rate": 2.6415728801056028e-05, "loss": 2.2262, "step": 148464 }, { "epoch": 0.93, "learning_rate": 2.641230337882439e-05, "loss": 2.2187, "step": 148472 }, { "epoch": 0.93, "learning_rate": 2.6408878791586666e-05, "loss": 2.2158, "step": 148480 }, { "epoch": 0.93, "learning_rate": 2.6405455039427984e-05, "loss": 2.2156, "step": 148488 }, { "epoch": 0.93, "learning_rate": 2.6402032122433452e-05, "loss": 2.2226, "step": 148496 }, { "epoch": 0.93, "learning_rate": 2.6398610040688175e-05, "loss": 2.2284, "step": 148504 }, { "epoch": 0.93, "learning_rate": 2.6395188794277226e-05, "loss": 2.2236, "step": 148512 }, { "epoch": 0.93, "learning_rate": 2.6391768383285647e-05, "loss": 2.2088, "step": 148520 }, { "epoch": 0.93, "learning_rate": 2.6388348807798487e-05, "loss": 2.2229, "step": 148528 }, { "epoch": 0.93, "learning_rate": 2.6384930067900744e-05, "loss": 2.2213, "step": 148536 }, { "epoch": 0.93, "learning_rate": 2.6381512163677402e-05, "loss": 2.2078, "step": 148544 }, { "epoch": 0.93, "learning_rate": 2.637809509521345e-05, "loss": 2.2167, "step": 148552 }, { "epoch": 0.93, "learning_rate": 2.637467886259382e-05, "loss": 2.2122, "step": 148560 }, { "epoch": 0.93, "learning_rate": 2.6371263465903444e-05, "loss": 2.2279, "step": 148568 }, { "epoch": 0.93, "learning_rate": 2.6367848905227238e-05, "loss": 2.2288, "step": 148576 }, { "epoch": 0.93, "learning_rate": 2.636443518065008e-05, "loss": 2.2245, "step": 148584 }, { "epoch": 0.93, "learning_rate": 2.636102229225683e-05, "loss": 2.2319, "step": 148592 }, { "epoch": 0.93, "learning_rate": 2.6357610240132354e-05, "loss": 2.2282, "step": 148600 }, { "epoch": 0.93, "learning_rate": 2.6354199024361447e-05, "loss": 2.2157, "step": 148608 }, { "epoch": 0.93, "learning_rate": 2.6350788645028944e-05, "loss": 2.2247, "step": 148616 }, { "epoch": 0.93, "learning_rate": 2.6347379102219598e-05, "loss": 2.2324, "step": 148624 }, { "epoch": 0.93, "learning_rate": 2.634397039601818e-05, "loss": 2.2344, "step": 148632 }, { "epoch": 0.93, "learning_rate": 2.634056252650945e-05, "loss": 2.2242, "step": 148640 }, { "epoch": 0.93, "learning_rate": 2.63371554937781e-05, "loss": 2.2245, "step": 148648 }, { "epoch": 0.93, "learning_rate": 2.633374929790884e-05, "loss": 2.2311, "step": 148656 }, { "epoch": 0.93, "learning_rate": 2.633034393898636e-05, "loss": 2.2174, "step": 148664 }, { "epoch": 0.93, "learning_rate": 2.6326939417095297e-05, "loss": 2.2215, "step": 148672 }, { "epoch": 0.93, "learning_rate": 2.6323535732320304e-05, "loss": 2.2342, "step": 148680 }, { "epoch": 0.93, "learning_rate": 2.6320132884745985e-05, "loss": 2.232, "step": 148688 }, { "epoch": 0.93, "learning_rate": 2.6316730874456947e-05, "loss": 2.2127, "step": 148696 }, { "epoch": 0.93, "learning_rate": 2.631332970153776e-05, "loss": 2.2246, "step": 148704 }, { "epoch": 0.93, "learning_rate": 2.6309929366072972e-05, "loss": 2.2218, "step": 148712 }, { "epoch": 0.93, "learning_rate": 2.6306529868147123e-05, "loss": 2.22, "step": 148720 }, { "epoch": 0.93, "learning_rate": 2.630313120784472e-05, "loss": 2.2174, "step": 148728 }, { "epoch": 0.93, "learning_rate": 2.6299733385250248e-05, "loss": 2.2266, "step": 148736 }, { "epoch": 0.93, "learning_rate": 2.6296336400448195e-05, "loss": 2.2172, "step": 148744 }, { "epoch": 0.93, "learning_rate": 2.6292940253523002e-05, "loss": 2.2245, "step": 148752 }, { "epoch": 0.93, "learning_rate": 2.6289544944559084e-05, "loss": 2.2178, "step": 148760 }, { "epoch": 0.93, "learning_rate": 2.628615047364088e-05, "loss": 2.2302, "step": 148768 }, { "epoch": 0.93, "learning_rate": 2.6282756840852752e-05, "loss": 2.2271, "step": 148776 }, { "epoch": 0.93, "learning_rate": 2.627936404627906e-05, "loss": 2.2195, "step": 148784 }, { "epoch": 0.93, "learning_rate": 2.627597209000417e-05, "loss": 2.2162, "step": 148792 }, { "epoch": 0.93, "learning_rate": 2.6272580972112404e-05, "loss": 2.2207, "step": 148800 }, { "epoch": 0.93, "learning_rate": 2.626919069268804e-05, "loss": 2.2188, "step": 148808 }, { "epoch": 0.93, "learning_rate": 2.6265801251815392e-05, "loss": 2.2082, "step": 148816 }, { "epoch": 0.93, "learning_rate": 2.6262412649578706e-05, "loss": 2.2225, "step": 148824 }, { "epoch": 0.93, "learning_rate": 2.6259024886062243e-05, "loss": 2.2304, "step": 148832 }, { "epoch": 0.93, "learning_rate": 2.625563796135019e-05, "loss": 2.2262, "step": 148840 }, { "epoch": 0.93, "learning_rate": 2.6252251875526758e-05, "loss": 2.2108, "step": 148848 }, { "epoch": 0.93, "learning_rate": 2.6248866628676157e-05, "loss": 2.222, "step": 148856 }, { "epoch": 0.93, "learning_rate": 2.6245482220882495e-05, "loss": 2.2207, "step": 148864 }, { "epoch": 0.93, "learning_rate": 2.624209865222994e-05, "loss": 2.2258, "step": 148872 }, { "epoch": 0.93, "learning_rate": 2.6238715922802604e-05, "loss": 2.2149, "step": 148880 }, { "epoch": 0.93, "learning_rate": 2.6235334032684568e-05, "loss": 2.2272, "step": 148888 }, { "epoch": 0.93, "learning_rate": 2.6231952981959916e-05, "loss": 2.2352, "step": 148896 }, { "epoch": 0.93, "learning_rate": 2.6228572770712705e-05, "loss": 2.2171, "step": 148904 }, { "epoch": 0.93, "learning_rate": 2.6225193399026964e-05, "loss": 2.2227, "step": 148912 }, { "epoch": 0.93, "learning_rate": 2.6221814866986714e-05, "loss": 2.2262, "step": 148920 }, { "epoch": 0.93, "learning_rate": 2.6218437174675918e-05, "loss": 2.2128, "step": 148928 }, { "epoch": 0.93, "learning_rate": 2.621506032217858e-05, "loss": 2.2256, "step": 148936 }, { "epoch": 0.93, "learning_rate": 2.621168430957863e-05, "loss": 2.2257, "step": 148944 }, { "epoch": 0.93, "learning_rate": 2.6208309136959992e-05, "loss": 2.2166, "step": 148952 }, { "epoch": 0.93, "learning_rate": 2.620493480440659e-05, "loss": 2.2331, "step": 148960 }, { "epoch": 0.93, "learning_rate": 2.6201561312002292e-05, "loss": 2.2211, "step": 148968 }, { "epoch": 0.93, "learning_rate": 2.6198188659830968e-05, "loss": 2.2386, "step": 148976 }, { "epoch": 0.93, "learning_rate": 2.6194816847976483e-05, "loss": 2.2155, "step": 148984 }, { "epoch": 0.93, "learning_rate": 2.6191445876522634e-05, "loss": 2.2249, "step": 148992 }, { "epoch": 0.93, "learning_rate": 2.6188075745553232e-05, "loss": 2.2183, "step": 149000 }, { "epoch": 0.93, "learning_rate": 2.6184706455152063e-05, "loss": 2.2122, "step": 149008 }, { "epoch": 0.93, "learning_rate": 2.6181338005402888e-05, "loss": 2.2063, "step": 149016 }, { "epoch": 0.93, "learning_rate": 2.617797039638944e-05, "loss": 2.2211, "step": 149024 }, { "epoch": 0.93, "learning_rate": 2.6174603628195443e-05, "loss": 2.2101, "step": 149032 }, { "epoch": 0.93, "learning_rate": 2.6171237700904594e-05, "loss": 2.2336, "step": 149040 }, { "epoch": 0.93, "learning_rate": 2.6167872614600585e-05, "loss": 2.211, "step": 149048 }, { "epoch": 0.93, "learning_rate": 2.616450836936704e-05, "loss": 2.2246, "step": 149056 }, { "epoch": 0.93, "learning_rate": 2.6161144965287616e-05, "loss": 2.2287, "step": 149064 }, { "epoch": 0.93, "learning_rate": 2.615778240244594e-05, "loss": 2.2224, "step": 149072 }, { "epoch": 0.93, "learning_rate": 2.6154420680925574e-05, "loss": 2.2357, "step": 149080 }, { "epoch": 0.93, "learning_rate": 2.6151059800810118e-05, "loss": 2.2206, "step": 149088 }, { "epoch": 0.93, "learning_rate": 2.6147699762183113e-05, "loss": 2.2339, "step": 149096 }, { "epoch": 0.93, "learning_rate": 2.614434056512808e-05, "loss": 2.2181, "step": 149104 }, { "epoch": 0.93, "learning_rate": 2.614098220972855e-05, "loss": 2.2046, "step": 149112 }, { "epoch": 0.93, "learning_rate": 2.6137624696067987e-05, "loss": 2.2247, "step": 149120 }, { "epoch": 0.93, "learning_rate": 2.6134268024229886e-05, "loss": 2.2185, "step": 149128 }, { "epoch": 0.93, "learning_rate": 2.613091219429768e-05, "loss": 2.2105, "step": 149136 }, { "epoch": 0.93, "learning_rate": 2.6127557206354786e-05, "loss": 2.2188, "step": 149144 }, { "epoch": 0.93, "learning_rate": 2.6124203060484635e-05, "loss": 2.2281, "step": 149152 }, { "epoch": 0.93, "learning_rate": 2.6120849756770592e-05, "loss": 2.227, "step": 149160 }, { "epoch": 0.93, "learning_rate": 2.6117497295296018e-05, "loss": 2.2284, "step": 149168 }, { "epoch": 0.93, "learning_rate": 2.6114145676144275e-05, "loss": 2.2272, "step": 149176 }, { "epoch": 0.93, "learning_rate": 2.6110794899398666e-05, "loss": 2.2286, "step": 149184 }, { "epoch": 0.93, "learning_rate": 2.610744496514249e-05, "loss": 2.2289, "step": 149192 }, { "epoch": 0.93, "learning_rate": 2.610409587345905e-05, "loss": 2.225, "step": 149200 }, { "epoch": 0.93, "learning_rate": 2.6100747624431582e-05, "loss": 2.2178, "step": 149208 }, { "epoch": 0.93, "learning_rate": 2.6097400218143332e-05, "loss": 2.2429, "step": 149216 }, { "epoch": 0.93, "learning_rate": 2.6094053654677514e-05, "loss": 2.2368, "step": 149224 }, { "epoch": 0.93, "learning_rate": 2.609070793411733e-05, "loss": 2.2042, "step": 149232 }, { "epoch": 0.93, "learning_rate": 2.6087363056545954e-05, "loss": 2.2245, "step": 149240 }, { "epoch": 0.93, "learning_rate": 2.608401902204653e-05, "loss": 2.2104, "step": 149248 }, { "epoch": 0.93, "learning_rate": 2.6080675830702193e-05, "loss": 2.2372, "step": 149256 }, { "epoch": 0.93, "learning_rate": 2.6077333482596082e-05, "loss": 2.2223, "step": 149264 }, { "epoch": 0.93, "learning_rate": 2.6073991977811246e-05, "loss": 2.2246, "step": 149272 }, { "epoch": 0.93, "learning_rate": 2.6070651316430784e-05, "loss": 2.2451, "step": 149280 }, { "epoch": 0.93, "learning_rate": 2.6067311498537745e-05, "loss": 2.2363, "step": 149288 }, { "epoch": 0.93, "learning_rate": 2.6063972524215135e-05, "loss": 2.2142, "step": 149296 }, { "epoch": 0.93, "learning_rate": 2.6060634393545984e-05, "loss": 2.2118, "step": 149304 }, { "epoch": 0.93, "learning_rate": 2.6057297106613266e-05, "loss": 2.2217, "step": 149312 }, { "epoch": 0.93, "learning_rate": 2.6053960663499948e-05, "loss": 2.2184, "step": 149320 }, { "epoch": 0.93, "learning_rate": 2.605062506428899e-05, "loss": 2.2133, "step": 149328 }, { "epoch": 0.93, "learning_rate": 2.604729030906328e-05, "loss": 2.2082, "step": 149336 }, { "epoch": 0.93, "learning_rate": 2.604395639790576e-05, "loss": 2.2219, "step": 149344 }, { "epoch": 0.93, "learning_rate": 2.6040623330899295e-05, "loss": 2.2233, "step": 149352 }, { "epoch": 0.93, "learning_rate": 2.603729110812673e-05, "loss": 2.2207, "step": 149360 }, { "epoch": 0.93, "learning_rate": 2.603395972967093e-05, "loss": 2.2165, "step": 149368 }, { "epoch": 0.93, "learning_rate": 2.6030629195614697e-05, "loss": 2.2113, "step": 149376 }, { "epoch": 0.93, "learning_rate": 2.602729950604083e-05, "loss": 2.2195, "step": 149384 }, { "epoch": 0.93, "learning_rate": 2.602397066103212e-05, "loss": 2.2131, "step": 149392 }, { "epoch": 0.93, "learning_rate": 2.6020642660671307e-05, "loss": 2.2259, "step": 149400 }, { "epoch": 0.93, "learning_rate": 2.6017315505041118e-05, "loss": 2.2209, "step": 149408 }, { "epoch": 0.93, "learning_rate": 2.601398919422429e-05, "loss": 2.2252, "step": 149416 }, { "epoch": 0.93, "learning_rate": 2.601066372830351e-05, "loss": 2.209, "step": 149424 }, { "epoch": 0.93, "learning_rate": 2.6007339107361427e-05, "loss": 2.2161, "step": 149432 }, { "epoch": 0.93, "learning_rate": 2.6004015331480718e-05, "loss": 2.201, "step": 149440 }, { "epoch": 0.93, "learning_rate": 2.6000692400743998e-05, "loss": 2.2213, "step": 149448 }, { "epoch": 0.93, "learning_rate": 2.5997370315233893e-05, "loss": 2.2025, "step": 149456 }, { "epoch": 0.93, "learning_rate": 2.5994049075032956e-05, "loss": 2.2012, "step": 149464 }, { "epoch": 0.93, "learning_rate": 2.5990728680223786e-05, "loss": 2.2157, "step": 149472 }, { "epoch": 0.93, "learning_rate": 2.5987409130888924e-05, "loss": 2.2133, "step": 149480 }, { "epoch": 0.93, "learning_rate": 2.5984090427110875e-05, "loss": 2.2296, "step": 149488 }, { "epoch": 0.93, "learning_rate": 2.598077256897215e-05, "loss": 2.2299, "step": 149496 }, { "epoch": 0.93, "learning_rate": 2.5977455556555253e-05, "loss": 2.2261, "step": 149504 }, { "epoch": 0.93, "learning_rate": 2.5974139389942614e-05, "loss": 2.2123, "step": 149512 }, { "epoch": 0.93, "learning_rate": 2.5970824069216694e-05, "loss": 2.2136, "step": 149520 }, { "epoch": 0.93, "learning_rate": 2.59675095944599e-05, "loss": 2.2065, "step": 149528 }, { "epoch": 0.93, "learning_rate": 2.596419596575464e-05, "loss": 2.2184, "step": 149536 }, { "epoch": 0.93, "learning_rate": 2.5960883183183286e-05, "loss": 2.2241, "step": 149544 }, { "epoch": 0.93, "learning_rate": 2.5957571246828187e-05, "loss": 2.226, "step": 149552 }, { "epoch": 0.93, "learning_rate": 2.5954260156771704e-05, "loss": 2.2218, "step": 149560 }, { "epoch": 0.93, "learning_rate": 2.5950949913096123e-05, "loss": 2.1947, "step": 149568 }, { "epoch": 0.93, "learning_rate": 2.594764051588374e-05, "loss": 2.2182, "step": 149576 }, { "epoch": 0.93, "learning_rate": 2.5944331965216852e-05, "loss": 2.2178, "step": 149584 }, { "epoch": 0.93, "learning_rate": 2.5941024261177683e-05, "loss": 2.2311, "step": 149592 }, { "epoch": 0.94, "learning_rate": 2.593771740384847e-05, "loss": 2.2214, "step": 149600 }, { "epoch": 0.94, "learning_rate": 2.593441139331143e-05, "loss": 2.2198, "step": 149608 }, { "epoch": 0.94, "learning_rate": 2.5931106229648744e-05, "loss": 2.2234, "step": 149616 }, { "epoch": 0.94, "learning_rate": 2.5927801912942572e-05, "loss": 2.2051, "step": 149624 }, { "epoch": 0.94, "learning_rate": 2.592449844327507e-05, "loss": 2.2202, "step": 149632 }, { "epoch": 0.94, "learning_rate": 2.5921195820728368e-05, "loss": 2.2086, "step": 149640 }, { "epoch": 0.94, "learning_rate": 2.591789404538455e-05, "loss": 2.2254, "step": 149648 }, { "epoch": 0.94, "learning_rate": 2.5914593117325713e-05, "loss": 2.2106, "step": 149656 }, { "epoch": 0.94, "learning_rate": 2.5911293036633915e-05, "loss": 2.2145, "step": 149664 }, { "epoch": 0.94, "learning_rate": 2.590799380339122e-05, "loss": 2.1994, "step": 149672 }, { "epoch": 0.94, "learning_rate": 2.5904695417679592e-05, "loss": 2.2177, "step": 149680 }, { "epoch": 0.94, "learning_rate": 2.590139787958107e-05, "loss": 2.2168, "step": 149688 }, { "epoch": 0.94, "learning_rate": 2.5898101189177637e-05, "loss": 2.2073, "step": 149696 }, { "epoch": 0.94, "learning_rate": 2.5894805346551216e-05, "loss": 2.2096, "step": 149704 }, { "epoch": 0.94, "learning_rate": 2.5891510351783766e-05, "loss": 2.2434, "step": 149712 }, { "epoch": 0.94, "learning_rate": 2.5888216204957204e-05, "loss": 2.2214, "step": 149720 }, { "epoch": 0.94, "learning_rate": 2.58849229061534e-05, "loss": 2.2246, "step": 149728 }, { "epoch": 0.94, "learning_rate": 2.5881630455454252e-05, "loss": 2.21, "step": 149736 }, { "epoch": 0.94, "learning_rate": 2.587833885294159e-05, "loss": 2.2221, "step": 149744 }, { "epoch": 0.94, "learning_rate": 2.5875048098697258e-05, "loss": 2.2076, "step": 149752 }, { "epoch": 0.94, "learning_rate": 2.5871758192803063e-05, "loss": 2.2357, "step": 149760 }, { "epoch": 0.94, "learning_rate": 2.5868469135340778e-05, "loss": 2.2296, "step": 149768 }, { "epoch": 0.94, "learning_rate": 2.5865180926392185e-05, "loss": 2.2211, "step": 149776 }, { "epoch": 0.94, "learning_rate": 2.586189356603903e-05, "loss": 2.2391, "step": 149784 }, { "epoch": 0.94, "learning_rate": 2.585860705436302e-05, "loss": 2.2065, "step": 149792 }, { "epoch": 0.94, "learning_rate": 2.585532139144588e-05, "loss": 2.2212, "step": 149800 }, { "epoch": 0.94, "learning_rate": 2.5852036577369276e-05, "loss": 2.2191, "step": 149808 }, { "epoch": 0.94, "learning_rate": 2.5848752612214873e-05, "loss": 2.2125, "step": 149816 }, { "epoch": 0.94, "learning_rate": 2.584546949606431e-05, "loss": 2.2225, "step": 149824 }, { "epoch": 0.94, "learning_rate": 2.5842187228999215e-05, "loss": 2.2225, "step": 149832 }, { "epoch": 0.94, "learning_rate": 2.583890581110117e-05, "loss": 2.2133, "step": 149840 }, { "epoch": 0.94, "learning_rate": 2.5835625242451765e-05, "loss": 2.211, "step": 149848 }, { "epoch": 0.94, "learning_rate": 2.5832345523132552e-05, "loss": 2.2039, "step": 149856 }, { "epoch": 0.94, "learning_rate": 2.582906665322505e-05, "loss": 2.2104, "step": 149864 }, { "epoch": 0.94, "learning_rate": 2.58257886328108e-05, "loss": 2.2098, "step": 149872 }, { "epoch": 0.94, "learning_rate": 2.582251146197126e-05, "loss": 2.2069, "step": 149880 }, { "epoch": 0.94, "learning_rate": 2.5819235140787946e-05, "loss": 2.2282, "step": 149888 }, { "epoch": 0.94, "learning_rate": 2.581595966934226e-05, "loss": 2.2082, "step": 149896 }, { "epoch": 0.94, "learning_rate": 2.5812685047715656e-05, "loss": 2.2153, "step": 149904 }, { "epoch": 0.94, "learning_rate": 2.580941127598955e-05, "loss": 2.2053, "step": 149912 }, { "epoch": 0.94, "learning_rate": 2.58061383542453e-05, "loss": 2.2136, "step": 149920 }, { "epoch": 0.94, "learning_rate": 2.5802866282564296e-05, "loss": 2.2136, "step": 149928 }, { "epoch": 0.94, "learning_rate": 2.579959506102787e-05, "loss": 2.2167, "step": 149936 }, { "epoch": 0.94, "learning_rate": 2.5796324689717344e-05, "loss": 2.2044, "step": 149944 }, { "epoch": 0.94, "learning_rate": 2.579305516871403e-05, "loss": 2.2205, "step": 149952 }, { "epoch": 0.94, "learning_rate": 2.57897864980992e-05, "loss": 2.2315, "step": 149960 }, { "epoch": 0.94, "learning_rate": 2.578651867795412e-05, "loss": 2.2019, "step": 149968 }, { "epoch": 0.94, "learning_rate": 2.5783251708360024e-05, "loss": 2.2274, "step": 149976 }, { "epoch": 0.94, "learning_rate": 2.5779985589398115e-05, "loss": 2.2302, "step": 149984 }, { "epoch": 0.94, "learning_rate": 2.5776720321149616e-05, "loss": 2.2125, "step": 149992 }, { "epoch": 0.94, "learning_rate": 2.5773455903695694e-05, "loss": 2.2098, "step": 150000 }, { "epoch": 0.94, "learning_rate": 2.5770192337117488e-05, "loss": 2.2179, "step": 150008 }, { "epoch": 0.94, "learning_rate": 2.576692962149615e-05, "loss": 2.2381, "step": 150016 }, { "epoch": 0.94, "learning_rate": 2.576366775691278e-05, "loss": 2.2242, "step": 150024 }, { "epoch": 0.94, "learning_rate": 2.5760406743448463e-05, "loss": 2.2194, "step": 150032 }, { "epoch": 0.94, "learning_rate": 2.5757146581184288e-05, "loss": 2.2352, "step": 150040 }, { "epoch": 0.94, "learning_rate": 2.575388727020129e-05, "loss": 2.2139, "step": 150048 }, { "epoch": 0.94, "learning_rate": 2.5750628810580478e-05, "loss": 2.2181, "step": 150056 }, { "epoch": 0.94, "learning_rate": 2.574737120240289e-05, "loss": 2.2209, "step": 150064 }, { "epoch": 0.94, "learning_rate": 2.5744114445749508e-05, "loss": 2.2114, "step": 150072 }, { "epoch": 0.94, "learning_rate": 2.5740858540701274e-05, "loss": 2.2212, "step": 150080 }, { "epoch": 0.94, "learning_rate": 2.5737603487339136e-05, "loss": 2.2133, "step": 150088 }, { "epoch": 0.94, "learning_rate": 2.573434928574402e-05, "loss": 2.2351, "step": 150096 }, { "epoch": 0.94, "learning_rate": 2.573109593599684e-05, "loss": 2.2102, "step": 150104 }, { "epoch": 0.94, "learning_rate": 2.5727843438178443e-05, "loss": 2.2254, "step": 150112 }, { "epoch": 0.94, "learning_rate": 2.57245917923697e-05, "loss": 2.2273, "step": 150120 }, { "epoch": 0.94, "learning_rate": 2.5721340998651472e-05, "loss": 2.2219, "step": 150128 }, { "epoch": 0.94, "learning_rate": 2.5718091057104538e-05, "loss": 2.2158, "step": 150136 }, { "epoch": 0.94, "learning_rate": 2.571484196780971e-05, "loss": 2.2284, "step": 150144 }, { "epoch": 0.94, "learning_rate": 2.571159373084775e-05, "loss": 2.2225, "step": 150152 }, { "epoch": 0.94, "learning_rate": 2.5708346346299427e-05, "loss": 2.2308, "step": 150160 }, { "epoch": 0.94, "learning_rate": 2.5705099814245464e-05, "loss": 2.2037, "step": 150168 }, { "epoch": 0.94, "learning_rate": 2.5701854134766557e-05, "loss": 2.2183, "step": 150176 }, { "epoch": 0.94, "learning_rate": 2.569860930794341e-05, "loss": 2.2322, "step": 150184 }, { "epoch": 0.94, "learning_rate": 2.569536533385668e-05, "loss": 2.2199, "step": 150192 }, { "epoch": 0.94, "learning_rate": 2.5692122212587016e-05, "loss": 2.2427, "step": 150200 }, { "epoch": 0.94, "learning_rate": 2.568887994421505e-05, "loss": 2.2266, "step": 150208 }, { "epoch": 0.94, "learning_rate": 2.5685638528821376e-05, "loss": 2.2242, "step": 150216 }, { "epoch": 0.94, "learning_rate": 2.568239796648657e-05, "loss": 2.2183, "step": 150224 }, { "epoch": 0.94, "learning_rate": 2.5679158257291213e-05, "loss": 2.2013, "step": 150232 }, { "epoch": 0.94, "learning_rate": 2.5675919401315833e-05, "loss": 2.1997, "step": 150240 }, { "epoch": 0.94, "learning_rate": 2.5672681398640936e-05, "loss": 2.2176, "step": 150248 }, { "epoch": 0.94, "learning_rate": 2.566944424934704e-05, "loss": 2.2182, "step": 150256 }, { "epoch": 0.94, "learning_rate": 2.5666207953514615e-05, "loss": 2.2087, "step": 150264 }, { "epoch": 0.94, "learning_rate": 2.5662972511224097e-05, "loss": 2.2037, "step": 150272 }, { "epoch": 0.94, "learning_rate": 2.565973792255595e-05, "loss": 2.2236, "step": 150280 }, { "epoch": 0.94, "learning_rate": 2.5656504187590562e-05, "loss": 2.2138, "step": 150288 }, { "epoch": 0.94, "learning_rate": 2.5653271306408346e-05, "loss": 2.2062, "step": 150296 }, { "epoch": 0.94, "learning_rate": 2.5650039279089645e-05, "loss": 2.2238, "step": 150304 }, { "epoch": 0.94, "learning_rate": 2.5646808105714816e-05, "loss": 2.2124, "step": 150312 }, { "epoch": 0.94, "learning_rate": 2.5643577786364216e-05, "loss": 2.2196, "step": 150320 }, { "epoch": 0.94, "learning_rate": 2.5640348321118102e-05, "loss": 2.231, "step": 150328 }, { "epoch": 0.94, "learning_rate": 2.563711971005679e-05, "loss": 2.2215, "step": 150336 }, { "epoch": 0.94, "learning_rate": 2.563389195326056e-05, "loss": 2.2069, "step": 150344 }, { "epoch": 0.94, "learning_rate": 2.56306650508096e-05, "loss": 2.2238, "step": 150352 }, { "epoch": 0.94, "learning_rate": 2.5627439002784182e-05, "loss": 2.2147, "step": 150360 }, { "epoch": 0.94, "learning_rate": 2.5624213809264473e-05, "loss": 2.2085, "step": 150368 }, { "epoch": 0.94, "learning_rate": 2.562098947033068e-05, "loss": 2.202, "step": 150376 }, { "epoch": 0.94, "learning_rate": 2.561776598606294e-05, "loss": 2.2325, "step": 150384 }, { "epoch": 0.94, "learning_rate": 2.5614543356541393e-05, "loss": 2.2202, "step": 150392 }, { "epoch": 0.94, "learning_rate": 2.561132158184616e-05, "loss": 2.2163, "step": 150400 }, { "epoch": 0.94, "learning_rate": 2.5608100662057333e-05, "loss": 2.226, "step": 150408 }, { "epoch": 0.94, "learning_rate": 2.5604880597254977e-05, "loss": 2.2133, "step": 150416 }, { "epoch": 0.94, "learning_rate": 2.5601661387519148e-05, "loss": 2.22, "step": 150424 }, { "epoch": 0.94, "learning_rate": 2.5598443032929886e-05, "loss": 2.2203, "step": 150432 }, { "epoch": 0.94, "learning_rate": 2.5595225533567175e-05, "loss": 2.2257, "step": 150440 }, { "epoch": 0.94, "learning_rate": 2.5592008889511026e-05, "loss": 2.2159, "step": 150448 }, { "epoch": 0.94, "learning_rate": 2.5588793100841402e-05, "loss": 2.219, "step": 150456 }, { "epoch": 0.94, "learning_rate": 2.5585578167638223e-05, "loss": 2.2316, "step": 150464 }, { "epoch": 0.94, "learning_rate": 2.5582364089981454e-05, "loss": 2.2026, "step": 150472 }, { "epoch": 0.94, "learning_rate": 2.557915086795097e-05, "loss": 2.2042, "step": 150480 }, { "epoch": 0.94, "learning_rate": 2.5575938501626644e-05, "loss": 2.2129, "step": 150488 }, { "epoch": 0.94, "learning_rate": 2.5572726991088363e-05, "loss": 2.2388, "step": 150496 }, { "epoch": 0.94, "learning_rate": 2.5569516336415937e-05, "loss": 2.2166, "step": 150504 }, { "epoch": 0.94, "learning_rate": 2.5566306537689223e-05, "loss": 2.2145, "step": 150512 }, { "epoch": 0.94, "learning_rate": 2.556309759498797e-05, "loss": 2.2288, "step": 150520 }, { "epoch": 0.94, "learning_rate": 2.5559889508391976e-05, "loss": 2.2066, "step": 150528 }, { "epoch": 0.94, "learning_rate": 2.555668227798101e-05, "loss": 2.2149, "step": 150536 }, { "epoch": 0.94, "learning_rate": 2.5553475903834767e-05, "loss": 2.1916, "step": 150544 }, { "epoch": 0.94, "learning_rate": 2.555027038603298e-05, "loss": 2.2299, "step": 150552 }, { "epoch": 0.94, "learning_rate": 2.5547065724655357e-05, "loss": 2.1988, "step": 150560 }, { "epoch": 0.94, "learning_rate": 2.5543861919781532e-05, "loss": 2.2238, "step": 150568 }, { "epoch": 0.94, "learning_rate": 2.554065897149116e-05, "loss": 2.2228, "step": 150576 }, { "epoch": 0.94, "learning_rate": 2.5537456879863873e-05, "loss": 2.2294, "step": 150584 }, { "epoch": 0.94, "learning_rate": 2.5534255644979283e-05, "loss": 2.2179, "step": 150592 }, { "epoch": 0.94, "learning_rate": 2.5531055266916965e-05, "loss": 2.2237, "step": 150600 }, { "epoch": 0.94, "learning_rate": 2.5527855745756467e-05, "loss": 2.2135, "step": 150608 }, { "epoch": 0.94, "learning_rate": 2.552465708157736e-05, "loss": 2.2275, "step": 150616 }, { "epoch": 0.94, "learning_rate": 2.5521459274459137e-05, "loss": 2.2116, "step": 150624 }, { "epoch": 0.94, "learning_rate": 2.5518262324481295e-05, "loss": 2.2254, "step": 150632 }, { "epoch": 0.94, "learning_rate": 2.5515066231723335e-05, "loss": 2.2295, "step": 150640 }, { "epoch": 0.94, "learning_rate": 2.5511870996264696e-05, "loss": 2.2159, "step": 150648 }, { "epoch": 0.94, "learning_rate": 2.5508676618184807e-05, "loss": 2.2227, "step": 150656 }, { "epoch": 0.94, "learning_rate": 2.5505483097563093e-05, "loss": 2.2027, "step": 150664 }, { "epoch": 0.94, "learning_rate": 2.5502290434478944e-05, "loss": 2.2307, "step": 150672 }, { "epoch": 0.94, "learning_rate": 2.5499098629011714e-05, "loss": 2.2281, "step": 150680 }, { "epoch": 0.94, "learning_rate": 2.5495907681240773e-05, "loss": 2.213, "step": 150688 }, { "epoch": 0.94, "learning_rate": 2.549271759124543e-05, "loss": 2.2158, "step": 150696 }, { "epoch": 0.94, "learning_rate": 2.5489528359105e-05, "loss": 2.2204, "step": 150704 }, { "epoch": 0.94, "learning_rate": 2.548633998489877e-05, "loss": 2.2235, "step": 150712 }, { "epoch": 0.94, "learning_rate": 2.5483152468705995e-05, "loss": 2.2159, "step": 150720 }, { "epoch": 0.94, "learning_rate": 2.5479965810605937e-05, "loss": 2.2072, "step": 150728 }, { "epoch": 0.94, "learning_rate": 2.5476780010677787e-05, "loss": 2.228, "step": 150736 }, { "epoch": 0.94, "learning_rate": 2.5473595069000757e-05, "loss": 2.2123, "step": 150744 }, { "epoch": 0.94, "learning_rate": 2.5470410985654046e-05, "loss": 2.2138, "step": 150752 }, { "epoch": 0.94, "learning_rate": 2.5467227760716776e-05, "loss": 2.2171, "step": 150760 }, { "epoch": 0.94, "learning_rate": 2.5464045394268106e-05, "loss": 2.2094, "step": 150768 }, { "epoch": 0.94, "learning_rate": 2.5460863886387142e-05, "loss": 2.233, "step": 150776 }, { "epoch": 0.94, "learning_rate": 2.5457683237152968e-05, "loss": 2.22, "step": 150784 }, { "epoch": 0.94, "learning_rate": 2.5454503446644678e-05, "loss": 2.219, "step": 150792 }, { "epoch": 0.94, "learning_rate": 2.5451324514941294e-05, "loss": 2.2131, "step": 150800 }, { "epoch": 0.94, "learning_rate": 2.5448146442121868e-05, "loss": 2.2116, "step": 150808 }, { "epoch": 0.94, "learning_rate": 2.5444969228265404e-05, "loss": 2.2253, "step": 150816 }, { "epoch": 0.94, "learning_rate": 2.5441792873450864e-05, "loss": 2.2297, "step": 150824 }, { "epoch": 0.94, "learning_rate": 2.5438617377757247e-05, "loss": 2.1875, "step": 150832 }, { "epoch": 0.94, "learning_rate": 2.5435442741263478e-05, "loss": 2.227, "step": 150840 }, { "epoch": 0.94, "learning_rate": 2.5432268964048468e-05, "loss": 2.2225, "step": 150848 }, { "epoch": 0.94, "learning_rate": 2.5429096046191135e-05, "loss": 2.222, "step": 150856 }, { "epoch": 0.94, "learning_rate": 2.542592398777036e-05, "loss": 2.2237, "step": 150864 }, { "epoch": 0.94, "learning_rate": 2.542275278886499e-05, "loss": 2.2295, "step": 150872 }, { "epoch": 0.94, "learning_rate": 2.5419582449553864e-05, "loss": 2.2302, "step": 150880 }, { "epoch": 0.94, "learning_rate": 2.5416412969915804e-05, "loss": 2.2208, "step": 150888 }, { "epoch": 0.94, "learning_rate": 2.5413244350029585e-05, "loss": 2.2288, "step": 150896 }, { "epoch": 0.94, "learning_rate": 2.5410076589974003e-05, "loss": 2.2494, "step": 150904 }, { "epoch": 0.94, "learning_rate": 2.5406909689827797e-05, "loss": 2.212, "step": 150912 }, { "epoch": 0.94, "learning_rate": 2.5403743649669696e-05, "loss": 2.2229, "step": 150920 }, { "epoch": 0.94, "learning_rate": 2.5400578469578405e-05, "loss": 2.2333, "step": 150928 }, { "epoch": 0.94, "learning_rate": 2.5397414149632616e-05, "loss": 2.2342, "step": 150936 }, { "epoch": 0.94, "learning_rate": 2.5394250689911004e-05, "loss": 2.2211, "step": 150944 }, { "epoch": 0.94, "learning_rate": 2.5391088090492188e-05, "loss": 2.213, "step": 150952 }, { "epoch": 0.94, "learning_rate": 2.538792635145481e-05, "loss": 2.2249, "step": 150960 }, { "epoch": 0.94, "learning_rate": 2.5384765472877477e-05, "loss": 2.2306, "step": 150968 }, { "epoch": 0.94, "learning_rate": 2.538160545483874e-05, "loss": 2.2206, "step": 150976 }, { "epoch": 0.94, "learning_rate": 2.537844629741719e-05, "loss": 2.2154, "step": 150984 }, { "epoch": 0.94, "learning_rate": 2.537528800069135e-05, "loss": 2.2267, "step": 150992 }, { "epoch": 0.94, "learning_rate": 2.537213056473973e-05, "loss": 2.2174, "step": 151000 }, { "epoch": 0.94, "learning_rate": 2.5368973989640827e-05, "loss": 2.2024, "step": 151008 }, { "epoch": 0.94, "learning_rate": 2.536581827547311e-05, "loss": 2.2211, "step": 151016 }, { "epoch": 0.94, "learning_rate": 2.5362663422315048e-05, "loss": 2.2136, "step": 151024 }, { "epoch": 0.94, "learning_rate": 2.535950943024506e-05, "loss": 2.2247, "step": 151032 }, { "epoch": 0.94, "learning_rate": 2.5356356299341545e-05, "loss": 2.2311, "step": 151040 }, { "epoch": 0.94, "learning_rate": 2.535320402968291e-05, "loss": 2.2091, "step": 151048 }, { "epoch": 0.94, "learning_rate": 2.5350052621347502e-05, "loss": 2.2278, "step": 151056 }, { "epoch": 0.94, "learning_rate": 2.534690207441367e-05, "loss": 2.2298, "step": 151064 }, { "epoch": 0.94, "learning_rate": 2.534375238895975e-05, "loss": 2.217, "step": 151072 }, { "epoch": 0.94, "learning_rate": 2.5340603565064035e-05, "loss": 2.2181, "step": 151080 }, { "epoch": 0.94, "learning_rate": 2.5337455602804793e-05, "loss": 2.2156, "step": 151088 }, { "epoch": 0.94, "learning_rate": 2.5334308502260306e-05, "loss": 2.2355, "step": 151096 }, { "epoch": 0.94, "learning_rate": 2.5331162263508794e-05, "loss": 2.2385, "step": 151104 }, { "epoch": 0.94, "learning_rate": 2.532801688662847e-05, "loss": 2.221, "step": 151112 }, { "epoch": 0.94, "learning_rate": 2.532487237169755e-05, "loss": 2.208, "step": 151120 }, { "epoch": 0.94, "learning_rate": 2.532172871879419e-05, "loss": 2.2274, "step": 151128 }, { "epoch": 0.94, "learning_rate": 2.531858592799654e-05, "loss": 2.2283, "step": 151136 }, { "epoch": 0.94, "learning_rate": 2.5315443999382732e-05, "loss": 2.2273, "step": 151144 }, { "epoch": 0.94, "learning_rate": 2.5312302933030878e-05, "loss": 2.2268, "step": 151152 }, { "epoch": 0.94, "learning_rate": 2.530916272901908e-05, "loss": 2.2265, "step": 151160 }, { "epoch": 0.94, "learning_rate": 2.5306023387425376e-05, "loss": 2.2279, "step": 151168 }, { "epoch": 0.94, "learning_rate": 2.5302884908327816e-05, "loss": 2.2223, "step": 151176 }, { "epoch": 0.94, "learning_rate": 2.5299747291804456e-05, "loss": 2.222, "step": 151184 }, { "epoch": 0.94, "learning_rate": 2.5296610537933245e-05, "loss": 2.2322, "step": 151192 }, { "epoch": 0.94, "learning_rate": 2.5293474646792204e-05, "loss": 2.232, "step": 151200 }, { "epoch": 0.95, "learning_rate": 2.5290339618459267e-05, "loss": 2.2174, "step": 151208 }, { "epoch": 0.95, "learning_rate": 2.528720545301239e-05, "loss": 2.2248, "step": 151216 }, { "epoch": 0.95, "learning_rate": 2.5284072150529482e-05, "loss": 2.2187, "step": 151224 }, { "epoch": 0.95, "learning_rate": 2.5280939711088425e-05, "loss": 2.2392, "step": 151232 }, { "epoch": 0.95, "learning_rate": 2.5277808134767112e-05, "loss": 2.2267, "step": 151240 }, { "epoch": 0.95, "learning_rate": 2.5274677421643383e-05, "loss": 2.2265, "step": 151248 }, { "epoch": 0.95, "learning_rate": 2.527154757179506e-05, "loss": 2.2383, "step": 151256 }, { "epoch": 0.95, "learning_rate": 2.5268418585299976e-05, "loss": 2.2426, "step": 151264 }, { "epoch": 0.95, "learning_rate": 2.526529046223589e-05, "loss": 2.2327, "step": 151272 }, { "epoch": 0.95, "learning_rate": 2.5262163202680584e-05, "loss": 2.23, "step": 151280 }, { "epoch": 0.95, "learning_rate": 2.52590368067118e-05, "loss": 2.2128, "step": 151288 }, { "epoch": 0.95, "learning_rate": 2.5255911274407264e-05, "loss": 2.2336, "step": 151296 }, { "epoch": 0.95, "learning_rate": 2.5252786605844657e-05, "loss": 2.23, "step": 151304 }, { "epoch": 0.95, "learning_rate": 2.5249662801101687e-05, "loss": 2.2232, "step": 151312 }, { "epoch": 0.95, "learning_rate": 2.5246539860256002e-05, "loss": 2.2172, "step": 151320 }, { "epoch": 0.95, "learning_rate": 2.5243417783385214e-05, "loss": 2.2231, "step": 151328 }, { "epoch": 0.95, "learning_rate": 2.524029657056698e-05, "loss": 2.2301, "step": 151336 }, { "epoch": 0.95, "learning_rate": 2.5237176221878865e-05, "loss": 2.2184, "step": 151344 }, { "epoch": 0.95, "learning_rate": 2.523405673739846e-05, "loss": 2.2203, "step": 151352 }, { "epoch": 0.95, "learning_rate": 2.523093811720329e-05, "loss": 2.2135, "step": 151360 }, { "epoch": 0.95, "learning_rate": 2.52278203613709e-05, "loss": 2.2222, "step": 151368 }, { "epoch": 0.95, "learning_rate": 2.522470346997881e-05, "loss": 2.2114, "step": 151376 }, { "epoch": 0.95, "learning_rate": 2.5221587443104484e-05, "loss": 2.2203, "step": 151384 }, { "epoch": 0.95, "learning_rate": 2.521847228082539e-05, "loss": 2.2274, "step": 151392 }, { "epoch": 0.95, "learning_rate": 2.5215357983219e-05, "loss": 2.2205, "step": 151400 }, { "epoch": 0.95, "learning_rate": 2.521224455036269e-05, "loss": 2.2335, "step": 151408 }, { "epoch": 0.95, "learning_rate": 2.52091319823339e-05, "loss": 2.1936, "step": 151416 }, { "epoch": 0.95, "learning_rate": 2.5206020279209975e-05, "loss": 2.2279, "step": 151424 }, { "epoch": 0.95, "learning_rate": 2.5202909441068308e-05, "loss": 2.202, "step": 151432 }, { "epoch": 0.95, "learning_rate": 2.5199799467986208e-05, "loss": 2.2152, "step": 151440 }, { "epoch": 0.95, "learning_rate": 2.519669036004099e-05, "loss": 2.2215, "step": 151448 }, { "epoch": 0.95, "learning_rate": 2.5193582117309973e-05, "loss": 2.226, "step": 151456 }, { "epoch": 0.95, "learning_rate": 2.5190474739870395e-05, "loss": 2.2147, "step": 151464 }, { "epoch": 0.95, "learning_rate": 2.5187368227799524e-05, "loss": 2.2212, "step": 151472 }, { "epoch": 0.95, "learning_rate": 2.518426258117459e-05, "loss": 2.2174, "step": 151480 }, { "epoch": 0.95, "learning_rate": 2.518115780007279e-05, "loss": 2.2272, "step": 151488 }, { "epoch": 0.95, "learning_rate": 2.5178053884571306e-05, "loss": 2.2187, "step": 151496 }, { "epoch": 0.95, "learning_rate": 2.5174950834747322e-05, "loss": 2.2263, "step": 151504 }, { "epoch": 0.95, "learning_rate": 2.5171848650677964e-05, "loss": 2.2376, "step": 151512 }, { "epoch": 0.95, "learning_rate": 2.5168747332440344e-05, "loss": 2.2249, "step": 151520 }, { "epoch": 0.95, "learning_rate": 2.5165646880111594e-05, "loss": 2.2142, "step": 151528 }, { "epoch": 0.95, "learning_rate": 2.5162547293768763e-05, "loss": 2.2081, "step": 151536 }, { "epoch": 0.95, "learning_rate": 2.5159448573488908e-05, "loss": 2.2017, "step": 151544 }, { "epoch": 0.95, "learning_rate": 2.5156350719349075e-05, "loss": 2.2349, "step": 151552 }, { "epoch": 0.95, "learning_rate": 2.515325373142627e-05, "loss": 2.2291, "step": 151560 }, { "epoch": 0.95, "learning_rate": 2.51501576097975e-05, "loss": 2.2043, "step": 151568 }, { "epoch": 0.95, "learning_rate": 2.514706235453971e-05, "loss": 2.2255, "step": 151576 }, { "epoch": 0.95, "learning_rate": 2.5143967965729854e-05, "loss": 2.2263, "step": 151584 }, { "epoch": 0.95, "learning_rate": 2.5140874443444883e-05, "loss": 2.2243, "step": 151592 }, { "epoch": 0.95, "learning_rate": 2.513778178776167e-05, "loss": 2.2254, "step": 151600 }, { "epoch": 0.95, "learning_rate": 2.5134689998757123e-05, "loss": 2.2242, "step": 151608 }, { "epoch": 0.95, "learning_rate": 2.5131599076508087e-05, "loss": 2.2058, "step": 151616 }, { "epoch": 0.95, "learning_rate": 2.5128509021091408e-05, "loss": 2.2154, "step": 151624 }, { "epoch": 0.95, "learning_rate": 2.5125419832583917e-05, "loss": 2.2185, "step": 151632 }, { "epoch": 0.95, "learning_rate": 2.5122331511062387e-05, "loss": 2.2243, "step": 151640 }, { "epoch": 0.95, "learning_rate": 2.511924405660362e-05, "loss": 2.2181, "step": 151648 }, { "epoch": 0.95, "learning_rate": 2.511615746928436e-05, "loss": 2.2272, "step": 151656 }, { "epoch": 0.95, "learning_rate": 2.511307174918134e-05, "loss": 2.2297, "step": 151664 }, { "epoch": 0.95, "learning_rate": 2.510998689637126e-05, "loss": 2.2278, "step": 151672 }, { "epoch": 0.95, "learning_rate": 2.5106902910930837e-05, "loss": 2.2325, "step": 151680 }, { "epoch": 0.95, "learning_rate": 2.5103819792936707e-05, "loss": 2.2124, "step": 151688 }, { "epoch": 0.95, "learning_rate": 2.5100737542465537e-05, "loss": 2.2123, "step": 151696 }, { "epoch": 0.95, "learning_rate": 2.509765615959396e-05, "loss": 2.2309, "step": 151704 }, { "epoch": 0.95, "learning_rate": 2.5094575644398543e-05, "loss": 2.2154, "step": 151712 }, { "epoch": 0.95, "learning_rate": 2.5091495996955903e-05, "loss": 2.203, "step": 151720 }, { "epoch": 0.95, "learning_rate": 2.50884172173426e-05, "loss": 2.224, "step": 151728 }, { "epoch": 0.95, "learning_rate": 2.5085339305635148e-05, "loss": 2.2129, "step": 151736 }, { "epoch": 0.95, "learning_rate": 2.5082262261910083e-05, "loss": 2.2201, "step": 151744 }, { "epoch": 0.95, "learning_rate": 2.50791860862439e-05, "loss": 2.2175, "step": 151752 }, { "epoch": 0.95, "learning_rate": 2.5076110778713065e-05, "loss": 2.222, "step": 151760 }, { "epoch": 0.95, "learning_rate": 2.507303633939403e-05, "loss": 2.2124, "step": 151768 }, { "epoch": 0.95, "learning_rate": 2.5069962768363226e-05, "loss": 2.2068, "step": 151776 }, { "epoch": 0.95, "learning_rate": 2.506689006569709e-05, "loss": 2.2189, "step": 151784 }, { "epoch": 0.95, "learning_rate": 2.5063818231471964e-05, "loss": 2.212, "step": 151792 }, { "epoch": 0.95, "learning_rate": 2.5060747265764238e-05, "loss": 2.2097, "step": 151800 }, { "epoch": 0.95, "learning_rate": 2.5057677168650273e-05, "loss": 2.2216, "step": 151808 }, { "epoch": 0.95, "learning_rate": 2.5054607940206353e-05, "loss": 2.2286, "step": 151816 }, { "epoch": 0.95, "learning_rate": 2.5051539580508815e-05, "loss": 2.2203, "step": 151824 }, { "epoch": 0.95, "learning_rate": 2.5048472089633924e-05, "loss": 2.2191, "step": 151832 }, { "epoch": 0.95, "learning_rate": 2.504540546765792e-05, "loss": 2.2199, "step": 151840 }, { "epoch": 0.95, "learning_rate": 2.5042339714657082e-05, "loss": 2.2253, "step": 151848 }, { "epoch": 0.95, "learning_rate": 2.503927483070758e-05, "loss": 2.2246, "step": 151856 }, { "epoch": 0.95, "learning_rate": 2.503621081588564e-05, "loss": 2.232, "step": 151864 }, { "epoch": 0.95, "learning_rate": 2.5033147670267425e-05, "loss": 2.2293, "step": 151872 }, { "epoch": 0.95, "learning_rate": 2.503008539392907e-05, "loss": 2.2203, "step": 151880 }, { "epoch": 0.95, "learning_rate": 2.5027023986946723e-05, "loss": 2.2172, "step": 151888 }, { "epoch": 0.95, "learning_rate": 2.5023963449396486e-05, "loss": 2.2218, "step": 151896 }, { "epoch": 0.95, "learning_rate": 2.5020903781354437e-05, "loss": 2.2042, "step": 151904 }, { "epoch": 0.95, "learning_rate": 2.501784498289665e-05, "loss": 2.221, "step": 151912 }, { "epoch": 0.95, "learning_rate": 2.501478705409916e-05, "loss": 2.2121, "step": 151920 }, { "epoch": 0.95, "learning_rate": 2.501172999503798e-05, "loss": 2.2311, "step": 151928 }, { "epoch": 0.95, "learning_rate": 2.500867380578913e-05, "loss": 2.2233, "step": 151936 }, { "epoch": 0.95, "learning_rate": 2.500561848642857e-05, "loss": 2.2093, "step": 151944 }, { "epoch": 0.95, "learning_rate": 2.5002564037032255e-05, "loss": 2.2321, "step": 151952 }, { "epoch": 0.95, "learning_rate": 2.4999510457676138e-05, "loss": 2.2092, "step": 151960 }, { "epoch": 0.95, "learning_rate": 2.4996457748436113e-05, "loss": 2.2241, "step": 151968 }, { "epoch": 0.95, "learning_rate": 2.4993405909388078e-05, "loss": 2.2058, "step": 151976 }, { "epoch": 0.95, "learning_rate": 2.4990354940607887e-05, "loss": 2.2299, "step": 151984 }, { "epoch": 0.95, "learning_rate": 2.4987304842171406e-05, "loss": 2.2344, "step": 151992 }, { "epoch": 0.95, "learning_rate": 2.4984255614154463e-05, "loss": 2.2211, "step": 152000 }, { "epoch": 0.95, "learning_rate": 2.4981207256632843e-05, "loss": 2.2212, "step": 152008 }, { "epoch": 0.95, "learning_rate": 2.497815976968234e-05, "loss": 2.228, "step": 152016 }, { "epoch": 0.95, "learning_rate": 2.4975113153378734e-05, "loss": 2.2254, "step": 152024 }, { "epoch": 0.95, "learning_rate": 2.497206740779772e-05, "loss": 2.2019, "step": 152032 }, { "epoch": 0.95, "learning_rate": 2.4969022533015056e-05, "loss": 2.2151, "step": 152040 }, { "epoch": 0.95, "learning_rate": 2.4965978529106423e-05, "loss": 2.2173, "step": 152048 }, { "epoch": 0.95, "learning_rate": 2.4962935396147484e-05, "loss": 2.2131, "step": 152056 }, { "epoch": 0.95, "learning_rate": 2.4959893134213908e-05, "loss": 2.2294, "step": 152064 }, { "epoch": 0.95, "learning_rate": 2.4956851743381313e-05, "loss": 2.2088, "step": 152072 }, { "epoch": 0.95, "learning_rate": 2.4953811223725323e-05, "loss": 2.2159, "step": 152080 }, { "epoch": 0.95, "learning_rate": 2.4950771575321518e-05, "loss": 2.2413, "step": 152088 }, { "epoch": 0.95, "learning_rate": 2.494773279824546e-05, "loss": 2.2225, "step": 152096 }, { "epoch": 0.95, "learning_rate": 2.49446948925727e-05, "loss": 2.2218, "step": 152104 }, { "epoch": 0.95, "learning_rate": 2.494165785837876e-05, "loss": 2.2312, "step": 152112 }, { "epoch": 0.95, "learning_rate": 2.4938621695739134e-05, "loss": 2.2248, "step": 152120 }, { "epoch": 0.95, "learning_rate": 2.493558640472931e-05, "loss": 2.234, "step": 152128 }, { "epoch": 0.95, "learning_rate": 2.4932551985424743e-05, "loss": 2.2296, "step": 152136 }, { "epoch": 0.95, "learning_rate": 2.4929518437900863e-05, "loss": 2.2111, "step": 152144 }, { "epoch": 0.95, "learning_rate": 2.49264857622331e-05, "loss": 2.2245, "step": 152152 }, { "epoch": 0.95, "learning_rate": 2.492345395849683e-05, "loss": 2.2221, "step": 152160 }, { "epoch": 0.95, "learning_rate": 2.4920423026767423e-05, "loss": 2.2299, "step": 152168 }, { "epoch": 0.95, "learning_rate": 2.4917392967120245e-05, "loss": 2.2225, "step": 152176 }, { "epoch": 0.95, "learning_rate": 2.491436377963061e-05, "loss": 2.2305, "step": 152184 }, { "epoch": 0.95, "learning_rate": 2.4911335464373832e-05, "loss": 2.2209, "step": 152192 }, { "epoch": 0.95, "learning_rate": 2.4908308021425182e-05, "loss": 2.2264, "step": 152200 }, { "epoch": 0.95, "learning_rate": 2.490528145085993e-05, "loss": 2.2301, "step": 152208 }, { "epoch": 0.95, "learning_rate": 2.490225575275334e-05, "loss": 2.214, "step": 152216 }, { "epoch": 0.95, "learning_rate": 2.4899230927180593e-05, "loss": 2.2301, "step": 152224 }, { "epoch": 0.95, "learning_rate": 2.48962069742169e-05, "loss": 2.2186, "step": 152232 }, { "epoch": 0.95, "learning_rate": 2.489318389393746e-05, "loss": 2.2287, "step": 152240 }, { "epoch": 0.95, "learning_rate": 2.4890161686417385e-05, "loss": 2.2369, "step": 152248 }, { "epoch": 0.95, "learning_rate": 2.4887140351731845e-05, "loss": 2.2088, "step": 152256 }, { "epoch": 0.95, "learning_rate": 2.488411988995592e-05, "loss": 2.214, "step": 152264 }, { "epoch": 0.95, "learning_rate": 2.4881100301164727e-05, "loss": 2.2262, "step": 152272 }, { "epoch": 0.95, "learning_rate": 2.4878081585433323e-05, "loss": 2.222, "step": 152280 }, { "epoch": 0.95, "learning_rate": 2.4875063742836738e-05, "loss": 2.2306, "step": 152288 }, { "epoch": 0.95, "learning_rate": 2.4872046773450024e-05, "loss": 2.2087, "step": 152296 }, { "epoch": 0.95, "learning_rate": 2.486903067734816e-05, "loss": 2.2218, "step": 152304 }, { "epoch": 0.95, "learning_rate": 2.486601545460613e-05, "loss": 2.208, "step": 152312 }, { "epoch": 0.95, "learning_rate": 2.486300110529891e-05, "loss": 2.2242, "step": 152320 }, { "epoch": 0.95, "learning_rate": 2.4859987629501426e-05, "loss": 2.2171, "step": 152328 }, { "epoch": 0.95, "learning_rate": 2.4856975027288577e-05, "loss": 2.2157, "step": 152336 }, { "epoch": 0.95, "learning_rate": 2.485396329873528e-05, "loss": 2.224, "step": 152344 }, { "epoch": 0.95, "learning_rate": 2.4850952443916403e-05, "loss": 2.2223, "step": 152352 }, { "epoch": 0.95, "learning_rate": 2.484794246290678e-05, "loss": 2.2302, "step": 152360 }, { "epoch": 0.95, "learning_rate": 2.4844933355781265e-05, "loss": 2.2203, "step": 152368 }, { "epoch": 0.95, "learning_rate": 2.4841925122614648e-05, "loss": 2.2085, "step": 152376 }, { "epoch": 0.95, "learning_rate": 2.4838917763481706e-05, "loss": 2.2323, "step": 152384 }, { "epoch": 0.95, "learning_rate": 2.4835911278457227e-05, "loss": 2.2313, "step": 152392 }, { "epoch": 0.95, "learning_rate": 2.4832905667615937e-05, "loss": 2.2044, "step": 152400 }, { "epoch": 0.95, "learning_rate": 2.482990093103256e-05, "loss": 2.2184, "step": 152408 }, { "epoch": 0.95, "learning_rate": 2.4826897068781775e-05, "loss": 2.2151, "step": 152416 }, { "epoch": 0.95, "learning_rate": 2.4823894080938282e-05, "loss": 2.2266, "step": 152424 }, { "epoch": 0.95, "learning_rate": 2.4820891967576744e-05, "loss": 2.2322, "step": 152432 }, { "epoch": 0.95, "learning_rate": 2.4817890728771763e-05, "loss": 2.2269, "step": 152440 }, { "epoch": 0.95, "learning_rate": 2.4814890364597974e-05, "loss": 2.2088, "step": 152448 }, { "epoch": 0.95, "learning_rate": 2.481189087512996e-05, "loss": 2.2369, "step": 152456 }, { "epoch": 0.95, "learning_rate": 2.4808892260442272e-05, "loss": 2.227, "step": 152464 }, { "epoch": 0.95, "learning_rate": 2.4805894520609485e-05, "loss": 2.2191, "step": 152472 }, { "epoch": 0.95, "learning_rate": 2.4802897655706102e-05, "loss": 2.222, "step": 152480 }, { "epoch": 0.95, "learning_rate": 2.4799901665806635e-05, "loss": 2.2226, "step": 152488 }, { "epoch": 0.95, "learning_rate": 2.4796906550985567e-05, "loss": 2.2297, "step": 152496 }, { "epoch": 0.95, "learning_rate": 2.479391231131734e-05, "loss": 2.2248, "step": 152504 }, { "epoch": 0.95, "learning_rate": 2.4790918946876417e-05, "loss": 2.2297, "step": 152512 }, { "epoch": 0.95, "learning_rate": 2.478792645773719e-05, "loss": 2.2204, "step": 152520 }, { "epoch": 0.95, "learning_rate": 2.4784934843974057e-05, "loss": 2.2249, "step": 152528 }, { "epoch": 0.95, "learning_rate": 2.4781944105661405e-05, "loss": 2.2288, "step": 152536 }, { "epoch": 0.95, "learning_rate": 2.4778954242873574e-05, "loss": 2.2194, "step": 152544 }, { "epoch": 0.95, "learning_rate": 2.4775965255684887e-05, "loss": 2.2275, "step": 152552 }, { "epoch": 0.95, "learning_rate": 2.4772977144169658e-05, "loss": 2.2079, "step": 152560 }, { "epoch": 0.95, "learning_rate": 2.4769989908402173e-05, "loss": 2.207, "step": 152568 }, { "epoch": 0.95, "learning_rate": 2.4767003548456683e-05, "loss": 2.2257, "step": 152576 }, { "epoch": 0.95, "learning_rate": 2.4764018064407445e-05, "loss": 2.2307, "step": 152584 }, { "epoch": 0.95, "learning_rate": 2.4761033456328672e-05, "loss": 2.1986, "step": 152592 }, { "epoch": 0.95, "learning_rate": 2.4758049724294556e-05, "loss": 2.2179, "step": 152600 }, { "epoch": 0.95, "learning_rate": 2.4755066868379285e-05, "loss": 2.2383, "step": 152608 }, { "epoch": 0.95, "learning_rate": 2.475208488865699e-05, "loss": 2.229, "step": 152616 }, { "epoch": 0.95, "learning_rate": 2.4749103785201844e-05, "loss": 2.2006, "step": 152624 }, { "epoch": 0.95, "learning_rate": 2.4746123558087918e-05, "loss": 2.2153, "step": 152632 }, { "epoch": 0.95, "learning_rate": 2.4743144207389306e-05, "loss": 2.2213, "step": 152640 }, { "epoch": 0.95, "learning_rate": 2.474016573318011e-05, "loss": 2.2119, "step": 152648 }, { "epoch": 0.95, "learning_rate": 2.473718813553433e-05, "loss": 2.2232, "step": 152656 }, { "epoch": 0.95, "learning_rate": 2.473421141452602e-05, "loss": 2.2235, "step": 152664 }, { "epoch": 0.95, "learning_rate": 2.4731235570229167e-05, "loss": 2.2186, "step": 152672 }, { "epoch": 0.95, "learning_rate": 2.4728260602717748e-05, "loss": 2.2247, "step": 152680 }, { "epoch": 0.95, "learning_rate": 2.472528651206574e-05, "loss": 2.2344, "step": 152688 }, { "epoch": 0.95, "learning_rate": 2.4722313298347055e-05, "loss": 2.2218, "step": 152696 }, { "epoch": 0.95, "learning_rate": 2.471934096163563e-05, "loss": 2.2319, "step": 152704 }, { "epoch": 0.95, "learning_rate": 2.4716369502005343e-05, "loss": 2.2293, "step": 152712 }, { "epoch": 0.95, "learning_rate": 2.471339891953006e-05, "loss": 2.2333, "step": 152720 }, { "epoch": 0.95, "learning_rate": 2.471042921428365e-05, "loss": 2.2089, "step": 152728 }, { "epoch": 0.95, "learning_rate": 2.470746038633993e-05, "loss": 2.2169, "step": 152736 }, { "epoch": 0.95, "learning_rate": 2.47044924357727e-05, "loss": 2.2189, "step": 152744 }, { "epoch": 0.95, "learning_rate": 2.470152536265575e-05, "loss": 2.2143, "step": 152752 }, { "epoch": 0.95, "learning_rate": 2.469855916706284e-05, "loss": 2.2237, "step": 152760 }, { "epoch": 0.95, "learning_rate": 2.4695593849067705e-05, "loss": 2.2371, "step": 152768 }, { "epoch": 0.95, "learning_rate": 2.4692629408744074e-05, "loss": 2.2092, "step": 152776 }, { "epoch": 0.95, "learning_rate": 2.468966584616564e-05, "loss": 2.2339, "step": 152784 }, { "epoch": 0.95, "learning_rate": 2.4686703161406062e-05, "loss": 2.2379, "step": 152792 }, { "epoch": 0.95, "learning_rate": 2.468374135453902e-05, "loss": 2.2349, "step": 152800 }, { "epoch": 0.96, "learning_rate": 2.4680780425638126e-05, "loss": 2.2193, "step": 152808 }, { "epoch": 0.96, "learning_rate": 2.4677820374776996e-05, "loss": 2.2138, "step": 152816 }, { "epoch": 0.96, "learning_rate": 2.4674861202029203e-05, "loss": 2.2158, "step": 152824 }, { "epoch": 0.96, "learning_rate": 2.4671902907468323e-05, "loss": 2.2103, "step": 152832 }, { "epoch": 0.96, "learning_rate": 2.466894549116792e-05, "loss": 2.2272, "step": 152840 }, { "epoch": 0.96, "learning_rate": 2.466598895320148e-05, "loss": 2.2189, "step": 152848 }, { "epoch": 0.96, "learning_rate": 2.4663033293642522e-05, "loss": 2.2176, "step": 152856 }, { "epoch": 0.96, "learning_rate": 2.466007851256453e-05, "loss": 2.2325, "step": 152864 }, { "epoch": 0.96, "learning_rate": 2.465712461004094e-05, "loss": 2.2121, "step": 152872 }, { "epoch": 0.96, "learning_rate": 2.4654171586145203e-05, "loss": 2.2014, "step": 152880 }, { "epoch": 0.96, "learning_rate": 2.4651219440950723e-05, "loss": 2.2179, "step": 152888 }, { "epoch": 0.96, "learning_rate": 2.4648268174530893e-05, "loss": 2.2119, "step": 152896 }, { "epoch": 0.96, "learning_rate": 2.4645317786959086e-05, "loss": 2.2267, "step": 152904 }, { "epoch": 0.96, "learning_rate": 2.4642368278308642e-05, "loss": 2.2312, "step": 152912 }, { "epoch": 0.96, "learning_rate": 2.4639419648652896e-05, "loss": 2.2066, "step": 152920 }, { "epoch": 0.96, "learning_rate": 2.4636471898065142e-05, "loss": 2.2221, "step": 152928 }, { "epoch": 0.96, "learning_rate": 2.4633525026618656e-05, "loss": 2.2261, "step": 152936 }, { "epoch": 0.96, "learning_rate": 2.4630579034386716e-05, "loss": 2.2214, "step": 152944 }, { "epoch": 0.96, "learning_rate": 2.462763392144255e-05, "loss": 2.2236, "step": 152952 }, { "epoch": 0.96, "learning_rate": 2.4624689687859364e-05, "loss": 2.2429, "step": 152960 }, { "epoch": 0.96, "learning_rate": 2.4621746333710372e-05, "loss": 2.2128, "step": 152968 }, { "epoch": 0.96, "learning_rate": 2.461880385906873e-05, "loss": 2.2211, "step": 152976 }, { "epoch": 0.96, "learning_rate": 2.4615862264007595e-05, "loss": 2.2201, "step": 152984 }, { "epoch": 0.96, "learning_rate": 2.4612921548600092e-05, "loss": 2.2142, "step": 152992 }, { "epoch": 0.96, "learning_rate": 2.460998171291934e-05, "loss": 2.2202, "step": 153000 }, { "epoch": 0.96, "learning_rate": 2.4607042757038392e-05, "loss": 2.2128, "step": 153008 }, { "epoch": 0.96, "learning_rate": 2.460410468103035e-05, "loss": 2.2307, "step": 153016 }, { "epoch": 0.96, "learning_rate": 2.4601167484968233e-05, "loss": 2.231, "step": 153024 }, { "epoch": 0.96, "learning_rate": 2.4598231168925067e-05, "loss": 2.2058, "step": 153032 }, { "epoch": 0.96, "learning_rate": 2.459529573297384e-05, "loss": 2.2111, "step": 153040 }, { "epoch": 0.96, "learning_rate": 2.4592361177187524e-05, "loss": 2.2191, "step": 153048 }, { "epoch": 0.96, "learning_rate": 2.4589427501639108e-05, "loss": 2.2328, "step": 153056 }, { "epoch": 0.96, "learning_rate": 2.458649470640148e-05, "loss": 2.2118, "step": 153064 }, { "epoch": 0.96, "learning_rate": 2.4583562791547562e-05, "loss": 2.2287, "step": 153072 }, { "epoch": 0.96, "learning_rate": 2.4580631757150264e-05, "loss": 2.2221, "step": 153080 }, { "epoch": 0.96, "learning_rate": 2.457770160328242e-05, "loss": 2.2266, "step": 153088 }, { "epoch": 0.96, "learning_rate": 2.457477233001689e-05, "loss": 2.2341, "step": 153096 }, { "epoch": 0.96, "learning_rate": 2.4571843937426506e-05, "loss": 2.2283, "step": 153104 }, { "epoch": 0.96, "learning_rate": 2.4568916425584042e-05, "loss": 2.2228, "step": 153112 }, { "epoch": 0.96, "learning_rate": 2.4565989794562297e-05, "loss": 2.2158, "step": 153120 }, { "epoch": 0.96, "learning_rate": 2.4563064044434017e-05, "loss": 2.2302, "step": 153128 }, { "epoch": 0.96, "learning_rate": 2.456013917527195e-05, "loss": 2.2262, "step": 153136 }, { "epoch": 0.96, "learning_rate": 2.4557215187148796e-05, "loss": 2.2264, "step": 153144 }, { "epoch": 0.96, "learning_rate": 2.4554292080137243e-05, "loss": 2.2253, "step": 153152 }, { "epoch": 0.96, "learning_rate": 2.455136985430997e-05, "loss": 2.2219, "step": 153160 }, { "epoch": 0.96, "learning_rate": 2.4548448509739628e-05, "loss": 2.2202, "step": 153168 }, { "epoch": 0.96, "learning_rate": 2.4545528046498816e-05, "loss": 2.2074, "step": 153176 }, { "epoch": 0.96, "learning_rate": 2.4542608464660167e-05, "loss": 2.2147, "step": 153184 }, { "epoch": 0.96, "learning_rate": 2.453968976429625e-05, "loss": 2.2185, "step": 153192 }, { "epoch": 0.96, "learning_rate": 2.453677194547962e-05, "loss": 2.2098, "step": 153200 }, { "epoch": 0.96, "learning_rate": 2.4533855008282823e-05, "loss": 2.2098, "step": 153208 }, { "epoch": 0.96, "learning_rate": 2.4530938952778366e-05, "loss": 2.217, "step": 153216 }, { "epoch": 0.96, "learning_rate": 2.452802377903874e-05, "loss": 2.2256, "step": 153224 }, { "epoch": 0.96, "learning_rate": 2.4525109487136432e-05, "loss": 2.2211, "step": 153232 }, { "epoch": 0.96, "learning_rate": 2.4522196077143884e-05, "loss": 2.2395, "step": 153240 }, { "epoch": 0.96, "learning_rate": 2.451928354913352e-05, "loss": 2.2218, "step": 153248 }, { "epoch": 0.96, "learning_rate": 2.451637190317774e-05, "loss": 2.2084, "step": 153256 }, { "epoch": 0.96, "learning_rate": 2.4513461139348932e-05, "loss": 2.2294, "step": 153264 }, { "epoch": 0.96, "learning_rate": 2.4510551257719483e-05, "loss": 2.2362, "step": 153272 }, { "epoch": 0.96, "learning_rate": 2.4507642258361695e-05, "loss": 2.2187, "step": 153280 }, { "epoch": 0.96, "learning_rate": 2.4504734141347914e-05, "loss": 2.224, "step": 153288 }, { "epoch": 0.96, "learning_rate": 2.4501826906750418e-05, "loss": 2.2278, "step": 153296 }, { "epoch": 0.96, "learning_rate": 2.4498920554641482e-05, "loss": 2.2167, "step": 153304 }, { "epoch": 0.96, "learning_rate": 2.4496015085093372e-05, "loss": 2.2218, "step": 153312 }, { "epoch": 0.96, "learning_rate": 2.4493110498178303e-05, "loss": 2.2152, "step": 153320 }, { "epoch": 0.96, "learning_rate": 2.4490206793968496e-05, "loss": 2.2276, "step": 153328 }, { "epoch": 0.96, "learning_rate": 2.4487303972536135e-05, "loss": 2.2219, "step": 153336 }, { "epoch": 0.96, "learning_rate": 2.4484402033953374e-05, "loss": 2.2271, "step": 153344 }, { "epoch": 0.96, "learning_rate": 2.4481500978292374e-05, "loss": 2.2177, "step": 153352 }, { "epoch": 0.96, "learning_rate": 2.447860080562524e-05, "loss": 2.2443, "step": 153360 }, { "epoch": 0.96, "learning_rate": 2.4475701516024065e-05, "loss": 2.2308, "step": 153368 }, { "epoch": 0.96, "learning_rate": 2.447280310956095e-05, "loss": 2.2181, "step": 153376 }, { "epoch": 0.96, "learning_rate": 2.4469905586307934e-05, "loss": 2.2009, "step": 153384 }, { "epoch": 0.96, "learning_rate": 2.4467008946337043e-05, "loss": 2.2071, "step": 153392 }, { "epoch": 0.96, "learning_rate": 2.4464113189720307e-05, "loss": 2.2356, "step": 153400 }, { "epoch": 0.96, "learning_rate": 2.44612183165297e-05, "loss": 2.2155, "step": 153408 }, { "epoch": 0.96, "learning_rate": 2.445832432683719e-05, "loss": 2.2199, "step": 153416 }, { "epoch": 0.96, "learning_rate": 2.445543122071473e-05, "loss": 2.2096, "step": 153424 }, { "epoch": 0.96, "learning_rate": 2.4452538998234238e-05, "loss": 2.2147, "step": 153432 }, { "epoch": 0.96, "learning_rate": 2.44496476594676e-05, "loss": 2.2202, "step": 153440 }, { "epoch": 0.96, "learning_rate": 2.4446757204486727e-05, "loss": 2.2273, "step": 153448 }, { "epoch": 0.96, "learning_rate": 2.444386763336345e-05, "loss": 2.2249, "step": 153456 }, { "epoch": 0.96, "learning_rate": 2.4440978946169628e-05, "loss": 2.2044, "step": 153464 }, { "epoch": 0.96, "learning_rate": 2.4438091142977038e-05, "loss": 2.2217, "step": 153472 }, { "epoch": 0.96, "learning_rate": 2.44352042238575e-05, "loss": 2.2199, "step": 153480 }, { "epoch": 0.96, "learning_rate": 2.4432318188882786e-05, "loss": 2.2096, "step": 153488 }, { "epoch": 0.96, "learning_rate": 2.4429433038124615e-05, "loss": 2.217, "step": 153496 }, { "epoch": 0.96, "learning_rate": 2.4426548771654745e-05, "loss": 2.2312, "step": 153504 }, { "epoch": 0.96, "learning_rate": 2.4423665389544857e-05, "loss": 2.2162, "step": 153512 }, { "epoch": 0.96, "learning_rate": 2.4420782891866637e-05, "loss": 2.2312, "step": 153520 }, { "epoch": 0.96, "learning_rate": 2.4417901278691747e-05, "loss": 2.2057, "step": 153528 }, { "epoch": 0.96, "learning_rate": 2.4415020550091823e-05, "loss": 2.2331, "step": 153536 }, { "epoch": 0.96, "learning_rate": 2.4412140706138485e-05, "loss": 2.2085, "step": 153544 }, { "epoch": 0.96, "learning_rate": 2.440926174690332e-05, "loss": 2.2107, "step": 153552 }, { "epoch": 0.96, "learning_rate": 2.4406383672457896e-05, "loss": 2.224, "step": 153560 }, { "epoch": 0.96, "learning_rate": 2.4403506482873772e-05, "loss": 2.2057, "step": 153568 }, { "epoch": 0.96, "learning_rate": 2.440063017822247e-05, "loss": 2.2312, "step": 153576 }, { "epoch": 0.96, "learning_rate": 2.4397754758575497e-05, "loss": 2.2279, "step": 153584 }, { "epoch": 0.96, "learning_rate": 2.4394880224004335e-05, "loss": 2.2363, "step": 153592 }, { "epoch": 0.96, "learning_rate": 2.439200657458045e-05, "loss": 2.2363, "step": 153600 } ], "logging_steps": 8, "max_steps": 160000, "num_input_tokens_seen": 0, "num_train_epochs": 9223372036854775807, "save_steps": 1600, "total_flos": 2.828530564580839e+21, "train_batch_size": 26, "trial_name": null, "trial_params": null }