{"current_steps": 5, "total_steps": 6250, "loss": 1.0428, "learning_rate": 4.999992104320636e-05, "epoch": 0.0008, "percentage": 0.08, "elapsed_time": "0:00:20", "remaining_time": "6:59:52", "throughput": 1319.95, "total_tokens": 26624} {"current_steps": 10, "total_steps": 6250, "loss": 1.1061, "learning_rate": 4.999968417332415e-05, "epoch": 0.0016, "percentage": 0.16, "elapsed_time": "0:00:43", "remaining_time": "7:36:30", "throughput": 1171.15, "total_tokens": 51408} {"current_steps": 15, "total_steps": 6250, "loss": 1.0426, "learning_rate": 4.999928939184958e-05, "epoch": 0.0024, "percentage": 0.24, "elapsed_time": "0:01:10", "remaining_time": "8:08:50", "throughput": 1063.46, "total_tokens": 75040} {"current_steps": 20, "total_steps": 6250, "loss": 1.1472, "learning_rate": 4.9998736701276295e-05, "epoch": 0.0032, "percentage": 0.32, "elapsed_time": "0:01:36", "remaining_time": "8:22:35", "throughput": 1021.09, "total_tokens": 98848} {"current_steps": 25, "total_steps": 6250, "loss": 0.9781, "learning_rate": 4.9998026105095405e-05, "epoch": 0.004, "percentage": 0.4, "elapsed_time": "0:02:04", "remaining_time": "8:34:50", "throughput": 992.31, "total_tokens": 123104} {"current_steps": 30, "total_steps": 6250, "loss": 0.9889, "learning_rate": 4.999715760779541e-05, "epoch": 0.0048, "percentage": 0.48, "elapsed_time": "0:02:40", "remaining_time": "9:13:18", "throughput": 950.17, "total_tokens": 152144} {"current_steps": 35, "total_steps": 6250, "loss": 0.9345, "learning_rate": 4.999613121486222e-05, "epoch": 0.0056, "percentage": 0.56, "elapsed_time": "0:03:06", "remaining_time": "9:12:49", "throughput": 948.72, "total_tokens": 177216} {"current_steps": 40, "total_steps": 6250, "loss": 0.8539, "learning_rate": 4.999494693277907e-05, "epoch": 0.0064, "percentage": 0.64, "elapsed_time": "0:03:36", "remaining_time": "9:20:42", "throughput": 937.48, "total_tokens": 203152} {"current_steps": 45, "total_steps": 6250, "loss": 0.9183, "learning_rate": 4.999360476902656e-05, "epoch": 0.0072, "percentage": 0.72, "elapsed_time": "0:04:00", "remaining_time": "9:12:48", "throughput": 971.0, "total_tokens": 233568} {"current_steps": 50, "total_steps": 6250, "loss": 0.873, "learning_rate": 4.99921047320825e-05, "epoch": 0.008, "percentage": 0.8, "elapsed_time": "0:04:28", "remaining_time": "9:13:59", "throughput": 987.67, "total_tokens": 264752} {"current_steps": 55, "total_steps": 6250, "loss": 0.8676, "learning_rate": 4.9990446831421955e-05, "epoch": 0.0088, "percentage": 0.88, "elapsed_time": "0:04:52", "remaining_time": "9:09:27", "throughput": 994.38, "total_tokens": 291040} {"current_steps": 60, "total_steps": 6250, "loss": 0.9004, "learning_rate": 4.998863107751711e-05, "epoch": 0.0096, "percentage": 0.96, "elapsed_time": "0:05:18", "remaining_time": "9:07:41", "throughput": 1010.13, "total_tokens": 321760} {"current_steps": 65, "total_steps": 6250, "loss": 0.8536, "learning_rate": 4.9986657481837277e-05, "epoch": 0.0104, "percentage": 1.04, "elapsed_time": "0:05:40", "remaining_time": "9:00:02", "throughput": 1019.52, "total_tokens": 347168} {"current_steps": 70, "total_steps": 6250, "loss": 0.8027, "learning_rate": 4.998452605684874e-05, "epoch": 0.0112, "percentage": 1.12, "elapsed_time": "0:06:00", "remaining_time": "8:51:02", "throughput": 1035.97, "total_tokens": 373888} {"current_steps": 75, "total_steps": 6250, "loss": 0.8075, "learning_rate": 4.998223681601473e-05, "epoch": 0.012, "percentage": 1.2, "elapsed_time": "0:06:20", "remaining_time": "8:42:07", "throughput": 1047.99, "total_tokens": 398752} {"current_steps": 80, "total_steps": 6250, "loss": 0.7919, "learning_rate": 4.997978977379536e-05, "epoch": 0.0128, "percentage": 1.28, "elapsed_time": "0:06:39", "remaining_time": "8:32:58", "throughput": 1055.8, "total_tokens": 421344} {"current_steps": 85, "total_steps": 6250, "loss": 0.7512, "learning_rate": 4.9977184945647473e-05, "epoch": 0.0136, "percentage": 1.36, "elapsed_time": "0:07:03", "remaining_time": "8:31:38", "throughput": 1066.25, "total_tokens": 451296} {"current_steps": 90, "total_steps": 6250, "loss": 0.7713, "learning_rate": 4.997442234802456e-05, "epoch": 0.0144, "percentage": 1.44, "elapsed_time": "0:07:24", "remaining_time": "8:27:35", "throughput": 1084.14, "total_tokens": 482416} {"current_steps": 95, "total_steps": 6250, "loss": 0.7965, "learning_rate": 4.997150199837671e-05, "epoch": 0.0152, "percentage": 1.52, "elapsed_time": "0:07:49", "remaining_time": "8:27:25", "throughput": 1091.71, "total_tokens": 513008} {"current_steps": 100, "total_steps": 6250, "loss": 0.8623, "learning_rate": 4.996842391515044e-05, "epoch": 0.016, "percentage": 1.6, "elapsed_time": "0:08:11", "remaining_time": "8:23:56", "throughput": 1094.25, "total_tokens": 537984} {"current_steps": 105, "total_steps": 6250, "loss": 0.7797, "learning_rate": 4.996518811778858e-05, "epoch": 0.0168, "percentage": 1.68, "elapsed_time": "0:08:33", "remaining_time": "8:21:20", "throughput": 1098.33, "total_tokens": 564528} {"current_steps": 110, "total_steps": 6250, "loss": 0.7732, "learning_rate": 4.99617946267302e-05, "epoch": 0.0176, "percentage": 1.76, "elapsed_time": "0:08:54", "remaining_time": "8:17:19", "throughput": 1101.04, "total_tokens": 588608} {"current_steps": 115, "total_steps": 6250, "loss": 0.7478, "learning_rate": 4.9958243463410414e-05, "epoch": 0.0184, "percentage": 1.84, "elapsed_time": "0:09:25", "remaining_time": "8:22:28", "throughput": 1098.41, "total_tokens": 620752} {"current_steps": 120, "total_steps": 6250, "loss": 0.7194, "learning_rate": 4.995453465026032e-05, "epoch": 0.0192, "percentage": 1.92, "elapsed_time": "0:09:48", "remaining_time": "8:21:04", "throughput": 1103.07, "total_tokens": 649200} {"current_steps": 125, "total_steps": 6250, "loss": 0.7506, "learning_rate": 4.995066821070679e-05, "epoch": 0.02, "percentage": 2.0, "elapsed_time": "0:10:12", "remaining_time": "8:19:52", "throughput": 1109.65, "total_tokens": 679200} {"current_steps": 130, "total_steps": 6250, "loss": 0.6886, "learning_rate": 4.9946644169172355e-05, "epoch": 0.0208, "percentage": 2.08, "elapsed_time": "0:10:33", "remaining_time": "8:17:24", "throughput": 1107.56, "total_tokens": 702144} {"current_steps": 135, "total_steps": 6250, "loss": 0.8481, "learning_rate": 4.9942462551075056e-05, "epoch": 0.0216, "percentage": 2.16, "elapsed_time": "0:11:01", "remaining_time": "8:19:14", "throughput": 1104.08, "total_tokens": 730128} {"current_steps": 140, "total_steps": 6250, "loss": 0.7999, "learning_rate": 4.993812338282826e-05, "epoch": 0.0224, "percentage": 2.24, "elapsed_time": "0:11:23", "remaining_time": "8:16:59", "throughput": 1108.3, "total_tokens": 757248} {"current_steps": 145, "total_steps": 6250, "loss": 0.7877, "learning_rate": 4.993362669184051e-05, "epoch": 0.0232, "percentage": 2.32, "elapsed_time": "0:11:48", "remaining_time": "8:17:02", "throughput": 1109.8, "total_tokens": 786096} {"current_steps": 150, "total_steps": 6250, "loss": 0.9312, "learning_rate": 4.992897250651535e-05, "epoch": 0.024, "percentage": 2.4, "elapsed_time": "0:12:12", "remaining_time": "8:16:39", "throughput": 1111.09, "total_tokens": 814192} {"current_steps": 155, "total_steps": 6250, "loss": 0.8767, "learning_rate": 4.992416085625115e-05, "epoch": 0.0248, "percentage": 2.48, "elapsed_time": "0:12:36", "remaining_time": "8:15:56", "throughput": 1110.22, "total_tokens": 840144} {"current_steps": 160, "total_steps": 6250, "loss": 0.8646, "learning_rate": 4.9919191771440905e-05, "epoch": 0.0256, "percentage": 2.56, "elapsed_time": "0:13:01", "remaining_time": "8:15:30", "throughput": 1114.29, "total_tokens": 870368} {"current_steps": 165, "total_steps": 6250, "loss": 0.7159, "learning_rate": 4.991406528347206e-05, "epoch": 0.0264, "percentage": 2.64, "elapsed_time": "0:13:26", "remaining_time": "8:15:58", "throughput": 1111.99, "total_tokens": 897296} {"current_steps": 170, "total_steps": 6250, "loss": 0.7573, "learning_rate": 4.990878142472628e-05, "epoch": 0.0272, "percentage": 2.72, "elapsed_time": "0:13:52", "remaining_time": "8:16:09", "throughput": 1110.79, "total_tokens": 924576} {"current_steps": 175, "total_steps": 6250, "loss": 0.8083, "learning_rate": 4.990334022857932e-05, "epoch": 0.028, "percentage": 2.8, "elapsed_time": "0:14:14", "remaining_time": "8:14:13", "throughput": 1107.27, "total_tokens": 945856} {"current_steps": 180, "total_steps": 6250, "loss": 0.7074, "learning_rate": 4.9897741729400705e-05, "epoch": 0.0288, "percentage": 2.88, "elapsed_time": "0:14:34", "remaining_time": "8:11:43", "throughput": 1109.16, "total_tokens": 970416} {"current_steps": 185, "total_steps": 6250, "loss": 0.7709, "learning_rate": 4.9891985962553606e-05, "epoch": 0.0296, "percentage": 2.96, "elapsed_time": "0:14:58", "remaining_time": "8:10:45", "throughput": 1107.02, "total_tokens": 994288} {"current_steps": 190, "total_steps": 6250, "loss": 0.7, "learning_rate": 4.988607296439458e-05, "epoch": 0.0304, "percentage": 3.04, "elapsed_time": "0:15:26", "remaining_time": "8:12:24", "throughput": 1111.78, "total_tokens": 1029872} {"current_steps": 195, "total_steps": 6250, "loss": 0.8251, "learning_rate": 4.988000277227334e-05, "epoch": 0.0312, "percentage": 3.12, "elapsed_time": "0:15:50", "remaining_time": "8:12:03", "throughput": 1115.99, "total_tokens": 1061072} {"current_steps": 200, "total_steps": 6250, "loss": 0.6707, "learning_rate": 4.987377542453251e-05, "epoch": 0.032, "percentage": 3.2, "elapsed_time": "0:16:13", "remaining_time": "8:10:48", "throughput": 1118.97, "total_tokens": 1089312} {"current_steps": 205, "total_steps": 6250, "loss": 0.7264, "learning_rate": 4.98673909605074e-05, "epoch": 0.0328, "percentage": 3.28, "elapsed_time": "0:16:36", "remaining_time": "8:09:38", "throughput": 1118.42, "total_tokens": 1114272} {"current_steps": 210, "total_steps": 6250, "loss": 0.7906, "learning_rate": 4.9860849420525766e-05, "epoch": 0.0336, "percentage": 3.36, "elapsed_time": "0:16:57", "remaining_time": "8:07:45", "throughput": 1120.2, "total_tokens": 1139808} {"current_steps": 215, "total_steps": 6250, "loss": 0.8062, "learning_rate": 4.985415084590752e-05, "epoch": 0.0344, "percentage": 3.44, "elapsed_time": "0:17:19", "remaining_time": "8:06:31", "throughput": 1118.39, "total_tokens": 1163072} {"current_steps": 220, "total_steps": 6250, "loss": 0.7432, "learning_rate": 4.9847295278964514e-05, "epoch": 0.0352, "percentage": 3.52, "elapsed_time": "0:17:42", "remaining_time": "8:05:19", "throughput": 1123.79, "total_tokens": 1193936} {"current_steps": 225, "total_steps": 6250, "loss": 0.7586, "learning_rate": 4.984028276300021e-05, "epoch": 0.036, "percentage": 3.6, "elapsed_time": "0:18:04", "remaining_time": "8:03:54", "throughput": 1124.9, "total_tokens": 1219696} {"current_steps": 230, "total_steps": 6250, "loss": 0.7532, "learning_rate": 4.98331133423095e-05, "epoch": 0.0368, "percentage": 3.68, "elapsed_time": "0:18:25", "remaining_time": "8:02:21", "throughput": 1128.76, "total_tokens": 1248096} {"current_steps": 235, "total_steps": 6250, "loss": 0.786, "learning_rate": 4.9825787062178315e-05, "epoch": 0.0376, "percentage": 3.76, "elapsed_time": "0:18:58", "remaining_time": "8:05:48", "throughput": 1121.03, "total_tokens": 1276624} {"current_steps": 240, "total_steps": 6250, "loss": 0.7947, "learning_rate": 4.981830396888344e-05, "epoch": 0.0384, "percentage": 3.84, "elapsed_time": "0:19:30", "remaining_time": "8:08:27", "throughput": 1113.74, "total_tokens": 1303472} {"current_steps": 245, "total_steps": 6250, "loss": 0.6988, "learning_rate": 4.981066410969215e-05, "epoch": 0.0392, "percentage": 3.92, "elapsed_time": "0:20:00", "remaining_time": "8:10:27", "throughput": 1105.12, "total_tokens": 1326816} {"current_steps": 250, "total_steps": 6250, "loss": 0.7078, "learning_rate": 4.980286753286195e-05, "epoch": 0.04, "percentage": 4.0, "elapsed_time": "0:20:34", "remaining_time": "8:13:39", "throughput": 1094.68, "total_tokens": 1351008} {"current_steps": 255, "total_steps": 6250, "loss": 0.7491, "learning_rate": 4.979491428764026e-05, "epoch": 0.0408, "percentage": 4.08, "elapsed_time": "0:21:05", "remaining_time": "8:15:47", "throughput": 1086.4, "total_tokens": 1374656} {"current_steps": 260, "total_steps": 6250, "loss": 0.75, "learning_rate": 4.9786804424264085e-05, "epoch": 0.0416, "percentage": 4.16, "elapsed_time": "0:21:42", "remaining_time": "8:20:05", "throughput": 1074.36, "total_tokens": 1399264} {"current_steps": 265, "total_steps": 6250, "loss": 0.798, "learning_rate": 4.977853799395976e-05, "epoch": 0.0424, "percentage": 4.24, "elapsed_time": "0:22:18", "remaining_time": "8:23:42", "throughput": 1062.87, "total_tokens": 1422304} {"current_steps": 270, "total_steps": 6250, "loss": 0.8814, "learning_rate": 4.977011504894252e-05, "epoch": 0.0432, "percentage": 4.32, "elapsed_time": "0:22:47", "remaining_time": "8:24:47", "throughput": 1058.29, "total_tokens": 1447184} {"current_steps": 275, "total_steps": 6250, "loss": 0.7203, "learning_rate": 4.976153564241628e-05, "epoch": 0.044, "percentage": 4.4, "elapsed_time": "0:23:16", "remaining_time": "8:25:48", "throughput": 1055.48, "total_tokens": 1474304} {"current_steps": 280, "total_steps": 6250, "loss": 0.6936, "learning_rate": 4.975279982857324e-05, "epoch": 0.0448, "percentage": 4.48, "elapsed_time": "0:23:48", "remaining_time": "8:27:29", "throughput": 1050.95, "total_tokens": 1500896} {"current_steps": 285, "total_steps": 6250, "loss": 0.7872, "learning_rate": 4.9743907662593524e-05, "epoch": 0.0456, "percentage": 4.56, "elapsed_time": "0:24:18", "remaining_time": "8:28:54", "throughput": 1047.84, "total_tokens": 1528688} {"current_steps": 290, "total_steps": 6250, "loss": 0.7517, "learning_rate": 4.9734859200644905e-05, "epoch": 0.0464, "percentage": 4.64, "elapsed_time": "0:24:43", "remaining_time": "8:28:06", "throughput": 1052.53, "total_tokens": 1561328} {"current_steps": 295, "total_steps": 6250, "loss": 0.6726, "learning_rate": 4.972565449988239e-05, "epoch": 0.0472, "percentage": 4.72, "elapsed_time": "0:25:06", "remaining_time": "8:26:45", "throughput": 1055.0, "total_tokens": 1589088} {"current_steps": 300, "total_steps": 6250, "loss": 0.7259, "learning_rate": 4.971629361844785e-05, "epoch": 0.048, "percentage": 4.8, "elapsed_time": "0:25:33", "remaining_time": "8:26:51", "throughput": 1053.71, "total_tokens": 1615712} {"current_steps": 305, "total_steps": 6250, "loss": 0.8337, "learning_rate": 4.9706776615469716e-05, "epoch": 0.0488, "percentage": 4.88, "elapsed_time": "0:25:54", "remaining_time": "8:25:05", "throughput": 1053.95, "total_tokens": 1638640} {"current_steps": 310, "total_steps": 6250, "loss": 0.731, "learning_rate": 4.9697103551062556e-05, "epoch": 0.0496, "percentage": 4.96, "elapsed_time": "0:26:19", "remaining_time": "8:24:30", "throughput": 1053.51, "total_tokens": 1664304} {"current_steps": 315, "total_steps": 6250, "loss": 0.7285, "learning_rate": 4.968727448632669e-05, "epoch": 0.0504, "percentage": 5.04, "elapsed_time": "0:26:49", "remaining_time": "8:25:20", "throughput": 1054.93, "total_tokens": 1697648} {"current_steps": 320, "total_steps": 6250, "loss": 0.723, "learning_rate": 4.967728948334784e-05, "epoch": 0.0512, "percentage": 5.12, "elapsed_time": "0:27:14", "remaining_time": "8:24:50", "throughput": 1056.29, "total_tokens": 1726608} {"current_steps": 325, "total_steps": 6250, "loss": 0.7918, "learning_rate": 4.96671486051967e-05, "epoch": 0.052, "percentage": 5.2, "elapsed_time": "0:27:36", "remaining_time": "8:23:25", "throughput": 1056.78, "total_tokens": 1750912} {"current_steps": 330, "total_steps": 6250, "loss": 0.6448, "learning_rate": 4.965685191592859e-05, "epoch": 0.0528, "percentage": 5.28, "elapsed_time": "0:27:58", "remaining_time": "8:21:57", "throughput": 1062.0, "total_tokens": 1782912} {"current_steps": 335, "total_steps": 6250, "loss": 0.7874, "learning_rate": 4.964639948058297e-05, "epoch": 0.0536, "percentage": 5.36, "elapsed_time": "0:28:19", "remaining_time": "8:20:11", "throughput": 1061.77, "total_tokens": 1804704} {"current_steps": 340, "total_steps": 6250, "loss": 0.7025, "learning_rate": 4.963579136518312e-05, "epoch": 0.0544, "percentage": 5.44, "elapsed_time": "0:28:57", "remaining_time": "8:23:27", "throughput": 1051.46, "total_tokens": 1827248} {"current_steps": 345, "total_steps": 6250, "loss": 0.6676, "learning_rate": 4.962502763673565e-05, "epoch": 0.0552, "percentage": 5.52, "elapsed_time": "0:30:03", "remaining_time": "8:34:34", "throughput": 1027.96, "total_tokens": 1854304} {"current_steps": 350, "total_steps": 6250, "loss": 0.7774, "learning_rate": 4.9614108363230135e-05, "epoch": 0.056, "percentage": 5.6, "elapsed_time": "0:31:04", "remaining_time": "8:43:45", "throughput": 1007.8, "total_tokens": 1878768} {"current_steps": 355, "total_steps": 6250, "loss": 0.7641, "learning_rate": 4.9603033613638626e-05, "epoch": 0.0568, "percentage": 5.68, "elapsed_time": "0:32:18", "remaining_time": "8:56:22", "throughput": 983.33, "total_tokens": 1905744} {"current_steps": 360, "total_steps": 6250, "loss": 0.7169, "learning_rate": 4.959180345791528e-05, "epoch": 0.0576, "percentage": 5.76, "elapsed_time": "0:33:35", "remaining_time": "9:09:28", "throughput": 958.48, "total_tokens": 1931392} {"current_steps": 365, "total_steps": 6250, "loss": 0.7033, "learning_rate": 4.958041796699583e-05, "epoch": 0.0584, "percentage": 5.84, "elapsed_time": "0:34:45", "remaining_time": "9:20:27", "throughput": 937.03, "total_tokens": 1954304} {"current_steps": 370, "total_steps": 6250, "loss": 0.6569, "learning_rate": 4.956887721279726e-05, "epoch": 0.0592, "percentage": 5.92, "elapsed_time": "0:36:10", "remaining_time": "9:34:53", "throughput": 915.58, "total_tokens": 1987264} {"current_steps": 375, "total_steps": 6250, "loss": 0.7809, "learning_rate": 4.9557181268217227e-05, "epoch": 0.06, "percentage": 6.0, "elapsed_time": "0:37:35", "remaining_time": "9:49:00", "throughput": 891.11, "total_tokens": 2010160} {"current_steps": 380, "total_steps": 6250, "loss": 0.811, "learning_rate": 4.9545330207133664e-05, "epoch": 0.0608, "percentage": 6.08, "elapsed_time": "0:38:53", "remaining_time": "10:00:44", "throughput": 873.78, "total_tokens": 2038880} {"current_steps": 385, "total_steps": 6250, "loss": 0.825, "learning_rate": 4.953332410440435e-05, "epoch": 0.0616, "percentage": 6.16, "elapsed_time": "0:39:19", "remaining_time": "9:59:05", "throughput": 875.3, "total_tokens": 2065344} {"current_steps": 390, "total_steps": 6250, "loss": 0.7479, "learning_rate": 4.952116303586631e-05, "epoch": 0.0624, "percentage": 6.24, "elapsed_time": "0:39:54", "remaining_time": "9:59:31", "throughput": 873.87, "total_tokens": 2092064} {"current_steps": 395, "total_steps": 6250, "loss": 0.7246, "learning_rate": 4.9508847078335495e-05, "epoch": 0.0632, "percentage": 6.32, "elapsed_time": "0:40:20", "remaining_time": "9:58:02", "throughput": 875.48, "total_tokens": 2119360} {"current_steps": 400, "total_steps": 6250, "loss": 0.6956, "learning_rate": 4.949637630960617e-05, "epoch": 0.064, "percentage": 6.4, "elapsed_time": "0:40:45", "remaining_time": "9:56:00", "throughput": 877.89, "total_tokens": 2146560} {"current_steps": 405, "total_steps": 6250, "loss": 0.7315, "learning_rate": 4.94837508084505e-05, "epoch": 0.0648, "percentage": 6.48, "elapsed_time": "0:41:08", "remaining_time": "9:53:43", "throughput": 878.82, "total_tokens": 2169232} {"current_steps": 410, "total_steps": 6250, "loss": 0.7075, "learning_rate": 4.947097065461801e-05, "epoch": 0.0656, "percentage": 6.56, "elapsed_time": "0:41:29", "remaining_time": "9:51:02", "throughput": 880.54, "total_tokens": 2192224} {"current_steps": 415, "total_steps": 6250, "loss": 0.811, "learning_rate": 4.945803592883509e-05, "epoch": 0.0664, "percentage": 6.64, "elapsed_time": "0:41:54", "remaining_time": "9:49:20", "throughput": 881.46, "total_tokens": 2216784} {"current_steps": 420, "total_steps": 6250, "loss": 0.7835, "learning_rate": 4.9444946712804494e-05, "epoch": 0.0672, "percentage": 6.72, "elapsed_time": "0:42:19", "remaining_time": "9:47:26", "throughput": 883.39, "total_tokens": 2243120} {"current_steps": 425, "total_steps": 6250, "loss": 0.7211, "learning_rate": 4.943170308920484e-05, "epoch": 0.068, "percentage": 6.8, "elapsed_time": "0:42:46", "remaining_time": "9:46:22", "throughput": 884.66, "total_tokens": 2270896} {"current_steps": 430, "total_steps": 6250, "loss": 0.72, "learning_rate": 4.941830514169004e-05, "epoch": 0.0688, "percentage": 6.88, "elapsed_time": "0:43:34", "remaining_time": "9:49:51", "throughput": 879.04, "total_tokens": 2298528} {"current_steps": 435, "total_steps": 6250, "loss": 0.7206, "learning_rate": 4.9404752954888824e-05, "epoch": 0.0696, "percentage": 6.96, "elapsed_time": "0:44:08", "remaining_time": "9:50:10", "throughput": 878.88, "total_tokens": 2328080} {"current_steps": 440, "total_steps": 6250, "loss": 0.8018, "learning_rate": 4.939104661440415e-05, "epoch": 0.0704, "percentage": 7.04, "elapsed_time": "0:44:44", "remaining_time": "9:50:53", "throughput": 877.41, "total_tokens": 2355776} {"current_steps": 445, "total_steps": 6250, "loss": 0.8267, "learning_rate": 4.937718620681273e-05, "epoch": 0.0712, "percentage": 7.12, "elapsed_time": "0:45:16", "remaining_time": "9:50:41", "throughput": 875.65, "total_tokens": 2379056} {"current_steps": 450, "total_steps": 6250, "loss": 0.8961, "learning_rate": 4.9363171819664434e-05, "epoch": 0.072, "percentage": 7.2, "elapsed_time": "0:45:49", "remaining_time": "9:50:40", "throughput": 873.44, "total_tokens": 2401664} {"current_steps": 455, "total_steps": 6250, "loss": 0.6942, "learning_rate": 4.934900354148173e-05, "epoch": 0.0728, "percentage": 7.28, "elapsed_time": "0:46:24", "remaining_time": "9:51:07", "throughput": 871.69, "total_tokens": 2427456} {"current_steps": 460, "total_steps": 6250, "loss": 0.7874, "learning_rate": 4.933468146175918e-05, "epoch": 0.0736, "percentage": 7.36, "elapsed_time": "0:46:55", "remaining_time": "9:50:38", "throughput": 870.45, "total_tokens": 2450752} {"current_steps": 465, "total_steps": 6250, "loss": 0.7162, "learning_rate": 4.9320205670962814e-05, "epoch": 0.0744, "percentage": 7.44, "elapsed_time": "0:47:24", "remaining_time": "9:49:52", "throughput": 869.58, "total_tokens": 2473856} {"current_steps": 470, "total_steps": 6250, "loss": 0.7434, "learning_rate": 4.9305576260529607e-05, "epoch": 0.0752, "percentage": 7.52, "elapsed_time": "0:47:56", "remaining_time": "9:49:35", "throughput": 870.11, "total_tokens": 2502928} {"current_steps": 475, "total_steps": 6250, "loss": 0.6932, "learning_rate": 4.929079332286685e-05, "epoch": 0.076, "percentage": 7.6, "elapsed_time": "0:48:34", "remaining_time": "9:50:36", "throughput": 870.13, "total_tokens": 2536144} {"current_steps": 480, "total_steps": 6250, "loss": 0.8053, "learning_rate": 4.927585695135162e-05, "epoch": 0.0768, "percentage": 7.68, "elapsed_time": "0:49:07", "remaining_time": "9:50:29", "throughput": 869.49, "total_tokens": 2562688} {"current_steps": 485, "total_steps": 6250, "loss": 0.7482, "learning_rate": 4.926076724033016e-05, "epoch": 0.0776, "percentage": 7.76, "elapsed_time": "0:49:43", "remaining_time": "9:51:00", "throughput": 869.68, "total_tokens": 2594480} {"current_steps": 490, "total_steps": 6250, "loss": 0.7075, "learning_rate": 4.9245524285117274e-05, "epoch": 0.0784, "percentage": 7.84, "elapsed_time": "0:50:17", "remaining_time": "9:51:15", "throughput": 869.74, "total_tokens": 2624736} {"current_steps": 495, "total_steps": 6250, "loss": 0.6132, "learning_rate": 4.923012818199576e-05, "epoch": 0.0792, "percentage": 7.92, "elapsed_time": "0:50:45", "remaining_time": "9:50:09", "throughput": 869.73, "total_tokens": 2648880} {"current_steps": 500, "total_steps": 6250, "loss": 0.6679, "learning_rate": 4.9214579028215776e-05, "epoch": 0.08, "percentage": 8.0, "elapsed_time": "0:51:16", "remaining_time": "9:49:44", "throughput": 869.66, "total_tokens": 2675888} {"current_steps": 505, "total_steps": 6250, "loss": 0.7016, "learning_rate": 4.919887692199423e-05, "epoch": 0.0808, "percentage": 8.08, "elapsed_time": "0:51:45", "remaining_time": "9:48:52", "throughput": 869.13, "total_tokens": 2699392} {"current_steps": 510, "total_steps": 6250, "loss": 0.7216, "learning_rate": 4.918302196251415e-05, "epoch": 0.0816, "percentage": 8.16, "elapsed_time": "0:52:18", "remaining_time": "9:48:43", "throughput": 868.7, "total_tokens": 2726432} {"current_steps": 515, "total_steps": 6250, "loss": 0.6602, "learning_rate": 4.9167014249924075e-05, "epoch": 0.0824, "percentage": 8.24, "elapsed_time": "0:52:53", "remaining_time": "9:48:59", "throughput": 868.55, "total_tokens": 2756336} {"current_steps": 520, "total_steps": 6250, "loss": 0.6956, "learning_rate": 4.9150853885337426e-05, "epoch": 0.0832, "percentage": 8.32, "elapsed_time": "0:53:26", "remaining_time": "9:48:55", "throughput": 867.45, "total_tokens": 2781648} {"current_steps": 525, "total_steps": 6250, "loss": 0.6427, "learning_rate": 4.913454097083185e-05, "epoch": 0.084, "percentage": 8.4, "elapsed_time": "0:54:00", "remaining_time": "9:48:53", "throughput": 867.35, "total_tokens": 2810336} {"current_steps": 530, "total_steps": 6250, "loss": 0.8328, "learning_rate": 4.911807560944858e-05, "epoch": 0.0848, "percentage": 8.48, "elapsed_time": "0:54:35", "remaining_time": "9:49:15", "throughput": 865.84, "total_tokens": 2836432} {"current_steps": 535, "total_steps": 6250, "loss": 0.8104, "learning_rate": 4.9101457905191774e-05, "epoch": 0.0856, "percentage": 8.56, "elapsed_time": "0:55:07", "remaining_time": "9:48:55", "throughput": 865.7, "total_tokens": 2863616} {"current_steps": 540, "total_steps": 6250, "loss": 0.6858, "learning_rate": 4.9084687963027894e-05, "epoch": 0.0864, "percentage": 8.64, "elapsed_time": "0:55:41", "remaining_time": "9:48:50", "throughput": 865.33, "total_tokens": 2891264} {"current_steps": 545, "total_steps": 6250, "loss": 0.7271, "learning_rate": 4.906776588888502e-05, "epoch": 0.0872, "percentage": 8.72, "elapsed_time": "0:56:12", "remaining_time": "9:48:21", "throughput": 864.76, "total_tokens": 2916256} {"current_steps": 550, "total_steps": 6250, "loss": 0.7527, "learning_rate": 4.905069178965215e-05, "epoch": 0.088, "percentage": 8.8, "elapsed_time": "0:56:45", "remaining_time": "9:48:10", "throughput": 864.58, "total_tokens": 2944112} {"current_steps": 555, "total_steps": 6250, "loss": 0.7341, "learning_rate": 4.903346577317859e-05, "epoch": 0.0888, "percentage": 8.88, "elapsed_time": "0:57:14", "remaining_time": "9:47:19", "throughput": 865.55, "total_tokens": 2972512} {"current_steps": 560, "total_steps": 6250, "loss": 0.7339, "learning_rate": 4.90160879482732e-05, "epoch": 0.0896, "percentage": 8.96, "elapsed_time": "0:57:44", "remaining_time": "9:46:38", "throughput": 865.18, "total_tokens": 2997168} {"current_steps": 565, "total_steps": 6250, "loss": 0.768, "learning_rate": 4.89985584247038e-05, "epoch": 0.0904, "percentage": 9.04, "elapsed_time": "0:58:15", "remaining_time": "9:46:07", "throughput": 864.33, "total_tokens": 3020880} {"current_steps": 570, "total_steps": 6250, "loss": 0.7014, "learning_rate": 4.898087731319636e-05, "epoch": 0.0912, "percentage": 9.12, "elapsed_time": "0:58:43", "remaining_time": "9:45:15", "throughput": 863.86, "total_tokens": 3044224} {"current_steps": 575, "total_steps": 6250, "loss": 0.6203, "learning_rate": 4.89630447254344e-05, "epoch": 0.092, "percentage": 9.2, "elapsed_time": "0:59:14", "remaining_time": "9:44:39", "throughput": 864.22, "total_tokens": 3071680} {"current_steps": 580, "total_steps": 6250, "loss": 0.7461, "learning_rate": 4.894506077405824e-05, "epoch": 0.0928, "percentage": 9.28, "elapsed_time": "0:59:45", "remaining_time": "9:44:14", "throughput": 864.27, "total_tokens": 3099088} {"current_steps": 585, "total_steps": 6250, "loss": 0.7357, "learning_rate": 4.892692557266429e-05, "epoch": 0.0936, "percentage": 9.36, "elapsed_time": "1:00:20", "remaining_time": "9:44:15", "throughput": 864.0, "total_tokens": 3127728} {"current_steps": 590, "total_steps": 6250, "loss": 0.7819, "learning_rate": 4.8908639235804324e-05, "epoch": 0.0944, "percentage": 9.44, "elapsed_time": "1:00:48", "remaining_time": "9:43:25", "throughput": 864.45, "total_tokens": 3154336} {"current_steps": 595, "total_steps": 6250, "loss": 0.7121, "learning_rate": 4.8890201878984796e-05, "epoch": 0.0952, "percentage": 9.52, "elapsed_time": "1:01:17", "remaining_time": "9:42:35", "throughput": 864.3, "total_tokens": 3178768} {"current_steps": 600, "total_steps": 6250, "loss": 0.6698, "learning_rate": 4.887161361866608e-05, "epoch": 0.096, "percentage": 9.6, "elapsed_time": "1:01:52", "remaining_time": "9:42:42", "throughput": 865.1, "total_tokens": 3211968} {"current_steps": 605, "total_steps": 6250, "loss": 0.7606, "learning_rate": 4.885287457226172e-05, "epoch": 0.0968, "percentage": 9.68, "elapsed_time": "1:02:23", "remaining_time": "9:42:07", "throughput": 865.07, "total_tokens": 3238272} {"current_steps": 610, "total_steps": 6250, "loss": 0.7694, "learning_rate": 4.8833984858137715e-05, "epoch": 0.0976, "percentage": 9.76, "elapsed_time": "1:02:57", "remaining_time": "9:42:08", "throughput": 865.65, "total_tokens": 3270208} {"current_steps": 615, "total_steps": 6250, "loss": 0.7227, "learning_rate": 4.8814944595611776e-05, "epoch": 0.0984, "percentage": 9.84, "elapsed_time": "1:03:30", "remaining_time": "9:41:53", "throughput": 865.05, "total_tokens": 3296192} {"current_steps": 620, "total_steps": 6250, "loss": 0.7275, "learning_rate": 4.8795753904952534e-05, "epoch": 0.0992, "percentage": 9.92, "elapsed_time": "1:04:02", "remaining_time": "9:41:32", "throughput": 864.34, "total_tokens": 3321232} {"current_steps": 625, "total_steps": 6250, "loss": 0.6746, "learning_rate": 4.877641290737884e-05, "epoch": 0.1, "percentage": 10.0, "elapsed_time": "1:04:33", "remaining_time": "9:40:59", "throughput": 863.34, "total_tokens": 3343984} {"current_steps": 630, "total_steps": 6250, "loss": 0.8223, "learning_rate": 4.8756921725058934e-05, "epoch": 0.1008, "percentage": 10.08, "elapsed_time": "1:05:09", "remaining_time": "9:41:18", "throughput": 861.36, "total_tokens": 3367824} {"current_steps": 635, "total_steps": 6250, "loss": 0.8487, "learning_rate": 4.8737280481109724e-05, "epoch": 0.1016, "percentage": 10.16, "elapsed_time": "1:05:41", "remaining_time": "9:40:54", "throughput": 861.25, "total_tokens": 3394800} {"current_steps": 640, "total_steps": 6250, "loss": 0.7441, "learning_rate": 4.871748929959598e-05, "epoch": 0.1024, "percentage": 10.24, "elapsed_time": "1:06:11", "remaining_time": "9:40:16", "throughput": 861.39, "total_tokens": 3421360} {"current_steps": 645, "total_steps": 6250, "loss": 0.7631, "learning_rate": 4.869754830552956e-05, "epoch": 0.1032, "percentage": 10.32, "elapsed_time": "1:06:42", "remaining_time": "9:39:41", "throughput": 861.85, "total_tokens": 3449584} {"current_steps": 650, "total_steps": 6250, "loss": 0.7793, "learning_rate": 4.867745762486861e-05, "epoch": 0.104, "percentage": 10.4, "elapsed_time": "1:07:16", "remaining_time": "9:39:33", "throughput": 861.51, "total_tokens": 3477168} {"current_steps": 655, "total_steps": 6250, "loss": 0.7415, "learning_rate": 4.86572173845168e-05, "epoch": 0.1048, "percentage": 10.48, "elapsed_time": "1:07:48", "remaining_time": "9:39:16", "throughput": 861.42, "total_tokens": 3505056} {"current_steps": 660, "total_steps": 6250, "loss": 0.7157, "learning_rate": 4.863682771232248e-05, "epoch": 0.1056, "percentage": 10.56, "elapsed_time": "1:08:18", "remaining_time": "9:38:34", "throughput": 862.38, "total_tokens": 3534576} {"current_steps": 665, "total_steps": 6250, "loss": 0.7287, "learning_rate": 4.861628873707792e-05, "epoch": 0.1064, "percentage": 10.64, "elapsed_time": "1:08:50", "remaining_time": "9:38:09", "throughput": 862.07, "total_tokens": 3560688} {"current_steps": 670, "total_steps": 6250, "loss": 0.7351, "learning_rate": 4.859560058851844e-05, "epoch": 0.1072, "percentage": 10.72, "elapsed_time": "1:09:18", "remaining_time": "9:37:14", "throughput": 862.35, "total_tokens": 3586176} {"current_steps": 675, "total_steps": 6250, "loss": 0.6213, "learning_rate": 4.8574763397321614e-05, "epoch": 0.108, "percentage": 10.8, "elapsed_time": "1:09:49", "remaining_time": "9:36:45", "throughput": 862.9, "total_tokens": 3615472} {"current_steps": 680, "total_steps": 6250, "loss": 0.729, "learning_rate": 4.855377729510648e-05, "epoch": 0.1088, "percentage": 10.88, "elapsed_time": "1:10:19", "remaining_time": "9:36:01", "throughput": 862.27, "total_tokens": 3638256} {"current_steps": 685, "total_steps": 6250, "loss": 0.7242, "learning_rate": 4.8532642414432674e-05, "epoch": 0.1096, "percentage": 10.96, "elapsed_time": "1:10:54", "remaining_time": "9:36:01", "throughput": 862.18, "total_tokens": 3667824} {"current_steps": 690, "total_steps": 6250, "loss": 0.7831, "learning_rate": 4.851135888879958e-05, "epoch": 0.1104, "percentage": 11.04, "elapsed_time": "1:11:27", "remaining_time": "9:35:47", "throughput": 861.93, "total_tokens": 3695408} {"current_steps": 695, "total_steps": 6250, "loss": 0.7181, "learning_rate": 4.8489926852645505e-05, "epoch": 0.1112, "percentage": 11.12, "elapsed_time": "1:11:56", "remaining_time": "9:35:04", "throughput": 861.69, "total_tokens": 3719888} {"current_steps": 700, "total_steps": 6250, "loss": 0.7961, "learning_rate": 4.846834644134686e-05, "epoch": 0.112, "percentage": 11.2, "elapsed_time": "1:12:26", "remaining_time": "9:34:24", "throughput": 861.42, "total_tokens": 3744512} {"current_steps": 705, "total_steps": 6250, "loss": 0.8362, "learning_rate": 4.844661779121722e-05, "epoch": 0.1128, "percentage": 11.28, "elapsed_time": "1:13:00", "remaining_time": "9:34:16", "throughput": 861.02, "total_tokens": 3771968} {"current_steps": 710, "total_steps": 6250, "loss": 0.7645, "learning_rate": 4.8424741039506575e-05, "epoch": 0.1136, "percentage": 11.36, "elapsed_time": "1:13:33", "remaining_time": "9:34:01", "throughput": 861.28, "total_tokens": 3801680} {"current_steps": 715, "total_steps": 6250, "loss": 0.7042, "learning_rate": 4.840271632440038e-05, "epoch": 0.1144, "percentage": 11.44, "elapsed_time": "1:14:06", "remaining_time": "9:33:44", "throughput": 862.17, "total_tokens": 3833952} {"current_steps": 720, "total_steps": 6250, "loss": 0.7476, "learning_rate": 4.8380543785018677e-05, "epoch": 0.1152, "percentage": 11.52, "elapsed_time": "1:14:38", "remaining_time": "9:33:14", "throughput": 862.0, "total_tokens": 3860144} {"current_steps": 725, "total_steps": 6250, "loss": 0.7415, "learning_rate": 4.8358223561415304e-05, "epoch": 0.116, "percentage": 11.6, "elapsed_time": "1:15:10", "remaining_time": "9:32:53", "throughput": 862.5, "total_tokens": 3890304} {"current_steps": 730, "total_steps": 6250, "loss": 0.6717, "learning_rate": 4.833575579457691e-05, "epoch": 0.1168, "percentage": 11.68, "elapsed_time": "1:15:43", "remaining_time": "9:32:35", "throughput": 861.59, "total_tokens": 3914560} {"current_steps": 735, "total_steps": 6250, "loss": 0.7545, "learning_rate": 4.8313140626422125e-05, "epoch": 0.1176, "percentage": 11.76, "elapsed_time": "1:16:12", "remaining_time": "9:31:51", "throughput": 861.66, "total_tokens": 3940128} {"current_steps": 740, "total_steps": 6250, "loss": 0.7809, "learning_rate": 4.829037819980065e-05, "epoch": 0.1184, "percentage": 11.84, "elapsed_time": "1:16:44", "remaining_time": "9:31:28", "throughput": 862.25, "total_tokens": 3970608} {"current_steps": 745, "total_steps": 6250, "loss": 0.7904, "learning_rate": 4.8267468658492335e-05, "epoch": 0.1192, "percentage": 11.92, "elapsed_time": "1:17:18", "remaining_time": "9:31:16", "throughput": 861.65, "total_tokens": 3996960} {"current_steps": 750, "total_steps": 6250, "loss": 0.7688, "learning_rate": 4.8244412147206284e-05, "epoch": 0.12, "percentage": 12.0, "elapsed_time": "1:17:54", "remaining_time": "9:31:17", "throughput": 860.36, "total_tokens": 4021488} {"current_steps": 755, "total_steps": 6250, "loss": 0.7819, "learning_rate": 4.822120881157998e-05, "epoch": 0.1208, "percentage": 12.08, "elapsed_time": "1:18:27", "remaining_time": "9:31:02", "throughput": 859.69, "total_tokens": 4047136} {"current_steps": 760, "total_steps": 6250, "loss": 0.6757, "learning_rate": 4.819785879817827e-05, "epoch": 0.1216, "percentage": 12.16, "elapsed_time": "1:19:04", "remaining_time": "9:31:14", "throughput": 858.27, "total_tokens": 4072256} {"current_steps": 765, "total_steps": 6250, "loss": 0.8952, "learning_rate": 4.817436225449255e-05, "epoch": 0.1224, "percentage": 12.24, "elapsed_time": "1:19:37", "remaining_time": "9:30:52", "throughput": 857.26, "total_tokens": 4095328} {"current_steps": 770, "total_steps": 6250, "loss": 0.6998, "learning_rate": 4.8150719328939755e-05, "epoch": 0.1232, "percentage": 12.32, "elapsed_time": "1:20:09", "remaining_time": "9:30:28", "throughput": 856.41, "total_tokens": 4118896} {"current_steps": 775, "total_steps": 6250, "loss": 0.7675, "learning_rate": 4.812693017086145e-05, "epoch": 0.124, "percentage": 12.4, "elapsed_time": "1:20:40", "remaining_time": "9:29:55", "throughput": 856.24, "total_tokens": 4144576} {"current_steps": 780, "total_steps": 6250, "loss": 0.7332, "learning_rate": 4.810299493052289e-05, "epoch": 0.1248, "percentage": 12.48, "elapsed_time": "1:21:21", "remaining_time": "9:30:30", "throughput": 854.81, "total_tokens": 4172448} {"current_steps": 785, "total_steps": 6250, "loss": 0.6942, "learning_rate": 4.8078913759112066e-05, "epoch": 0.1256, "percentage": 12.56, "elapsed_time": "1:21:54", "remaining_time": "9:30:14", "throughput": 853.8, "total_tokens": 4196032} {"current_steps": 790, "total_steps": 6250, "loss": 0.7536, "learning_rate": 4.805468680873874e-05, "epoch": 0.1264, "percentage": 12.64, "elapsed_time": "1:22:32", "remaining_time": "9:30:29", "throughput": 852.94, "total_tokens": 4224320} {"current_steps": 795, "total_steps": 6250, "loss": 0.6722, "learning_rate": 4.803031423243349e-05, "epoch": 0.1272, "percentage": 12.72, "elapsed_time": "1:23:09", "remaining_time": "9:30:35", "throughput": 852.35, "total_tokens": 4252752} {"current_steps": 800, "total_steps": 6250, "loss": 0.7651, "learning_rate": 4.800579618414676e-05, "epoch": 0.128, "percentage": 12.8, "elapsed_time": "1:23:41", "remaining_time": "9:30:06", "throughput": 852.08, "total_tokens": 4278480} {"current_steps": 805, "total_steps": 6250, "loss": 0.6626, "learning_rate": 4.7981132818747876e-05, "epoch": 0.1288, "percentage": 12.88, "elapsed_time": "1:24:14", "remaining_time": "9:29:47", "throughput": 851.91, "total_tokens": 4305920} {"current_steps": 810, "total_steps": 6250, "loss": 0.8511, "learning_rate": 4.795632429202405e-05, "epoch": 0.1296, "percentage": 12.96, "elapsed_time": "1:24:48", "remaining_time": "9:29:36", "throughput": 850.98, "total_tokens": 4330448} {"current_steps": 815, "total_steps": 6250, "loss": 0.7524, "learning_rate": 4.793137076067942e-05, "epoch": 0.1304, "percentage": 13.04, "elapsed_time": "1:25:19", "remaining_time": "9:28:57", "throughput": 851.11, "total_tokens": 4356880} {"current_steps": 820, "total_steps": 6250, "loss": 0.8498, "learning_rate": 4.790627238233405e-05, "epoch": 0.1312, "percentage": 13.12, "elapsed_time": "1:25:49", "remaining_time": "9:28:19", "throughput": 851.31, "total_tokens": 4383744} {"current_steps": 825, "total_steps": 6250, "loss": 0.647, "learning_rate": 4.788102931552294e-05, "epoch": 0.132, "percentage": 13.2, "elapsed_time": "1:26:23", "remaining_time": "9:28:05", "throughput": 850.98, "total_tokens": 4411120} {"current_steps": 830, "total_steps": 6250, "loss": 0.7766, "learning_rate": 4.7855641719695023e-05, "epoch": 0.1328, "percentage": 13.28, "elapsed_time": "1:26:54", "remaining_time": "9:27:30", "throughput": 850.71, "total_tokens": 4435920} {"current_steps": 835, "total_steps": 6250, "loss": 0.7426, "learning_rate": 4.783010975521216e-05, "epoch": 0.1336, "percentage": 13.36, "elapsed_time": "1:27:50", "remaining_time": "9:29:41", "throughput": 846.69, "total_tokens": 4462768} {"current_steps": 840, "total_steps": 6250, "loss": 0.6919, "learning_rate": 4.78044335833481e-05, "epoch": 0.1344, "percentage": 13.44, "elapsed_time": "1:28:23", "remaining_time": "9:29:19", "throughput": 847.17, "total_tokens": 4493232} {"current_steps": 845, "total_steps": 6250, "loss": 0.7221, "learning_rate": 4.7778613366287505e-05, "epoch": 0.1352, "percentage": 13.52, "elapsed_time": "1:28:46", "remaining_time": "9:27:53", "throughput": 848.53, "total_tokens": 4520048} {"current_steps": 850, "total_steps": 6250, "loss": 0.7344, "learning_rate": 4.775264926712489e-05, "epoch": 0.136, "percentage": 13.6, "elapsed_time": "1:30:15", "remaining_time": "9:33:24", "throughput": 839.43, "total_tokens": 4545984} {"current_steps": 855, "total_steps": 6250, "loss": 0.6648, "learning_rate": 4.772654144986364e-05, "epoch": 0.1368, "percentage": 13.68, "elapsed_time": "1:40:22", "remaining_time": "10:33:24", "throughput": 759.98, "total_tokens": 4577296} {"current_steps": 860, "total_steps": 6250, "loss": 0.7513, "learning_rate": 4.7700290079414896e-05, "epoch": 0.1376, "percentage": 13.76, "elapsed_time": "1:42:18", "remaining_time": "10:41:11", "throughput": 749.77, "total_tokens": 4602272} {"current_steps": 865, "total_steps": 6250, "loss": 0.7792, "learning_rate": 4.767389532159659e-05, "epoch": 0.1384, "percentage": 13.84, "elapsed_time": "1:42:52", "remaining_time": "10:40:25", "throughput": 750.29, "total_tokens": 4631008} {"current_steps": 870, "total_steps": 6250, "loss": 0.7529, "learning_rate": 4.764735734313236e-05, "epoch": 0.1392, "percentage": 13.92, "elapsed_time": "1:43:24", "remaining_time": "10:39:30", "throughput": 751.05, "total_tokens": 4660112} {"current_steps": 875, "total_steps": 6250, "loss": 0.6728, "learning_rate": 4.762067631165049e-05, "epoch": 0.14, "percentage": 14.0, "elapsed_time": "1:43:59", "remaining_time": "10:38:48", "throughput": 751.59, "total_tokens": 4689504} {"current_steps": 880, "total_steps": 6250, "loss": 0.6935, "learning_rate": 4.759385239568289e-05, "epoch": 0.1408, "percentage": 14.08, "elapsed_time": "1:44:33", "remaining_time": "10:38:01", "throughput": 751.64, "total_tokens": 4715312} {"current_steps": 885, "total_steps": 6250, "loss": 0.8062, "learning_rate": 4.756688576466398e-05, "epoch": 0.1416, "percentage": 14.16, "elapsed_time": "1:45:04", "remaining_time": "10:36:58", "throughput": 751.2, "total_tokens": 4735936} {"current_steps": 890, "total_steps": 6250, "loss": 0.7149, "learning_rate": 4.753977658892967e-05, "epoch": 0.1424, "percentage": 14.24, "elapsed_time": "1:45:37", "remaining_time": "10:36:04", "throughput": 751.18, "total_tokens": 4760256} {"current_steps": 895, "total_steps": 6250, "loss": 0.7062, "learning_rate": 4.751252503971624e-05, "epoch": 0.1432, "percentage": 14.32, "elapsed_time": "1:46:11", "remaining_time": "10:35:20", "throughput": 751.71, "total_tokens": 4789264} {"current_steps": 900, "total_steps": 6250, "loss": 0.837, "learning_rate": 4.7485131289159276e-05, "epoch": 0.144, "percentage": 14.4, "elapsed_time": "1:46:44", "remaining_time": "10:34:33", "throughput": 751.82, "total_tokens": 4815344} {"current_steps": 905, "total_steps": 6250, "loss": 0.6907, "learning_rate": 4.745759551029261e-05, "epoch": 0.1448, "percentage": 14.48, "elapsed_time": "1:47:21", "remaining_time": "10:34:03", "throughput": 751.47, "total_tokens": 4840528} {"current_steps": 910, "total_steps": 6250, "loss": 0.7192, "learning_rate": 4.742991787704719e-05, "epoch": 0.1456, "percentage": 14.56, "elapsed_time": "1:47:52", "remaining_time": "10:33:02", "throughput": 752.08, "total_tokens": 4868032} {"current_steps": 915, "total_steps": 6250, "loss": 0.7223, "learning_rate": 4.7402098564249974e-05, "epoch": 0.1464, "percentage": 14.64, "elapsed_time": "1:48:25", "remaining_time": "10:32:09", "throughput": 752.21, "total_tokens": 4893376} {"current_steps": 920, "total_steps": 6250, "loss": 0.6847, "learning_rate": 4.737413774762287e-05, "epoch": 0.1472, "percentage": 14.72, "elapsed_time": "1:48:56", "remaining_time": "10:31:08", "throughput": 752.44, "total_tokens": 4918288} {"current_steps": 925, "total_steps": 6250, "loss": 0.7273, "learning_rate": 4.73460356037816e-05, "epoch": 0.148, "percentage": 14.8, "elapsed_time": "1:49:31", "remaining_time": "10:30:31", "throughput": 752.42, "total_tokens": 4944688} {"current_steps": 930, "total_steps": 6250, "loss": 0.7087, "learning_rate": 4.731779231023456e-05, "epoch": 0.1488, "percentage": 14.88, "elapsed_time": "1:50:03", "remaining_time": "10:29:37", "throughput": 752.54, "total_tokens": 4969744} {"current_steps": 935, "total_steps": 6250, "loss": 0.7771, "learning_rate": 4.728940804538176e-05, "epoch": 0.1496, "percentage": 14.96, "elapsed_time": "1:50:35", "remaining_time": "10:28:37", "throughput": 753.12, "total_tokens": 4997072} {"current_steps": 940, "total_steps": 6250, "loss": 0.7598, "learning_rate": 4.7260882988513624e-05, "epoch": 0.1504, "percentage": 15.04, "elapsed_time": "1:51:07", "remaining_time": "10:27:46", "throughput": 753.57, "total_tokens": 5024672} {"current_steps": 945, "total_steps": 6250, "loss": 0.7961, "learning_rate": 4.723221731980993e-05, "epoch": 0.1512, "percentage": 15.12, "elapsed_time": "1:51:40", "remaining_time": "10:26:56", "throughput": 753.94, "total_tokens": 5051952} {"current_steps": 950, "total_steps": 6250, "loss": 0.773, "learning_rate": 4.720341122033862e-05, "epoch": 0.152, "percentage": 15.2, "elapsed_time": "1:52:11", "remaining_time": "10:25:55", "throughput": 753.82, "total_tokens": 5074528} {"current_steps": 955, "total_steps": 6250, "loss": 0.7216, "learning_rate": 4.717446487205466e-05, "epoch": 0.1528, "percentage": 15.28, "elapsed_time": "1:52:42", "remaining_time": "10:24:56", "throughput": 754.1, "total_tokens": 5099840} {"current_steps": 960, "total_steps": 6250, "loss": 0.6569, "learning_rate": 4.714537845779894e-05, "epoch": 0.1536, "percentage": 15.36, "elapsed_time": "1:53:14", "remaining_time": "10:23:59", "throughput": 753.98, "total_tokens": 5122848} {"current_steps": 965, "total_steps": 6250, "loss": 0.7994, "learning_rate": 4.7116152161297045e-05, "epoch": 0.1544, "percentage": 15.44, "elapsed_time": "1:53:48", "remaining_time": "10:23:19", "throughput": 754.5, "total_tokens": 5152320} {"current_steps": 970, "total_steps": 6250, "loss": 0.7259, "learning_rate": 4.708678616715815e-05, "epoch": 0.1552, "percentage": 15.52, "elapsed_time": "1:54:20", "remaining_time": "10:22:23", "throughput": 754.87, "total_tokens": 5178816} {"current_steps": 975, "total_steps": 6250, "loss": 0.747, "learning_rate": 4.7057280660873835e-05, "epoch": 0.156, "percentage": 15.6, "elapsed_time": "1:54:53", "remaining_time": "10:21:32", "throughput": 755.56, "total_tokens": 5208112} {"current_steps": 980, "total_steps": 6250, "loss": 0.8487, "learning_rate": 4.702763582881692e-05, "epoch": 0.1568, "percentage": 15.68, "elapsed_time": "1:55:26", "remaining_time": "10:20:50", "throughput": 755.19, "total_tokens": 5231200} {"current_steps": 985, "total_steps": 6250, "loss": 0.7654, "learning_rate": 4.699785185824026e-05, "epoch": 0.1576, "percentage": 15.76, "elapsed_time": "1:55:59", "remaining_time": "10:20:01", "throughput": 755.38, "total_tokens": 5257312} {"current_steps": 990, "total_steps": 6250, "loss": 0.7748, "learning_rate": 4.696792893727562e-05, "epoch": 0.1584, "percentage": 15.84, "elapsed_time": "1:56:32", "remaining_time": "10:19:10", "throughput": 755.16, "total_tokens": 5280288} {"current_steps": 995, "total_steps": 6250, "loss": 0.6957, "learning_rate": 4.693786725493242e-05, "epoch": 0.1592, "percentage": 15.92, "elapsed_time": "1:57:07", "remaining_time": "10:18:36", "throughput": 755.33, "total_tokens": 5308272} {"current_steps": 1000, "total_steps": 6250, "loss": 0.7418, "learning_rate": 4.690766700109659e-05, "epoch": 0.16, "percentage": 16.0, "elapsed_time": "1:57:40", "remaining_time": "10:17:48", "throughput": 755.68, "total_tokens": 5335568} {"current_steps": 1005, "total_steps": 6250, "loss": 0.8225, "learning_rate": 4.6877328366529346e-05, "epoch": 0.1608, "percentage": 16.08, "elapsed_time": "1:58:13", "remaining_time": "10:17:02", "throughput": 755.84, "total_tokens": 5361872} {"current_steps": 1010, "total_steps": 6250, "loss": 0.8552, "learning_rate": 4.684685154286599e-05, "epoch": 0.1616, "percentage": 16.16, "elapsed_time": "1:58:47", "remaining_time": "10:16:19", "throughput": 755.84, "total_tokens": 5387456} {"current_steps": 1015, "total_steps": 6250, "loss": 0.6654, "learning_rate": 4.681623672261469e-05, "epoch": 0.1624, "percentage": 16.24, "elapsed_time": "1:59:18", "remaining_time": "10:15:21", "throughput": 755.94, "total_tokens": 5411472} {"current_steps": 1020, "total_steps": 6250, "loss": 0.7339, "learning_rate": 4.678548409915532e-05, "epoch": 0.1632, "percentage": 16.32, "elapsed_time": "1:59:52", "remaining_time": "10:14:41", "throughput": 756.25, "total_tokens": 5439648} {"current_steps": 1025, "total_steps": 6250, "loss": 0.7324, "learning_rate": 4.675459386673815e-05, "epoch": 0.164, "percentage": 16.4, "elapsed_time": "2:00:25", "remaining_time": "10:13:53", "throughput": 756.79, "total_tokens": 5468416} {"current_steps": 1030, "total_steps": 6250, "loss": 0.7065, "learning_rate": 4.6723566220482664e-05, "epoch": 0.1648, "percentage": 16.48, "elapsed_time": "2:01:00", "remaining_time": "10:13:13", "throughput": 757.41, "total_tokens": 5498800} {"current_steps": 1035, "total_steps": 6250, "loss": 0.6822, "learning_rate": 4.669240135637635e-05, "epoch": 0.1656, "percentage": 16.56, "elapsed_time": "2:01:34", "remaining_time": "10:12:35", "throughput": 757.79, "total_tokens": 5527856} {"current_steps": 1040, "total_steps": 6250, "loss": 0.7554, "learning_rate": 4.666109947127343e-05, "epoch": 0.1664, "percentage": 16.64, "elapsed_time": "2:02:07", "remaining_time": "10:11:47", "throughput": 757.55, "total_tokens": 5550848} {"current_steps": 1045, "total_steps": 6250, "loss": 0.6784, "learning_rate": 4.662966076289362e-05, "epoch": 0.1672, "percentage": 16.72, "elapsed_time": "2:02:41", "remaining_time": "10:11:07", "throughput": 758.2, "total_tokens": 5581552} {"current_steps": 1050, "total_steps": 6250, "loss": 0.8294, "learning_rate": 4.659808542982088e-05, "epoch": 0.168, "percentage": 16.8, "elapsed_time": "2:03:14", "remaining_time": "10:10:17", "throughput": 757.95, "total_tokens": 5604288} {"current_steps": 1055, "total_steps": 6250, "loss": 0.6633, "learning_rate": 4.6566373671502196e-05, "epoch": 0.1688, "percentage": 16.88, "elapsed_time": "2:03:45", "remaining_time": "10:09:24", "throughput": 758.24, "total_tokens": 5630336} {"current_steps": 1060, "total_steps": 6250, "loss": 0.6684, "learning_rate": 4.653452568824625e-05, "epoch": 0.1696, "percentage": 16.96, "elapsed_time": "2:04:24", "remaining_time": "10:09:06", "throughput": 758.62, "total_tokens": 5662480} {"current_steps": 1065, "total_steps": 6250, "loss": 0.7109, "learning_rate": 4.650254168122222e-05, "epoch": 0.1704, "percentage": 17.04, "elapsed_time": "2:04:58", "remaining_time": "10:08:26", "throughput": 758.48, "total_tokens": 5687376} {"current_steps": 1070, "total_steps": 6250, "loss": 0.8036, "learning_rate": 4.647042185245847e-05, "epoch": 0.1712, "percentage": 17.12, "elapsed_time": "2:05:29", "remaining_time": "10:07:32", "throughput": 758.97, "total_tokens": 5714896} {"current_steps": 1075, "total_steps": 6250, "loss": 0.6575, "learning_rate": 4.643816640484131e-05, "epoch": 0.172, "percentage": 17.2, "elapsed_time": "2:06:02", "remaining_time": "10:06:46", "throughput": 759.02, "total_tokens": 5740192} {"current_steps": 1080, "total_steps": 6250, "loss": 0.7477, "learning_rate": 4.640577554211366e-05, "epoch": 0.1728, "percentage": 17.28, "elapsed_time": "2:06:37", "remaining_time": "10:06:11", "throughput": 759.23, "total_tokens": 5768656} {"current_steps": 1085, "total_steps": 6250, "loss": 0.7555, "learning_rate": 4.6373249468873833e-05, "epoch": 0.1736, "percentage": 17.36, "elapsed_time": "2:07:12", "remaining_time": "10:05:31", "throughput": 759.25, "total_tokens": 5794576} {"current_steps": 1090, "total_steps": 6250, "loss": 0.6695, "learning_rate": 4.634058839057417e-05, "epoch": 0.1744, "percentage": 17.44, "elapsed_time": "2:07:45", "remaining_time": "10:04:46", "throughput": 759.7, "total_tokens": 5823296} {"current_steps": 1095, "total_steps": 6250, "loss": 0.6948, "learning_rate": 4.63077925135198e-05, "epoch": 0.1752, "percentage": 17.52, "elapsed_time": "2:08:18", "remaining_time": "10:04:04", "throughput": 759.46, "total_tokens": 5846928} {"current_steps": 1100, "total_steps": 6250, "loss": 0.7728, "learning_rate": 4.6274862044867304e-05, "epoch": 0.176, "percentage": 17.6, "elapsed_time": "2:08:51", "remaining_time": "10:03:17", "throughput": 759.49, "total_tokens": 5871968} {"current_steps": 1105, "total_steps": 6250, "loss": 0.765, "learning_rate": 4.624179719262342e-05, "epoch": 0.1768, "percentage": 17.68, "elapsed_time": "2:09:24", "remaining_time": "10:02:33", "throughput": 759.88, "total_tokens": 5900304} {"current_steps": 1110, "total_steps": 6250, "loss": 0.6515, "learning_rate": 4.6208598165643715e-05, "epoch": 0.1776, "percentage": 17.76, "elapsed_time": "2:09:59", "remaining_time": "10:01:55", "throughput": 759.79, "total_tokens": 5925792} {"current_steps": 1115, "total_steps": 6250, "loss": 0.75, "learning_rate": 4.61752651736313e-05, "epoch": 0.1784, "percentage": 17.84, "elapsed_time": "2:10:31", "remaining_time": "10:01:07", "throughput": 759.83, "total_tokens": 5950672} {"current_steps": 1120, "total_steps": 6250, "loss": 0.6592, "learning_rate": 4.614179842713547e-05, "epoch": 0.1792, "percentage": 17.92, "elapsed_time": "2:11:10", "remaining_time": "10:00:48", "throughput": 760.52, "total_tokens": 5985552} {"current_steps": 1125, "total_steps": 6250, "loss": 0.8463, "learning_rate": 4.610819813755038e-05, "epoch": 0.18, "percentage": 18.0, "elapsed_time": "2:11:41", "remaining_time": "9:59:57", "throughput": 760.57, "total_tokens": 6009904} {"current_steps": 1130, "total_steps": 6250, "loss": 0.7349, "learning_rate": 4.607446451711372e-05, "epoch": 0.1808, "percentage": 18.08, "elapsed_time": "2:12:16", "remaining_time": "9:59:19", "throughput": 760.32, "total_tokens": 6034160} {"current_steps": 1135, "total_steps": 6250, "loss": 0.6396, "learning_rate": 4.604059777890537e-05, "epoch": 0.1816, "percentage": 18.16, "elapsed_time": "2:12:47", "remaining_time": "9:58:26", "throughput": 760.16, "total_tokens": 6056544} {"current_steps": 1140, "total_steps": 6250, "loss": 0.6164, "learning_rate": 4.6006598136846056e-05, "epoch": 0.1824, "percentage": 18.24, "elapsed_time": "2:13:24", "remaining_time": "9:58:00", "throughput": 760.06, "total_tokens": 6083920} {"current_steps": 1145, "total_steps": 6250, "loss": 0.6775, "learning_rate": 4.5972465805695996e-05, "epoch": 0.1832, "percentage": 18.32, "elapsed_time": "2:14:01", "remaining_time": "9:57:32", "throughput": 760.02, "total_tokens": 6111520} {"current_steps": 1150, "total_steps": 6250, "loss": 0.6295, "learning_rate": 4.593820100105355e-05, "epoch": 0.184, "percentage": 18.4, "elapsed_time": "2:14:36", "remaining_time": "9:56:56", "throughput": 760.38, "total_tokens": 6141056} {"current_steps": 1155, "total_steps": 6250, "loss": 0.7429, "learning_rate": 4.590380393935383e-05, "epoch": 0.1848, "percentage": 18.48, "elapsed_time": "2:15:07", "remaining_time": "9:56:03", "throughput": 760.23, "total_tokens": 6163408} {"current_steps": 1160, "total_steps": 6250, "loss": 0.7516, "learning_rate": 4.5869274837867394e-05, "epoch": 0.1856, "percentage": 18.56, "elapsed_time": "2:15:39", "remaining_time": "9:55:17", "throughput": 760.3, "total_tokens": 6188816} {"current_steps": 1165, "total_steps": 6250, "loss": 0.7524, "learning_rate": 4.583461391469879e-05, "epoch": 0.1864, "percentage": 18.64, "elapsed_time": "2:16:14", "remaining_time": "9:54:38", "throughput": 760.56, "total_tokens": 6216800} {"current_steps": 1170, "total_steps": 6250, "loss": 0.7337, "learning_rate": 4.579982138878527e-05, "epoch": 0.1872, "percentage": 18.72, "elapsed_time": "2:16:46", "remaining_time": "9:53:52", "throughput": 761.08, "total_tokens": 6245888} {"current_steps": 1175, "total_steps": 6250, "loss": 0.7891, "learning_rate": 4.5764897479895317e-05, "epoch": 0.188, "percentage": 18.8, "elapsed_time": "2:17:21", "remaining_time": "9:53:17", "throughput": 761.37, "total_tokens": 6275120} {"current_steps": 1180, "total_steps": 6250, "loss": 0.79, "learning_rate": 4.5729842408627334e-05, "epoch": 0.1888, "percentage": 18.88, "elapsed_time": "2:17:53", "remaining_time": "9:52:26", "throughput": 761.46, "total_tokens": 6299760} {"current_steps": 1185, "total_steps": 6250, "loss": 0.7506, "learning_rate": 4.5694656396408195e-05, "epoch": 0.1896, "percentage": 18.96, "elapsed_time": "2:18:27", "remaining_time": "9:51:48", "throughput": 761.56, "total_tokens": 6326720} {"current_steps": 1190, "total_steps": 6250, "loss": 0.6294, "learning_rate": 4.565933966549189e-05, "epoch": 0.1904, "percentage": 19.04, "elapsed_time": "2:19:00", "remaining_time": "9:51:02", "throughput": 761.84, "total_tokens": 6353728} {"current_steps": 1195, "total_steps": 6250, "loss": 0.7564, "learning_rate": 4.5623892438958074e-05, "epoch": 0.1912, "percentage": 19.12, "elapsed_time": "2:19:34", "remaining_time": "9:50:24", "throughput": 761.8, "total_tokens": 6379536} {"current_steps": 1200, "total_steps": 6250, "loss": 0.7683, "learning_rate": 4.558831494071069e-05, "epoch": 0.192, "percentage": 19.2, "elapsed_time": "2:20:07", "remaining_time": "9:49:41", "throughput": 762.08, "total_tokens": 6407152} {"current_steps": 1205, "total_steps": 6250, "loss": 0.7701, "learning_rate": 4.555260739547657e-05, "epoch": 0.1928, "percentage": 19.28, "elapsed_time": "2:20:40", "remaining_time": "9:48:58", "throughput": 762.33, "total_tokens": 6434480} {"current_steps": 1210, "total_steps": 6250, "loss": 0.694, "learning_rate": 4.5516770028803954e-05, "epoch": 0.1936, "percentage": 19.36, "elapsed_time": "2:21:15", "remaining_time": "9:48:24", "throughput": 762.58, "total_tokens": 6463424} {"current_steps": 1215, "total_steps": 6250, "loss": 0.7322, "learning_rate": 4.548080306706114e-05, "epoch": 0.1944, "percentage": 19.44, "elapsed_time": "2:21:48", "remaining_time": "9:47:40", "throughput": 762.41, "total_tokens": 6487136} {"current_steps": 1220, "total_steps": 6250, "loss": 0.7616, "learning_rate": 4.5444706737435014e-05, "epoch": 0.1952, "percentage": 19.52, "elapsed_time": "2:22:24", "remaining_time": "9:47:08", "throughput": 762.25, "total_tokens": 6513120} {"current_steps": 1225, "total_steps": 6250, "loss": 0.6743, "learning_rate": 4.5408481267929605e-05, "epoch": 0.196, "percentage": 19.6, "elapsed_time": "2:23:01", "remaining_time": "9:46:41", "throughput": 762.45, "total_tokens": 6543040} {"current_steps": 1230, "total_steps": 6250, "loss": 0.7377, "learning_rate": 4.5372126887364655e-05, "epoch": 0.1968, "percentage": 19.68, "elapsed_time": "2:23:35", "remaining_time": "9:46:02", "throughput": 762.85, "total_tokens": 6572432} {"current_steps": 1235, "total_steps": 6250, "loss": 0.7766, "learning_rate": 4.533564382537421e-05, "epoch": 0.1976, "percentage": 19.76, "elapsed_time": "2:24:07", "remaining_time": "9:45:13", "throughput": 762.47, "total_tokens": 6593136} {"current_steps": 1240, "total_steps": 6250, "loss": 0.7873, "learning_rate": 4.529903231240511e-05, "epoch": 0.1984, "percentage": 19.84, "elapsed_time": "2:24:42", "remaining_time": "9:44:40", "throughput": 762.56, "total_tokens": 6621024} {"current_steps": 1245, "total_steps": 6250, "loss": 0.7096, "learning_rate": 4.5262292579715556e-05, "epoch": 0.1992, "percentage": 19.92, "elapsed_time": "2:25:15", "remaining_time": "9:43:55", "throughput": 762.64, "total_tokens": 6646480} {"current_steps": 1250, "total_steps": 6250, "loss": 0.8187, "learning_rate": 4.522542485937369e-05, "epoch": 0.2, "percentage": 20.0, "elapsed_time": "2:25:47", "remaining_time": "9:43:11", "throughput": 762.92, "total_tokens": 6674032} {"current_steps": 1255, "total_steps": 6250, "loss": 0.772, "learning_rate": 4.518842938425605e-05, "epoch": 0.2008, "percentage": 20.08, "elapsed_time": "2:26:20", "remaining_time": "9:42:28", "throughput": 763.04, "total_tokens": 6700112} {"current_steps": 1260, "total_steps": 6250, "loss": 0.6796, "learning_rate": 4.5151306388046175e-05, "epoch": 0.2016, "percentage": 20.16, "elapsed_time": "2:26:54", "remaining_time": "9:41:50", "throughput": 763.14, "total_tokens": 6727008} {"current_steps": 1265, "total_steps": 6250, "loss": 0.7177, "learning_rate": 4.511405610523309e-05, "epoch": 0.2024, "percentage": 20.24, "elapsed_time": "2:27:26", "remaining_time": "9:40:59", "throughput": 763.36, "total_tokens": 6752768} {"current_steps": 1270, "total_steps": 6250, "loss": 0.7078, "learning_rate": 4.5076678771109815e-05, "epoch": 0.2032, "percentage": 20.32, "elapsed_time": "2:27:59", "remaining_time": "9:40:17", "throughput": 763.37, "total_tokens": 6778112} {"current_steps": 1275, "total_steps": 6250, "loss": 0.6496, "learning_rate": 4.503917462177192e-05, "epoch": 0.204, "percentage": 20.4, "elapsed_time": "2:28:34", "remaining_time": "9:39:44", "throughput": 763.3, "total_tokens": 6804432} {"current_steps": 1280, "total_steps": 6250, "loss": 0.6802, "learning_rate": 4.5001543894115975e-05, "epoch": 0.2048, "percentage": 20.48, "elapsed_time": "2:29:08", "remaining_time": "9:39:04", "throughput": 763.25, "total_tokens": 6829824} {"current_steps": 1285, "total_steps": 6250, "loss": 0.7187, "learning_rate": 4.496378682583813e-05, "epoch": 0.2056, "percentage": 20.56, "elapsed_time": "2:29:41", "remaining_time": "9:38:21", "throughput": 763.65, "total_tokens": 6858480} {"current_steps": 1290, "total_steps": 6250, "loss": 0.6198, "learning_rate": 4.492590365543253e-05, "epoch": 0.2064, "percentage": 20.64, "elapsed_time": "2:30:14", "remaining_time": "9:37:38", "throughput": 764.03, "total_tokens": 6886960} {"current_steps": 1295, "total_steps": 6250, "loss": 0.6105, "learning_rate": 4.488789462218987e-05, "epoch": 0.2072, "percentage": 20.72, "elapsed_time": "2:30:45", "remaining_time": "9:36:49", "throughput": 764.22, "total_tokens": 6912560} {"current_steps": 1300, "total_steps": 6250, "loss": 0.7671, "learning_rate": 4.484975996619589e-05, "epoch": 0.208, "percentage": 20.8, "elapsed_time": "2:31:16", "remaining_time": "9:35:59", "throughput": 764.52, "total_tokens": 6938912} {"current_steps": 1305, "total_steps": 6250, "loss": 0.6833, "learning_rate": 4.481149992832977e-05, "epoch": 0.2088, "percentage": 20.88, "elapsed_time": "2:31:50", "remaining_time": "9:35:23", "throughput": 764.76, "total_tokens": 6967616} {"current_steps": 1310, "total_steps": 6250, "loss": 0.7547, "learning_rate": 4.477311475026271e-05, "epoch": 0.2096, "percentage": 20.96, "elapsed_time": "2:32:25", "remaining_time": "9:34:46", "throughput": 764.75, "total_tokens": 6993872} {"current_steps": 1315, "total_steps": 6250, "loss": 0.7479, "learning_rate": 4.473460467445637e-05, "epoch": 0.2104, "percentage": 21.04, "elapsed_time": "2:32:59", "remaining_time": "9:34:09", "throughput": 764.83, "total_tokens": 7020784} {"current_steps": 1320, "total_steps": 6250, "loss": 0.761, "learning_rate": 4.46959699441613e-05, "epoch": 0.2112, "percentage": 21.12, "elapsed_time": "2:33:30", "remaining_time": "9:33:20", "throughput": 764.88, "total_tokens": 7045024} {"current_steps": 1325, "total_steps": 6250, "loss": 0.7612, "learning_rate": 4.465721080341547e-05, "epoch": 0.212, "percentage": 21.2, "elapsed_time": "2:34:03", "remaining_time": "9:32:37", "throughput": 765.13, "total_tokens": 7072448} {"current_steps": 1330, "total_steps": 6250, "loss": 0.6792, "learning_rate": 4.461832749704268e-05, "epoch": 0.2128, "percentage": 21.28, "elapsed_time": "2:34:36", "remaining_time": "9:31:55", "throughput": 765.14, "total_tokens": 7097776} {"current_steps": 1335, "total_steps": 6250, "loss": 0.7357, "learning_rate": 4.457932027065102e-05, "epoch": 0.2136, "percentage": 21.36, "elapsed_time": "2:35:10", "remaining_time": "9:31:18", "throughput": 765.1, "total_tokens": 7123568} {"current_steps": 1340, "total_steps": 6250, "loss": 0.6676, "learning_rate": 4.4540189370631315e-05, "epoch": 0.2144, "percentage": 21.44, "elapsed_time": "2:35:43", "remaining_time": "9:30:35", "throughput": 765.45, "total_tokens": 7151728} {"current_steps": 1345, "total_steps": 6250, "loss": 0.7394, "learning_rate": 4.4500935044155626e-05, "epoch": 0.2152, "percentage": 21.52, "elapsed_time": "2:36:15", "remaining_time": "9:29:52", "throughput": 765.97, "total_tokens": 7181664} {"current_steps": 1350, "total_steps": 6250, "loss": 0.8017, "learning_rate": 4.4461557539175594e-05, "epoch": 0.216, "percentage": 21.6, "elapsed_time": "2:36:50", "remaining_time": "9:29:15", "throughput": 766.22, "total_tokens": 7210336} {"current_steps": 1355, "total_steps": 6250, "loss": 0.6533, "learning_rate": 4.4422057104420946e-05, "epoch": 0.2168, "percentage": 21.68, "elapsed_time": "2:37:25", "remaining_time": "9:28:43", "throughput": 766.58, "total_tokens": 7240992} {"current_steps": 1360, "total_steps": 6250, "loss": 0.7029, "learning_rate": 4.4382433989397895e-05, "epoch": 0.2176, "percentage": 21.76, "elapsed_time": "2:37:58", "remaining_time": "9:28:00", "throughput": 766.79, "total_tokens": 7268048} {"current_steps": 1365, "total_steps": 6250, "loss": 0.7096, "learning_rate": 4.434268844438758e-05, "epoch": 0.2184, "percentage": 21.84, "elapsed_time": "2:38:32", "remaining_time": "9:27:23", "throughput": 767.14, "total_tokens": 7297616} {"current_steps": 1370, "total_steps": 6250, "loss": 0.8103, "learning_rate": 4.4302820720444456e-05, "epoch": 0.2192, "percentage": 21.92, "elapsed_time": "2:39:08", "remaining_time": "9:26:53", "throughput": 767.32, "total_tokens": 7326912} {"current_steps": 1375, "total_steps": 6250, "loss": 0.6238, "learning_rate": 4.426283106939474e-05, "epoch": 0.22, "percentage": 22.0, "elapsed_time": "2:39:44", "remaining_time": "9:26:21", "throughput": 767.4, "total_tokens": 7355136} {"current_steps": 1380, "total_steps": 6250, "loss": 0.6625, "learning_rate": 4.422271974383479e-05, "epoch": 0.2208, "percentage": 22.08, "elapsed_time": "2:40:15", "remaining_time": "9:25:32", "throughput": 767.27, "total_tokens": 7377584} {"current_steps": 1385, "total_steps": 6250, "loss": 0.6831, "learning_rate": 4.418248699712955e-05, "epoch": 0.2216, "percentage": 22.16, "elapsed_time": "2:40:49", "remaining_time": "9:24:54", "throughput": 767.47, "total_tokens": 7405552} {"current_steps": 1390, "total_steps": 6250, "loss": 0.7664, "learning_rate": 4.414213308341092e-05, "epoch": 0.2224, "percentage": 22.24, "elapsed_time": "2:41:22", "remaining_time": "9:24:13", "throughput": 767.48, "total_tokens": 7430960} {"current_steps": 1395, "total_steps": 6250, "loss": 0.7273, "learning_rate": 4.410165825757613e-05, "epoch": 0.2232, "percentage": 22.32, "elapsed_time": "2:41:56", "remaining_time": "9:23:36", "throughput": 767.47, "total_tokens": 7457136} {"current_steps": 1400, "total_steps": 6250, "loss": 0.6607, "learning_rate": 4.40610627752862e-05, "epoch": 0.224, "percentage": 22.4, "elapsed_time": "2:42:27", "remaining_time": "9:22:48", "throughput": 767.59, "total_tokens": 7482208} {"current_steps": 1405, "total_steps": 6250, "loss": 0.731, "learning_rate": 4.4020346892964246e-05, "epoch": 0.2248, "percentage": 22.48, "elapsed_time": "2:43:05", "remaining_time": "9:22:23", "throughput": 768.08, "total_tokens": 7515760} {"current_steps": 1410, "total_steps": 6250, "loss": 0.7258, "learning_rate": 4.3979510867793917e-05, "epoch": 0.2256, "percentage": 22.56, "elapsed_time": "2:43:38", "remaining_time": "9:21:42", "throughput": 768.26, "total_tokens": 7542944} {"current_steps": 1415, "total_steps": 6250, "loss": 0.6566, "learning_rate": 4.393855495771774e-05, "epoch": 0.2264, "percentage": 22.64, "elapsed_time": "2:44:15", "remaining_time": "9:21:14", "throughput": 768.5, "total_tokens": 7573760} {"current_steps": 1420, "total_steps": 6250, "loss": 0.7433, "learning_rate": 4.38974794214355e-05, "epoch": 0.2272, "percentage": 22.72, "elapsed_time": "2:44:50", "remaining_time": "9:20:43", "throughput": 769.04, "total_tokens": 7606592} {"current_steps": 1425, "total_steps": 6250, "loss": 0.7452, "learning_rate": 4.3856284518402594e-05, "epoch": 0.228, "percentage": 22.8, "elapsed_time": "2:45:22", "remaining_time": "9:19:55", "throughput": 768.86, "total_tokens": 7628672} {"current_steps": 1430, "total_steps": 6250, "loss": 0.7077, "learning_rate": 4.381497050882845e-05, "epoch": 0.2288, "percentage": 22.88, "elapsed_time": "2:45:58", "remaining_time": "9:19:25", "throughput": 769.07, "total_tokens": 7658528} {"current_steps": 1435, "total_steps": 6250, "loss": 0.6274, "learning_rate": 4.377353765367479e-05, "epoch": 0.2296, "percentage": 22.96, "elapsed_time": "2:46:30", "remaining_time": "9:18:42", "throughput": 769.24, "total_tokens": 7685248} {"current_steps": 1440, "total_steps": 6250, "loss": 0.6845, "learning_rate": 4.3731986214654035e-05, "epoch": 0.2304, "percentage": 23.04, "elapsed_time": "2:47:04", "remaining_time": "9:18:05", "throughput": 769.46, "total_tokens": 7713616} {"current_steps": 1445, "total_steps": 6250, "loss": 0.7115, "learning_rate": 4.3690316454227674e-05, "epoch": 0.2312, "percentage": 23.12, "elapsed_time": "2:47:40", "remaining_time": "9:17:32", "throughput": 769.41, "total_tokens": 7740304} {"current_steps": 1450, "total_steps": 6250, "loss": 0.7209, "learning_rate": 4.3648528635604556e-05, "epoch": 0.232, "percentage": 23.2, "elapsed_time": "2:48:11", "remaining_time": "9:16:46", "throughput": 769.64, "total_tokens": 7766848} {"current_steps": 1455, "total_steps": 6250, "loss": 0.8239, "learning_rate": 4.360662302273924e-05, "epoch": 0.2328, "percentage": 23.28, "elapsed_time": "2:48:44", "remaining_time": "9:16:05", "throughput": 769.62, "total_tokens": 7791888} {"current_steps": 1460, "total_steps": 6250, "loss": 0.6199, "learning_rate": 4.3564599880330385e-05, "epoch": 0.2336, "percentage": 23.36, "elapsed_time": "2:49:20", "remaining_time": "9:15:33", "throughput": 769.92, "total_tokens": 7822448} {"current_steps": 1465, "total_steps": 6250, "loss": 0.7481, "learning_rate": 4.352245947381898e-05, "epoch": 0.2344, "percentage": 23.44, "elapsed_time": "2:49:52", "remaining_time": "9:14:51", "throughput": 770.0, "total_tokens": 7848464} {"current_steps": 1470, "total_steps": 6250, "loss": 0.7235, "learning_rate": 4.348020206938672e-05, "epoch": 0.2352, "percentage": 23.52, "elapsed_time": "2:50:27", "remaining_time": "9:14:15", "throughput": 770.22, "total_tokens": 7877216} {"current_steps": 1475, "total_steps": 6250, "loss": 0.7345, "learning_rate": 4.343782793395435e-05, "epoch": 0.236, "percentage": 23.6, "elapsed_time": "2:51:01", "remaining_time": "9:13:38", "throughput": 770.31, "total_tokens": 7904368} {"current_steps": 1480, "total_steps": 6250, "loss": 0.7532, "learning_rate": 4.3395337335179945e-05, "epoch": 0.2368, "percentage": 23.68, "elapsed_time": "2:51:32", "remaining_time": "9:12:52", "throughput": 770.62, "total_tokens": 7931520} {"current_steps": 1485, "total_steps": 6250, "loss": 0.6902, "learning_rate": 4.335273054145722e-05, "epoch": 0.2376, "percentage": 23.76, "elapsed_time": "2:52:04", "remaining_time": "9:12:09", "throughput": 770.3, "total_tokens": 7953296} {"current_steps": 1490, "total_steps": 6250, "loss": 0.7329, "learning_rate": 4.3310007821913836e-05, "epoch": 0.2384, "percentage": 23.84, "elapsed_time": "2:52:39", "remaining_time": "9:11:35", "throughput": 770.19, "total_tokens": 7978832} {"current_steps": 1495, "total_steps": 6250, "loss": 0.6693, "learning_rate": 4.32671694464097e-05, "epoch": 0.2392, "percentage": 23.92, "elapsed_time": "2:53:13", "remaining_time": "9:10:57", "throughput": 770.19, "total_tokens": 8004992} {"current_steps": 1500, "total_steps": 6250, "loss": 0.7418, "learning_rate": 4.3224215685535294e-05, "epoch": 0.24, "percentage": 24.0, "elapsed_time": "2:53:44", "remaining_time": "9:10:11", "throughput": 770.09, "total_tokens": 8027824} {"current_steps": 1505, "total_steps": 6250, "loss": 0.6157, "learning_rate": 4.31811468106099e-05, "epoch": 0.2408, "percentage": 24.08, "elapsed_time": "2:54:19", "remaining_time": "9:09:36", "throughput": 770.47, "total_tokens": 8058528} {"current_steps": 1510, "total_steps": 6250, "loss": 0.6302, "learning_rate": 4.3137963093679945e-05, "epoch": 0.2416, "percentage": 24.16, "elapsed_time": "2:54:50", "remaining_time": "9:08:51", "throughput": 770.39, "total_tokens": 8081984} {"current_steps": 1515, "total_steps": 6250, "loss": 0.628, "learning_rate": 4.309466480751726e-05, "epoch": 0.2424, "percentage": 24.24, "elapsed_time": "2:55:26", "remaining_time": "9:08:19", "throughput": 770.75, "total_tokens": 8113216} {"current_steps": 1520, "total_steps": 6250, "loss": 0.635, "learning_rate": 4.305125222561736e-05, "epoch": 0.2432, "percentage": 24.32, "elapsed_time": "2:56:00", "remaining_time": "9:07:42", "throughput": 770.99, "total_tokens": 8142080} {"current_steps": 1525, "total_steps": 6250, "loss": 0.8114, "learning_rate": 4.3007725622197674e-05, "epoch": 0.244, "percentage": 24.4, "elapsed_time": "2:56:37", "remaining_time": "9:07:15", "throughput": 771.01, "total_tokens": 8171008} {"current_steps": 1530, "total_steps": 6250, "loss": 0.6678, "learning_rate": 4.296408527219592e-05, "epoch": 0.2448, "percentage": 24.48, "elapsed_time": "2:57:09", "remaining_time": "9:06:30", "throughput": 771.26, "total_tokens": 8197696} {"current_steps": 1535, "total_steps": 6250, "loss": 0.8364, "learning_rate": 4.292033145126825e-05, "epoch": 0.2456, "percentage": 24.56, "elapsed_time": "2:57:44", "remaining_time": "9:05:57", "throughput": 771.32, "total_tokens": 8225552} {"current_steps": 1540, "total_steps": 6250, "loss": 0.7312, "learning_rate": 4.287646443578758e-05, "epoch": 0.2464, "percentage": 24.64, "elapsed_time": "2:58:17", "remaining_time": "9:05:16", "throughput": 771.89, "total_tokens": 8257120} {"current_steps": 1545, "total_steps": 6250, "loss": 0.8067, "learning_rate": 4.283248450284182e-05, "epoch": 0.2472, "percentage": 24.72, "elapsed_time": "2:58:48", "remaining_time": "9:04:32", "throughput": 771.97, "total_tokens": 8282400} {"current_steps": 1550, "total_steps": 6250, "loss": 0.7109, "learning_rate": 4.2788391930232136e-05, "epoch": 0.248, "percentage": 24.8, "elapsed_time": "2:59:21", "remaining_time": "9:03:50", "throughput": 772.18, "total_tokens": 8309568} {"current_steps": 1555, "total_steps": 6250, "loss": 0.6543, "learning_rate": 4.2744186996471174e-05, "epoch": 0.2488, "percentage": 24.88, "elapsed_time": "2:59:53", "remaining_time": "9:03:09", "throughput": 772.56, "total_tokens": 8338864} {"current_steps": 1560, "total_steps": 6250, "loss": 0.7401, "learning_rate": 4.269986998078132e-05, "epoch": 0.2496, "percentage": 24.96, "elapsed_time": "3:00:26", "remaining_time": "9:02:29", "throughput": 772.58, "total_tokens": 8364592} {"current_steps": 1565, "total_steps": 6250, "loss": 0.7538, "learning_rate": 4.265544116309294e-05, "epoch": 0.2504, "percentage": 25.04, "elapsed_time": "3:00:59", "remaining_time": "9:01:49", "throughput": 772.68, "total_tokens": 8391120} {"current_steps": 1570, "total_steps": 6250, "loss": 0.7705, "learning_rate": 4.261090082404258e-05, "epoch": 0.2512, "percentage": 25.12, "elapsed_time": "3:01:32", "remaining_time": "9:01:09", "throughput": 772.86, "total_tokens": 8418320} {"current_steps": 1575, "total_steps": 6250, "loss": 0.6846, "learning_rate": 4.256624924497123e-05, "epoch": 0.252, "percentage": 25.2, "elapsed_time": "3:02:03", "remaining_time": "9:00:24", "throughput": 773.24, "total_tokens": 8446640} {"current_steps": 1580, "total_steps": 6250, "loss": 0.8502, "learning_rate": 4.252148670792254e-05, "epoch": 0.2528, "percentage": 25.28, "elapsed_time": "3:02:36", "remaining_time": "8:59:44", "throughput": 773.09, "total_tokens": 8470416} {"current_steps": 1585, "total_steps": 6250, "loss": 0.6987, "learning_rate": 4.2476613495641026e-05, "epoch": 0.2536, "percentage": 25.36, "elapsed_time": "3:03:09", "remaining_time": "8:59:03", "throughput": 773.33, "total_tokens": 8498160} {"current_steps": 1590, "total_steps": 6250, "loss": 0.6461, "learning_rate": 4.2431629891570266e-05, "epoch": 0.2544, "percentage": 25.44, "elapsed_time": "3:03:42", "remaining_time": "8:58:26", "throughput": 773.47, "total_tokens": 8525904} {"current_steps": 1595, "total_steps": 6250, "loss": 0.7143, "learning_rate": 4.238653617985118e-05, "epoch": 0.2552, "percentage": 25.52, "elapsed_time": "3:04:15", "remaining_time": "8:57:46", "throughput": 773.53, "total_tokens": 8551872} {"current_steps": 1600, "total_steps": 6250, "loss": 0.7215, "learning_rate": 4.234133264532012e-05, "epoch": 0.256, "percentage": 25.6, "elapsed_time": "3:04:51", "remaining_time": "8:57:14", "throughput": 773.88, "total_tokens": 8583440} {"current_steps": 1605, "total_steps": 6250, "loss": 0.8008, "learning_rate": 4.229601957350722e-05, "epoch": 0.2568, "percentage": 25.68, "elapsed_time": "3:05:22", "remaining_time": "8:56:30", "throughput": 774.05, "total_tokens": 8609632} {"current_steps": 1610, "total_steps": 6250, "loss": 0.6612, "learning_rate": 4.225059725063444e-05, "epoch": 0.2576, "percentage": 25.76, "elapsed_time": "3:05:55", "remaining_time": "8:55:49", "throughput": 773.98, "total_tokens": 8633888} {"current_steps": 1615, "total_steps": 6250, "loss": 0.7544, "learning_rate": 4.2205065963613864e-05, "epoch": 0.2584, "percentage": 25.84, "elapsed_time": "3:06:29", "remaining_time": "8:55:13", "throughput": 773.97, "total_tokens": 8660288} {"current_steps": 1620, "total_steps": 6250, "loss": 0.7569, "learning_rate": 4.2159426000045854e-05, "epoch": 0.2592, "percentage": 25.92, "elapsed_time": "3:07:04", "remaining_time": "8:54:40", "throughput": 774.11, "total_tokens": 8689184} {"current_steps": 1625, "total_steps": 6250, "loss": 0.8161, "learning_rate": 4.211367764821722e-05, "epoch": 0.26, "percentage": 26.0, "elapsed_time": "3:07:35", "remaining_time": "8:53:55", "throughput": 774.14, "total_tokens": 8713504} {"current_steps": 1630, "total_steps": 6250, "loss": 0.8283, "learning_rate": 4.206782119709942e-05, "epoch": 0.2608, "percentage": 26.08, "elapsed_time": "3:08:08", "remaining_time": "8:53:16", "throughput": 774.32, "total_tokens": 8741088} {"current_steps": 1635, "total_steps": 6250, "loss": 0.5745, "learning_rate": 4.20218569363467e-05, "epoch": 0.2616, "percentage": 26.16, "elapsed_time": "3:08:41", "remaining_time": "8:52:36", "throughput": 774.39, "total_tokens": 8767456} {"current_steps": 1640, "total_steps": 6250, "loss": 0.7525, "learning_rate": 4.197578515629435e-05, "epoch": 0.2624, "percentage": 26.24, "elapsed_time": "3:09:14", "remaining_time": "8:51:56", "throughput": 774.32, "total_tokens": 8791952} {"current_steps": 1645, "total_steps": 6250, "loss": 0.7991, "learning_rate": 4.192960614795675e-05, "epoch": 0.2632, "percentage": 26.32, "elapsed_time": "3:09:46", "remaining_time": "8:51:16", "throughput": 774.23, "total_tokens": 8816080} {"current_steps": 1650, "total_steps": 6250, "loss": 0.7297, "learning_rate": 4.188332020302561e-05, "epoch": 0.264, "percentage": 26.4, "elapsed_time": "3:10:19", "remaining_time": "8:50:36", "throughput": 774.25, "total_tokens": 8841536} {"current_steps": 1655, "total_steps": 6250, "loss": 0.6276, "learning_rate": 4.183692761386813e-05, "epoch": 0.2648, "percentage": 26.48, "elapsed_time": "3:10:52", "remaining_time": "8:49:57", "throughput": 774.49, "total_tokens": 8869872} {"current_steps": 1660, "total_steps": 6250, "loss": 0.7127, "learning_rate": 4.179042867352511e-05, "epoch": 0.2656, "percentage": 26.56, "elapsed_time": "3:11:23", "remaining_time": "8:49:12", "throughput": 774.44, "total_tokens": 8893152} {"current_steps": 1665, "total_steps": 6250, "loss": 0.7712, "learning_rate": 4.174382367570912e-05, "epoch": 0.2664, "percentage": 26.64, "elapsed_time": "3:11:57", "remaining_time": "8:48:37", "throughput": 774.72, "total_tokens": 8923040} {"current_steps": 1670, "total_steps": 6250, "loss": 0.8388, "learning_rate": 4.169711291480266e-05, "epoch": 0.2672, "percentage": 26.72, "elapsed_time": "3:12:29", "remaining_time": "8:47:54", "throughput": 774.58, "total_tokens": 8945856} {"current_steps": 1675, "total_steps": 6250, "loss": 0.7538, "learning_rate": 4.165029668585629e-05, "epoch": 0.268, "percentage": 26.8, "elapsed_time": "3:13:01", "remaining_time": "8:47:14", "throughput": 774.63, "total_tokens": 8971664} {"current_steps": 1680, "total_steps": 6250, "loss": 0.708, "learning_rate": 4.160337528458676e-05, "epoch": 0.2688, "percentage": 26.88, "elapsed_time": "3:13:36", "remaining_time": "8:46:40", "throughput": 774.4, "total_tokens": 8996064} {"current_steps": 1685, "total_steps": 6250, "loss": 0.668, "learning_rate": 4.155634900737513e-05, "epoch": 0.2696, "percentage": 26.96, "elapsed_time": "3:14:11", "remaining_time": "8:46:04", "throughput": 774.39, "total_tokens": 9022416} {"current_steps": 1690, "total_steps": 6250, "loss": 0.752, "learning_rate": 4.150921815126493e-05, "epoch": 0.2704, "percentage": 27.04, "elapsed_time": "3:14:48", "remaining_time": "8:45:38", "throughput": 774.46, "total_tokens": 9052480} {"current_steps": 1695, "total_steps": 6250, "loss": 0.6534, "learning_rate": 4.1461983013960245e-05, "epoch": 0.2712, "percentage": 27.12, "elapsed_time": "3:15:23", "remaining_time": "8:45:03", "throughput": 774.52, "total_tokens": 9079760} {"current_steps": 1700, "total_steps": 6250, "loss": 0.6808, "learning_rate": 4.1414643893823914e-05, "epoch": 0.272, "percentage": 27.2, "elapsed_time": "3:15:56", "remaining_time": "8:44:24", "throughput": 774.87, "total_tokens": 9109424} {"current_steps": 1705, "total_steps": 6250, "loss": 0.7627, "learning_rate": 4.136720108987552e-05, "epoch": 0.2728, "percentage": 27.28, "elapsed_time": "3:16:29", "remaining_time": "8:43:45", "throughput": 774.63, "total_tokens": 9132128} {"current_steps": 1710, "total_steps": 6250, "loss": 0.6527, "learning_rate": 4.131965490178959e-05, "epoch": 0.2736, "percentage": 27.36, "elapsed_time": "3:17:04", "remaining_time": "8:43:14", "throughput": 774.73, "total_tokens": 9160960} {"current_steps": 1715, "total_steps": 6250, "loss": 0.7102, "learning_rate": 4.1272005629893714e-05, "epoch": 0.2744, "percentage": 27.44, "elapsed_time": "3:17:39", "remaining_time": "8:42:39", "throughput": 775.02, "total_tokens": 9190992} {"current_steps": 1720, "total_steps": 6250, "loss": 0.67, "learning_rate": 4.122425357516658e-05, "epoch": 0.2752, "percentage": 27.52, "elapsed_time": "3:18:13", "remaining_time": "8:42:04", "throughput": 775.06, "total_tokens": 9218320} {"current_steps": 1725, "total_steps": 6250, "loss": 0.7159, "learning_rate": 4.1176399039236116e-05, "epoch": 0.276, "percentage": 27.6, "elapsed_time": "3:18:46", "remaining_time": "8:41:25", "throughput": 775.27, "total_tokens": 9246304} {"current_steps": 1730, "total_steps": 6250, "loss": 0.8248, "learning_rate": 4.112844232437757e-05, "epoch": 0.2768, "percentage": 27.68, "elapsed_time": "3:19:17", "remaining_time": "8:40:42", "throughput": 775.38, "total_tokens": 9271856} {"current_steps": 1735, "total_steps": 6250, "loss": 0.7264, "learning_rate": 4.108038373351163e-05, "epoch": 0.2776, "percentage": 27.76, "elapsed_time": "3:19:50", "remaining_time": "8:40:02", "throughput": 775.38, "total_tokens": 9297152} {"current_steps": 1740, "total_steps": 6250, "loss": 0.7368, "learning_rate": 4.1032223570202474e-05, "epoch": 0.2784, "percentage": 27.84, "elapsed_time": "3:20:22", "remaining_time": "8:39:21", "throughput": 775.8, "total_tokens": 9326896} {"current_steps": 1745, "total_steps": 6250, "loss": 0.6245, "learning_rate": 4.0983962138655873e-05, "epoch": 0.2792, "percentage": 27.92, "elapsed_time": "3:20:53", "remaining_time": "8:38:38", "throughput": 775.83, "total_tokens": 9351680} {"current_steps": 1750, "total_steps": 6250, "loss": 0.8033, "learning_rate": 4.093559974371725e-05, "epoch": 0.28, "percentage": 28.0, "elapsed_time": "3:21:24", "remaining_time": "8:37:55", "throughput": 775.75, "total_tokens": 9374896} {"current_steps": 1755, "total_steps": 6250, "loss": 0.6803, "learning_rate": 4.088713669086977e-05, "epoch": 0.2808, "percentage": 28.08, "elapsed_time": "3:21:57", "remaining_time": "8:37:16", "throughput": 775.77, "total_tokens": 9400592} {"current_steps": 1760, "total_steps": 6250, "loss": 0.7384, "learning_rate": 4.083857328623243e-05, "epoch": 0.2816, "percentage": 28.16, "elapsed_time": "3:22:33", "remaining_time": "8:36:45", "throughput": 775.85, "total_tokens": 9429280} {"current_steps": 1765, "total_steps": 6250, "loss": 0.8149, "learning_rate": 4.078990983655807e-05, "epoch": 0.2824, "percentage": 28.24, "elapsed_time": "3:23:08", "remaining_time": "8:36:11", "throughput": 775.72, "total_tokens": 9454736} {"current_steps": 1770, "total_steps": 6250, "loss": 0.7243, "learning_rate": 4.0741146649231504e-05, "epoch": 0.2832, "percentage": 28.32, "elapsed_time": "3:23:41", "remaining_time": "8:35:32", "throughput": 775.68, "total_tokens": 9479648} {"current_steps": 1775, "total_steps": 6250, "loss": 0.7639, "learning_rate": 4.0692284032267516e-05, "epoch": 0.284, "percentage": 28.4, "elapsed_time": "3:24:14", "remaining_time": "8:34:54", "throughput": 775.6, "total_tokens": 9504432} {"current_steps": 1780, "total_steps": 6250, "loss": 0.6857, "learning_rate": 4.064332229430895e-05, "epoch": 0.2848, "percentage": 28.48, "elapsed_time": "3:24:49", "remaining_time": "8:34:22", "throughput": 775.35, "total_tokens": 9528880} {"current_steps": 1785, "total_steps": 6250, "loss": 0.69, "learning_rate": 4.059426174462476e-05, "epoch": 0.2856, "percentage": 28.56, "elapsed_time": "3:25:23", "remaining_time": "8:33:46", "throughput": 775.52, "total_tokens": 9557360} {"current_steps": 1790, "total_steps": 6250, "loss": 0.704, "learning_rate": 4.054510269310803e-05, "epoch": 0.2864, "percentage": 28.64, "elapsed_time": "3:25:55", "remaining_time": "8:33:05", "throughput": 775.42, "total_tokens": 9580608} {"current_steps": 1795, "total_steps": 6250, "loss": 0.8015, "learning_rate": 4.0495845450274064e-05, "epoch": 0.2872, "percentage": 28.72, "elapsed_time": "3:26:28", "remaining_time": "8:32:27", "throughput": 775.82, "total_tokens": 9611376} {"current_steps": 1800, "total_steps": 6250, "loss": 0.7382, "learning_rate": 4.044649032725836e-05, "epoch": 0.288, "percentage": 28.8, "elapsed_time": "3:27:02", "remaining_time": "8:31:51", "throughput": 776.06, "total_tokens": 9640784} {"current_steps": 1805, "total_steps": 6250, "loss": 0.7299, "learning_rate": 4.039703763581472e-05, "epoch": 0.2888, "percentage": 28.88, "elapsed_time": "3:27:38", "remaining_time": "8:31:19", "throughput": 775.96, "total_tokens": 9667120} {"current_steps": 1810, "total_steps": 6250, "loss": 0.6402, "learning_rate": 4.0347487688313194e-05, "epoch": 0.2896, "percentage": 28.96, "elapsed_time": "3:28:14", "remaining_time": "8:30:49", "throughput": 776.08, "total_tokens": 9696832} {"current_steps": 1815, "total_steps": 6250, "loss": 0.711, "learning_rate": 4.02978407977382e-05, "epoch": 0.2904, "percentage": 29.04, "elapsed_time": "3:28:48", "remaining_time": "8:30:14", "throughput": 775.98, "total_tokens": 9722080} {"current_steps": 1820, "total_steps": 6250, "loss": 0.6587, "learning_rate": 4.024809727768648e-05, "epoch": 0.2912, "percentage": 29.12, "elapsed_time": "3:29:21", "remaining_time": "8:29:36", "throughput": 776.02, "total_tokens": 9748096} {"current_steps": 1825, "total_steps": 6250, "loss": 0.6656, "learning_rate": 4.019825744236514e-05, "epoch": 0.292, "percentage": 29.2, "elapsed_time": "3:29:54", "remaining_time": "8:28:56", "throughput": 776.08, "total_tokens": 9774128} {"current_steps": 1830, "total_steps": 6250, "loss": 0.7143, "learning_rate": 4.0148321606589656e-05, "epoch": 0.2928, "percentage": 29.28, "elapsed_time": "3:30:30", "remaining_time": "8:28:25", "throughput": 776.35, "total_tokens": 9805488} {"current_steps": 1835, "total_steps": 6250, "loss": 0.6735, "learning_rate": 4.009829008578192e-05, "epoch": 0.2936, "percentage": 29.36, "elapsed_time": "3:31:03", "remaining_time": "8:27:49", "throughput": 776.1, "total_tokens": 9828480} {"current_steps": 1840, "total_steps": 6250, "loss": 0.7395, "learning_rate": 4.0048163195968214e-05, "epoch": 0.2944, "percentage": 29.44, "elapsed_time": "3:31:39", "remaining_time": "8:27:17", "throughput": 776.69, "total_tokens": 9863648} {"current_steps": 1845, "total_steps": 6250, "loss": 0.729, "learning_rate": 3.999794125377721e-05, "epoch": 0.2952, "percentage": 29.52, "elapsed_time": "3:32:14", "remaining_time": "8:26:43", "throughput": 776.9, "total_tokens": 9893184} {"current_steps": 1850, "total_steps": 6250, "loss": 0.6565, "learning_rate": 3.9947624576437975e-05, "epoch": 0.296, "percentage": 29.6, "elapsed_time": "3:32:48", "remaining_time": "8:26:08", "throughput": 777.11, "total_tokens": 9922464} {"current_steps": 1855, "total_steps": 6250, "loss": 0.691, "learning_rate": 3.9897213481778006e-05, "epoch": 0.2968, "percentage": 29.68, "elapsed_time": "3:33:21", "remaining_time": "8:25:30", "throughput": 777.13, "total_tokens": 9948384} {"current_steps": 1860, "total_steps": 6250, "loss": 0.7408, "learning_rate": 3.984670828822118e-05, "epoch": 0.2976, "percentage": 29.76, "elapsed_time": "3:33:53", "remaining_time": "8:24:50", "throughput": 777.14, "total_tokens": 9973760} {"current_steps": 1865, "total_steps": 6250, "loss": 0.761, "learning_rate": 3.979610931478574e-05, "epoch": 0.2984, "percentage": 29.84, "elapsed_time": "3:34:28", "remaining_time": "8:24:16", "throughput": 777.22, "total_tokens": 10001648} {"current_steps": 1870, "total_steps": 6250, "loss": 0.8524, "learning_rate": 3.97454168810823e-05, "epoch": 0.2992, "percentage": 29.92, "elapsed_time": "3:35:00", "remaining_time": "8:23:37", "throughput": 777.07, "total_tokens": 10024912} {"current_steps": 1875, "total_steps": 6250, "loss": 0.7221, "learning_rate": 3.969463130731183e-05, "epoch": 0.3, "percentage": 30.0, "elapsed_time": "3:35:33", "remaining_time": "8:22:58", "throughput": 777.03, "total_tokens": 10049872} {"current_steps": 1880, "total_steps": 6250, "loss": 0.7708, "learning_rate": 3.964375291426361e-05, "epoch": 0.3008, "percentage": 30.08, "elapsed_time": "3:36:06", "remaining_time": "8:22:19", "throughput": 776.92, "total_tokens": 10073568} {"current_steps": 1885, "total_steps": 6250, "loss": 0.6842, "learning_rate": 3.959278202331322e-05, "epoch": 0.3016, "percentage": 30.16, "elapsed_time": "3:36:38", "remaining_time": "8:21:41", "throughput": 776.86, "total_tokens": 10098448} {"current_steps": 1890, "total_steps": 6250, "loss": 0.772, "learning_rate": 3.954171895642052e-05, "epoch": 0.3024, "percentage": 30.24, "elapsed_time": "3:37:10", "remaining_time": "8:20:59", "throughput": 776.9, "total_tokens": 10123168} {"current_steps": 1895, "total_steps": 6250, "loss": 0.6993, "learning_rate": 3.949056403612758e-05, "epoch": 0.3032, "percentage": 30.32, "elapsed_time": "3:37:41", "remaining_time": "8:20:17", "throughput": 777.05, "total_tokens": 10149440} {"current_steps": 1900, "total_steps": 6250, "loss": 0.7672, "learning_rate": 3.943931758555669e-05, "epoch": 0.304, "percentage": 30.4, "elapsed_time": "3:38:14", "remaining_time": "8:19:38", "throughput": 777.03, "total_tokens": 10174496} {"current_steps": 1905, "total_steps": 6250, "loss": 0.6716, "learning_rate": 3.938797992840828e-05, "epoch": 0.3048, "percentage": 30.48, "elapsed_time": "3:38:48", "remaining_time": "8:19:04", "throughput": 776.89, "total_tokens": 10199648} {"current_steps": 1910, "total_steps": 6250, "loss": 0.7062, "learning_rate": 3.933655138895889e-05, "epoch": 0.3056, "percentage": 30.56, "elapsed_time": "3:39:19", "remaining_time": "8:18:22", "throughput": 776.74, "total_tokens": 10221840} {"current_steps": 1915, "total_steps": 6250, "loss": 0.6748, "learning_rate": 3.928503229205913e-05, "epoch": 0.3064, "percentage": 30.64, "elapsed_time": "3:39:50", "remaining_time": "8:17:40", "throughput": 776.87, "total_tokens": 10247504} {"current_steps": 1920, "total_steps": 6250, "loss": 0.6331, "learning_rate": 3.9233422963131616e-05, "epoch": 0.3072, "percentage": 30.72, "elapsed_time": "3:40:23", "remaining_time": "8:17:02", "throughput": 777.24, "total_tokens": 10277984} {"current_steps": 1925, "total_steps": 6250, "loss": 0.779, "learning_rate": 3.9181723728168916e-05, "epoch": 0.308, "percentage": 30.8, "elapsed_time": "3:40:54", "remaining_time": "8:16:20", "throughput": 777.11, "total_tokens": 10300400} {"current_steps": 1930, "total_steps": 6250, "loss": 0.722, "learning_rate": 3.91299349137315e-05, "epoch": 0.3088, "percentage": 30.88, "elapsed_time": "3:41:28", "remaining_time": "8:15:45", "throughput": 777.09, "total_tokens": 10326672} {"current_steps": 1935, "total_steps": 6250, "loss": 0.6321, "learning_rate": 3.907805684694566e-05, "epoch": 0.3096, "percentage": 30.96, "elapsed_time": "3:42:03", "remaining_time": "8:15:10", "throughput": 777.36, "total_tokens": 10356864} {"current_steps": 1940, "total_steps": 6250, "loss": 0.6077, "learning_rate": 3.902608985550147e-05, "epoch": 0.3104, "percentage": 31.04, "elapsed_time": "3:42:39", "remaining_time": "8:14:39", "throughput": 777.61, "total_tokens": 10388032} {"current_steps": 1945, "total_steps": 6250, "loss": 0.6726, "learning_rate": 3.897403426765069e-05, "epoch": 0.3112, "percentage": 31.12, "elapsed_time": "3:43:14", "remaining_time": "8:14:08", "throughput": 777.69, "total_tokens": 10417152} {"current_steps": 1950, "total_steps": 6250, "loss": 0.741, "learning_rate": 3.8921890412204705e-05, "epoch": 0.312, "percentage": 31.2, "elapsed_time": "3:43:51", "remaining_time": "8:13:39", "throughput": 777.85, "total_tokens": 10448128} {"current_steps": 1955, "total_steps": 6250, "loss": 0.6555, "learning_rate": 3.886965861853244e-05, "epoch": 0.3128, "percentage": 31.28, "elapsed_time": "3:44:23", "remaining_time": "8:12:58", "throughput": 778.03, "total_tokens": 10474960} {"current_steps": 1960, "total_steps": 6250, "loss": 0.75, "learning_rate": 3.881733921655829e-05, "epoch": 0.3136, "percentage": 31.36, "elapsed_time": "3:44:57", "remaining_time": "8:12:23", "throughput": 778.13, "total_tokens": 10502848} {"current_steps": 1965, "total_steps": 6250, "loss": 0.7042, "learning_rate": 3.876493253676004e-05, "epoch": 0.3144, "percentage": 31.44, "elapsed_time": "3:45:32", "remaining_time": "8:11:48", "throughput": 778.35, "total_tokens": 10532640} {"current_steps": 1970, "total_steps": 6250, "loss": 0.6188, "learning_rate": 3.871243891016676e-05, "epoch": 0.3152, "percentage": 31.52, "elapsed_time": "3:46:06", "remaining_time": "8:11:13", "throughput": 778.42, "total_tokens": 10560096} {"current_steps": 1975, "total_steps": 6250, "loss": 0.8165, "learning_rate": 3.865985866835673e-05, "epoch": 0.316, "percentage": 31.6, "elapsed_time": "3:46:38", "remaining_time": "8:10:35", "throughput": 778.42, "total_tokens": 10585520} {"current_steps": 1980, "total_steps": 6250, "loss": 0.7437, "learning_rate": 3.8607192143455326e-05, "epoch": 0.3168, "percentage": 31.68, "elapsed_time": "3:47:13", "remaining_time": "8:10:01", "throughput": 778.57, "total_tokens": 10614560} {"current_steps": 1985, "total_steps": 6250, "loss": 0.7758, "learning_rate": 3.8554439668132946e-05, "epoch": 0.3176, "percentage": 31.76, "elapsed_time": "3:47:44", "remaining_time": "8:09:19", "throughput": 778.46, "total_tokens": 10637344} {"current_steps": 1990, "total_steps": 6250, "loss": 0.7593, "learning_rate": 3.85016015756029e-05, "epoch": 0.3184, "percentage": 31.84, "elapsed_time": "3:48:17", "remaining_time": "8:08:41", "throughput": 778.52, "total_tokens": 10663440} {"current_steps": 1995, "total_steps": 6250, "loss": 0.6535, "learning_rate": 3.844867819961928e-05, "epoch": 0.3192, "percentage": 31.92, "elapsed_time": "3:48:51", "remaining_time": "8:08:06", "throughput": 778.76, "total_tokens": 10693392} {"current_steps": 2000, "total_steps": 6250, "loss": 0.8263, "learning_rate": 3.8395669874474915e-05, "epoch": 0.32, "percentage": 32.0, "elapsed_time": "3:49:25", "remaining_time": "8:07:32", "throughput": 778.69, "total_tokens": 10719232} {"current_steps": 2005, "total_steps": 6250, "loss": 0.7992, "learning_rate": 3.8342576934999184e-05, "epoch": 0.3208, "percentage": 32.08, "elapsed_time": "3:49:58", "remaining_time": "8:06:55", "throughput": 778.8, "total_tokens": 10746560} {"current_steps": 2010, "total_steps": 6250, "loss": 0.7513, "learning_rate": 3.828939971655595e-05, "epoch": 0.3216, "percentage": 32.16, "elapsed_time": "3:50:29", "remaining_time": "8:06:13", "throughput": 778.65, "total_tokens": 10768512} {"current_steps": 2015, "total_steps": 6250, "loss": 0.6775, "learning_rate": 3.8236138555041434e-05, "epoch": 0.3224, "percentage": 32.24, "elapsed_time": "3:51:04", "remaining_time": "8:05:39", "throughput": 779.24, "total_tokens": 10803648} {"current_steps": 2020, "total_steps": 6250, "loss": 0.7856, "learning_rate": 3.8182793786882065e-05, "epoch": 0.3232, "percentage": 32.32, "elapsed_time": "3:51:39", "remaining_time": "8:05:05", "throughput": 779.23, "total_tokens": 10830640} {"current_steps": 2025, "total_steps": 6250, "loss": 0.6793, "learning_rate": 3.81293657490324e-05, "epoch": 0.324, "percentage": 32.4, "elapsed_time": "3:52:13", "remaining_time": "8:04:30", "throughput": 779.46, "total_tokens": 10860272} {"current_steps": 2030, "total_steps": 6250, "loss": 0.6546, "learning_rate": 3.8075854778972955e-05, "epoch": 0.3248, "percentage": 32.48, "elapsed_time": "3:52:48", "remaining_time": "8:03:58", "throughput": 779.44, "total_tokens": 10887664} {"current_steps": 2035, "total_steps": 6250, "loss": 0.6673, "learning_rate": 3.802226121470811e-05, "epoch": 0.3256, "percentage": 32.56, "elapsed_time": "3:53:22", "remaining_time": "8:03:23", "throughput": 779.27, "total_tokens": 10912000} {"current_steps": 2040, "total_steps": 6250, "loss": 0.6933, "learning_rate": 3.796858539476394e-05, "epoch": 0.3264, "percentage": 32.64, "elapsed_time": "3:53:55", "remaining_time": "8:02:45", "throughput": 779.21, "total_tokens": 10936704} {"current_steps": 2045, "total_steps": 6250, "loss": 0.6593, "learning_rate": 3.7914827658186103e-05, "epoch": 0.3272, "percentage": 32.72, "elapsed_time": "3:54:26", "remaining_time": "8:02:04", "throughput": 779.18, "total_tokens": 10960464} {"current_steps": 2050, "total_steps": 6250, "loss": 0.6246, "learning_rate": 3.786098834453766e-05, "epoch": 0.328, "percentage": 32.8, "elapsed_time": "3:55:00", "remaining_time": "8:01:29", "throughput": 779.37, "total_tokens": 10989680} {"current_steps": 2055, "total_steps": 6250, "loss": 0.7029, "learning_rate": 3.780706779389701e-05, "epoch": 0.3288, "percentage": 32.88, "elapsed_time": "3:55:33", "remaining_time": "8:00:51", "throughput": 779.36, "total_tokens": 11014928} {"current_steps": 2060, "total_steps": 6250, "loss": 0.7331, "learning_rate": 3.775306634685562e-05, "epoch": 0.3296, "percentage": 32.96, "elapsed_time": "3:56:06", "remaining_time": "8:00:14", "throughput": 779.44, "total_tokens": 11041920} {"current_steps": 2065, "total_steps": 6250, "loss": 0.6624, "learning_rate": 3.7698984344515997e-05, "epoch": 0.3304, "percentage": 33.04, "elapsed_time": "3:56:43", "remaining_time": "7:59:44", "throughput": 779.43, "total_tokens": 11070304} {"current_steps": 2070, "total_steps": 6250, "loss": 0.7505, "learning_rate": 3.764482212848948e-05, "epoch": 0.3312, "percentage": 33.12, "elapsed_time": "3:57:16", "remaining_time": "7:59:07", "throughput": 779.68, "total_tokens": 11099520} {"current_steps": 2075, "total_steps": 6250, "loss": 0.6908, "learning_rate": 3.759058004089402e-05, "epoch": 0.332, "percentage": 33.2, "elapsed_time": "3:57:48", "remaining_time": "7:58:29", "throughput": 779.96, "total_tokens": 11129008} {"current_steps": 2080, "total_steps": 6250, "loss": 0.7062, "learning_rate": 3.753625842435216e-05, "epoch": 0.3328, "percentage": 33.28, "elapsed_time": "3:58:19", "remaining_time": "7:57:48", "throughput": 779.84, "total_tokens": 11151600} {"current_steps": 2085, "total_steps": 6250, "loss": 0.7177, "learning_rate": 3.748185762198873e-05, "epoch": 0.3336, "percentage": 33.36, "elapsed_time": "3:58:51", "remaining_time": "7:57:08", "throughput": 779.88, "total_tokens": 11176784} {"current_steps": 2090, "total_steps": 6250, "loss": 0.7504, "learning_rate": 3.742737797742878e-05, "epoch": 0.3344, "percentage": 33.44, "elapsed_time": "3:59:23", "remaining_time": "7:56:30", "throughput": 780.09, "total_tokens": 11205008} {"current_steps": 2095, "total_steps": 6250, "loss": 0.7144, "learning_rate": 3.7372819834795335e-05, "epoch": 0.3352, "percentage": 33.52, "elapsed_time": "3:59:56", "remaining_time": "7:55:51", "throughput": 780.06, "total_tokens": 11229872} {"current_steps": 2100, "total_steps": 6250, "loss": 0.6876, "learning_rate": 3.731818353870729e-05, "epoch": 0.336, "percentage": 33.6, "elapsed_time": "4:00:28", "remaining_time": "7:55:14", "throughput": 779.92, "total_tokens": 11253296} {"current_steps": 2105, "total_steps": 6250, "loss": 0.7102, "learning_rate": 3.726346943427719e-05, "epoch": 0.3368, "percentage": 33.68, "elapsed_time": "4:01:02", "remaining_time": "7:54:37", "throughput": 779.93, "total_tokens": 11279408} {"current_steps": 2110, "total_steps": 6250, "loss": 0.7708, "learning_rate": 3.720867786710904e-05, "epoch": 0.3376, "percentage": 33.76, "elapsed_time": "4:01:36", "remaining_time": "7:54:02", "throughput": 779.81, "total_tokens": 11304176} {"current_steps": 2115, "total_steps": 6250, "loss": 0.5882, "learning_rate": 3.7153809183296176e-05, "epoch": 0.3384, "percentage": 33.84, "elapsed_time": "4:02:07", "remaining_time": "7:53:22", "throughput": 779.97, "total_tokens": 11330944} {"current_steps": 2120, "total_steps": 6250, "loss": 0.6127, "learning_rate": 3.7098863729419e-05, "epoch": 0.3392, "percentage": 33.92, "elapsed_time": "4:02:38", "remaining_time": "7:52:41", "throughput": 779.89, "total_tokens": 11354064} {"current_steps": 2125, "total_steps": 6250, "loss": 0.7732, "learning_rate": 3.704384185254288e-05, "epoch": 0.34, "percentage": 34.0, "elapsed_time": "4:03:10", "remaining_time": "7:52:01", "throughput": 779.73, "total_tokens": 11376288} {"current_steps": 2130, "total_steps": 6250, "loss": 0.7334, "learning_rate": 3.6988743900215894e-05, "epoch": 0.3408, "percentage": 34.08, "elapsed_time": "4:03:44", "remaining_time": "7:51:27", "throughput": 779.89, "total_tokens": 11405472} {"current_steps": 2135, "total_steps": 6250, "loss": 0.8137, "learning_rate": 3.693357022046665e-05, "epoch": 0.3416, "percentage": 34.16, "elapsed_time": "4:04:15", "remaining_time": "7:50:47", "throughput": 780.0, "total_tokens": 11431552} {"current_steps": 2140, "total_steps": 6250, "loss": 0.6987, "learning_rate": 3.68783211618021e-05, "epoch": 0.3424, "percentage": 34.24, "elapsed_time": "4:04:49", "remaining_time": "7:50:12", "throughput": 780.07, "total_tokens": 11459152} {"current_steps": 2145, "total_steps": 6250, "loss": 0.6614, "learning_rate": 3.682299707320532e-05, "epoch": 0.3432, "percentage": 34.32, "elapsed_time": "4:05:24", "remaining_time": "7:49:39", "throughput": 780.16, "total_tokens": 11487552} {"current_steps": 2150, "total_steps": 6250, "loss": 0.688, "learning_rate": 3.6767598304133324e-05, "epoch": 0.344, "percentage": 34.4, "elapsed_time": "4:05:58", "remaining_time": "7:49:04", "throughput": 780.27, "total_tokens": 11515792} {"current_steps": 2155, "total_steps": 6250, "loss": 0.7897, "learning_rate": 3.671212520451484e-05, "epoch": 0.3448, "percentage": 34.48, "elapsed_time": "4:06:32", "remaining_time": "7:48:29", "throughput": 780.21, "total_tokens": 11541280} {"current_steps": 2160, "total_steps": 6250, "loss": 0.7086, "learning_rate": 3.665657812474812e-05, "epoch": 0.3456, "percentage": 34.56, "elapsed_time": "4:07:09", "remaining_time": "7:48:00", "throughput": 780.15, "total_tokens": 11569440} {"current_steps": 2165, "total_steps": 6250, "loss": 0.7421, "learning_rate": 3.660095741569871e-05, "epoch": 0.3464, "percentage": 34.64, "elapsed_time": "4:07:44", "remaining_time": "7:47:27", "throughput": 780.22, "total_tokens": 11597792} {"current_steps": 2170, "total_steps": 6250, "loss": 0.6954, "learning_rate": 3.654526342869724e-05, "epoch": 0.3472, "percentage": 34.72, "elapsed_time": "4:08:17", "remaining_time": "7:46:49", "throughput": 780.2, "total_tokens": 11622864} {"current_steps": 2175, "total_steps": 6250, "loss": 0.6764, "learning_rate": 3.6489496515537204e-05, "epoch": 0.348, "percentage": 34.8, "elapsed_time": "4:08:49", "remaining_time": "7:46:11", "throughput": 780.41, "total_tokens": 11651280} {"current_steps": 2180, "total_steps": 6250, "loss": 0.705, "learning_rate": 3.643365702847272e-05, "epoch": 0.3488, "percentage": 34.88, "elapsed_time": "4:09:25", "remaining_time": "7:45:40", "throughput": 780.47, "total_tokens": 11680048} {"current_steps": 2185, "total_steps": 6250, "loss": 0.7433, "learning_rate": 3.6377745320216346e-05, "epoch": 0.3496, "percentage": 34.96, "elapsed_time": "4:09:56", "remaining_time": "7:44:59", "throughput": 780.32, "total_tokens": 11702144} {"current_steps": 2190, "total_steps": 6250, "loss": 0.653, "learning_rate": 3.632176174393682e-05, "epoch": 0.3504, "percentage": 35.04, "elapsed_time": "4:10:29", "remaining_time": "7:44:22", "throughput": 780.4, "total_tokens": 11728816} {"current_steps": 2195, "total_steps": 6250, "loss": 0.6381, "learning_rate": 3.626570665325684e-05, "epoch": 0.3512, "percentage": 35.12, "elapsed_time": "4:11:04", "remaining_time": "7:43:50", "throughput": 780.41, "total_tokens": 11756688} {"current_steps": 2200, "total_steps": 6250, "loss": 0.7347, "learning_rate": 3.6209580402250815e-05, "epoch": 0.352, "percentage": 35.2, "elapsed_time": "4:11:35", "remaining_time": "7:43:10", "throughput": 780.45, "total_tokens": 11781664} {"current_steps": 2205, "total_steps": 6250, "loss": 0.8036, "learning_rate": 3.615338334544265e-05, "epoch": 0.3528, "percentage": 35.28, "elapsed_time": "4:12:09", "remaining_time": "7:42:34", "throughput": 780.49, "total_tokens": 11808352} {"current_steps": 2210, "total_steps": 6250, "loss": 0.7486, "learning_rate": 3.6097115837803505e-05, "epoch": 0.3536, "percentage": 35.36, "elapsed_time": "4:12:43", "remaining_time": "7:41:59", "throughput": 780.59, "total_tokens": 11836400} {"current_steps": 2215, "total_steps": 6250, "loss": 0.7885, "learning_rate": 3.604077823474954e-05, "epoch": 0.3544, "percentage": 35.44, "elapsed_time": "4:13:16", "remaining_time": "7:41:22", "throughput": 780.63, "total_tokens": 11862608} {"current_steps": 2220, "total_steps": 6250, "loss": 0.7005, "learning_rate": 3.5984370892139666e-05, "epoch": 0.3552, "percentage": 35.52, "elapsed_time": "4:13:47", "remaining_time": "7:40:43", "throughput": 780.57, "total_tokens": 11886528} {"current_steps": 2225, "total_steps": 6250, "loss": 0.607, "learning_rate": 3.592789416627332e-05, "epoch": 0.356, "percentage": 35.6, "elapsed_time": "4:14:30", "remaining_time": "7:40:23", "throughput": 780.28, "total_tokens": 11915040} {"current_steps": 2230, "total_steps": 6250, "loss": 0.6723, "learning_rate": 3.5871348413888204e-05, "epoch": 0.3568, "percentage": 35.68, "elapsed_time": "4:15:29", "remaining_time": "7:40:33", "throughput": 779.08, "total_tokens": 11942768} {"current_steps": 2235, "total_steps": 6250, "loss": 0.7302, "learning_rate": 3.581473399215802e-05, "epoch": 0.3576, "percentage": 35.76, "elapsed_time": "4:15:59", "remaining_time": "7:39:51", "throughput": 779.88, "total_tokens": 11978464} {"current_steps": 2240, "total_steps": 6250, "loss": 0.6867, "learning_rate": 3.575805125869022e-05, "epoch": 0.3584, "percentage": 35.84, "elapsed_time": "4:16:20", "remaining_time": "7:38:54", "throughput": 780.28, "total_tokens": 12001392} {"current_steps": 2245, "total_steps": 6250, "loss": 0.7346, "learning_rate": 3.5701300571523755e-05, "epoch": 0.3592, "percentage": 35.92, "elapsed_time": "4:16:47", "remaining_time": "7:38:06", "throughput": 780.82, "total_tokens": 12030352} {"current_steps": 2250, "total_steps": 6250, "loss": 0.6381, "learning_rate": 3.564448228912682e-05, "epoch": 0.36, "percentage": 36.0, "elapsed_time": "4:17:14", "remaining_time": "7:37:19", "throughput": 781.5, "total_tokens": 12062384} {"current_steps": 2255, "total_steps": 6250, "loss": 0.7679, "learning_rate": 3.558759677039455e-05, "epoch": 0.3608, "percentage": 36.08, "elapsed_time": "4:17:37", "remaining_time": "7:36:24", "throughput": 782.11, "total_tokens": 12089408} {"current_steps": 2260, "total_steps": 6250, "loss": 0.668, "learning_rate": 3.5530644374646815e-05, "epoch": 0.3616, "percentage": 36.16, "elapsed_time": "4:18:01", "remaining_time": "7:35:33", "throughput": 782.51, "total_tokens": 12114656} {"current_steps": 2265, "total_steps": 6250, "loss": 0.7454, "learning_rate": 3.547362546162588e-05, "epoch": 0.3624, "percentage": 36.24, "elapsed_time": "4:18:27", "remaining_time": "7:34:44", "throughput": 783.14, "total_tokens": 12144832} {"current_steps": 2270, "total_steps": 6250, "loss": 0.7513, "learning_rate": 3.54165403914942e-05, "epoch": 0.3632, "percentage": 36.32, "elapsed_time": "4:18:49", "remaining_time": "7:33:48", "throughput": 783.67, "total_tokens": 12170096} {"current_steps": 2275, "total_steps": 6250, "loss": 0.7881, "learning_rate": 3.535938952483211e-05, "epoch": 0.364, "percentage": 36.4, "elapsed_time": "4:19:09", "remaining_time": "7:32:49", "throughput": 784.0, "total_tokens": 12191104} {"current_steps": 2280, "total_steps": 6250, "loss": 0.7253, "learning_rate": 3.5302173222635524e-05, "epoch": 0.3648, "percentage": 36.48, "elapsed_time": "4:19:30", "remaining_time": "7:31:51", "throughput": 784.46, "total_tokens": 12214416} {"current_steps": 2285, "total_steps": 6250, "loss": 0.8122, "learning_rate": 3.5244891846313736e-05, "epoch": 0.3656, "percentage": 36.56, "elapsed_time": "4:19:52", "remaining_time": "7:30:56", "throughput": 785.08, "total_tokens": 12241344} {"current_steps": 2290, "total_steps": 6250, "loss": 0.6188, "learning_rate": 3.5187545757687015e-05, "epoch": 0.3664, "percentage": 36.64, "elapsed_time": "4:20:17", "remaining_time": "7:30:06", "throughput": 785.63, "total_tokens": 12269376} {"current_steps": 2295, "total_steps": 6250, "loss": 0.7138, "learning_rate": 3.5130135318984456e-05, "epoch": 0.3672, "percentage": 36.72, "elapsed_time": "4:20:40", "remaining_time": "7:29:13", "throughput": 786.11, "total_tokens": 12294960} {"current_steps": 2300, "total_steps": 6250, "loss": 0.7425, "learning_rate": 3.507266089284157e-05, "epoch": 0.368, "percentage": 36.8, "elapsed_time": "4:21:00", "remaining_time": "7:28:15", "throughput": 786.61, "total_tokens": 12318864} {"current_steps": 2305, "total_steps": 6250, "loss": 0.7238, "learning_rate": 3.501512284229807e-05, "epoch": 0.3688, "percentage": 36.88, "elapsed_time": "4:21:24", "remaining_time": "7:27:23", "throughput": 787.13, "total_tokens": 12345520} {"current_steps": 2310, "total_steps": 6250, "loss": 0.684, "learning_rate": 3.495752153079557e-05, "epoch": 0.3696, "percentage": 36.96, "elapsed_time": "4:21:44", "remaining_time": "7:26:26", "throughput": 787.62, "total_tokens": 12369600} {"current_steps": 2315, "total_steps": 6250, "loss": 0.707, "learning_rate": 3.489985732217525e-05, "epoch": 0.3704, "percentage": 37.04, "elapsed_time": "4:22:06", "remaining_time": "7:25:31", "throughput": 788.11, "total_tokens": 12394400} {"current_steps": 2320, "total_steps": 6250, "loss": 0.5843, "learning_rate": 3.484213058067559e-05, "epoch": 0.3712, "percentage": 37.12, "elapsed_time": "4:22:29", "remaining_time": "7:24:39", "throughput": 788.63, "total_tokens": 12420848} {"current_steps": 2325, "total_steps": 6250, "loss": 0.7014, "learning_rate": 3.4784341670930065e-05, "epoch": 0.372, "percentage": 37.2, "elapsed_time": "4:22:51", "remaining_time": "7:23:45", "throughput": 789.13, "total_tokens": 12446192} {"current_steps": 2330, "total_steps": 6250, "loss": 0.777, "learning_rate": 3.4726490957964834e-05, "epoch": 0.3728, "percentage": 37.28, "elapsed_time": "4:23:19", "remaining_time": "7:23:01", "throughput": 789.45, "total_tokens": 12472960} {"current_steps": 2335, "total_steps": 6250, "loss": 0.6856, "learning_rate": 3.466857880719645e-05, "epoch": 0.3736, "percentage": 37.36, "elapsed_time": "4:23:48", "remaining_time": "7:22:18", "throughput": 790.0, "total_tokens": 12504256} {"current_steps": 2340, "total_steps": 6250, "loss": 0.7742, "learning_rate": 3.461060558442952e-05, "epoch": 0.3744, "percentage": 37.44, "elapsed_time": "4:24:13", "remaining_time": "7:21:29", "throughput": 790.38, "total_tokens": 12529872} {"current_steps": 2345, "total_steps": 6250, "loss": 0.6815, "learning_rate": 3.455257165585444e-05, "epoch": 0.3752, "percentage": 37.52, "elapsed_time": "4:24:37", "remaining_time": "7:20:39", "throughput": 790.6, "total_tokens": 12552368} {"current_steps": 2350, "total_steps": 6250, "loss": 0.677, "learning_rate": 3.4494477388045035e-05, "epoch": 0.376, "percentage": 37.6, "elapsed_time": "4:25:01", "remaining_time": "7:19:49", "throughput": 790.91, "total_tokens": 12576720} {"current_steps": 2355, "total_steps": 6250, "loss": 0.6239, "learning_rate": 3.443632314795627e-05, "epoch": 0.3768, "percentage": 37.68, "elapsed_time": "4:25:24", "remaining_time": "7:18:57", "throughput": 791.63, "total_tokens": 12606096} {"current_steps": 2360, "total_steps": 6250, "loss": 0.7379, "learning_rate": 3.437810930292195e-05, "epoch": 0.3776, "percentage": 37.76, "elapsed_time": "4:25:46", "remaining_time": "7:18:04", "throughput": 792.11, "total_tokens": 12631376} {"current_steps": 2365, "total_steps": 6250, "loss": 0.7315, "learning_rate": 3.4319836220652335e-05, "epoch": 0.3784, "percentage": 37.84, "elapsed_time": "4:26:09", "remaining_time": "7:17:12", "throughput": 792.91, "total_tokens": 12662096} {"current_steps": 2370, "total_steps": 6250, "loss": 0.7738, "learning_rate": 3.4261504269231904e-05, "epoch": 0.3792, "percentage": 37.92, "elapsed_time": "4:26:34", "remaining_time": "7:16:25", "throughput": 793.5, "total_tokens": 12691696} {"current_steps": 2375, "total_steps": 6250, "loss": 0.7307, "learning_rate": 3.4203113817116957e-05, "epoch": 0.38, "percentage": 38.0, "elapsed_time": "4:26:57", "remaining_time": "7:15:33", "throughput": 794.05, "total_tokens": 12718368} {"current_steps": 2380, "total_steps": 6250, "loss": 0.7119, "learning_rate": 3.414466523313332e-05, "epoch": 0.3808, "percentage": 38.08, "elapsed_time": "4:27:20", "remaining_time": "7:14:43", "throughput": 794.45, "total_tokens": 12743664} {"current_steps": 2385, "total_steps": 6250, "loss": 0.781, "learning_rate": 3.408615888647402e-05, "epoch": 0.3816, "percentage": 38.16, "elapsed_time": "4:27:44", "remaining_time": "7:13:53", "throughput": 795.24, "total_tokens": 12775088} {"current_steps": 2390, "total_steps": 6250, "loss": 0.6256, "learning_rate": 3.402759514669694e-05, "epoch": 0.3824, "percentage": 38.24, "elapsed_time": "4:28:08", "remaining_time": "7:13:03", "throughput": 795.77, "total_tokens": 12802576} {"current_steps": 2395, "total_steps": 6250, "loss": 0.7672, "learning_rate": 3.3968974383722495e-05, "epoch": 0.3832, "percentage": 38.32, "elapsed_time": "4:28:31", "remaining_time": "7:12:13", "throughput": 796.38, "total_tokens": 12831280} {"current_steps": 2400, "total_steps": 6250, "loss": 0.7665, "learning_rate": 3.3910296967831266e-05, "epoch": 0.384, "percentage": 38.4, "elapsed_time": "4:28:52", "remaining_time": "7:11:19", "throughput": 796.76, "total_tokens": 12853744} {"current_steps": 2405, "total_steps": 6250, "loss": 0.6321, "learning_rate": 3.3851563269661726e-05, "epoch": 0.3848, "percentage": 38.48, "elapsed_time": "4:29:14", "remaining_time": "7:10:26", "throughput": 797.51, "total_tokens": 12883408} {"current_steps": 2410, "total_steps": 6250, "loss": 0.7086, "learning_rate": 3.379277366020782e-05, "epoch": 0.3856, "percentage": 38.56, "elapsed_time": "4:29:35", "remaining_time": "7:09:33", "throughput": 798.4, "total_tokens": 12914592} {"current_steps": 2415, "total_steps": 6250, "loss": 0.7712, "learning_rate": 3.373392851081668e-05, "epoch": 0.3864, "percentage": 38.64, "elapsed_time": "4:29:56", "remaining_time": "7:08:40", "throughput": 798.73, "total_tokens": 12936832} {"current_steps": 2420, "total_steps": 6250, "loss": 0.6844, "learning_rate": 3.367502819318624e-05, "epoch": 0.3872, "percentage": 38.72, "elapsed_time": "4:30:20", "remaining_time": "7:07:51", "throughput": 799.16, "total_tokens": 12962864} {"current_steps": 2425, "total_steps": 6250, "loss": 0.6877, "learning_rate": 3.3616073079362926e-05, "epoch": 0.388, "percentage": 38.8, "elapsed_time": "4:30:44", "remaining_time": "7:07:03", "throughput": 799.79, "total_tokens": 12992560} {"current_steps": 2430, "total_steps": 6250, "loss": 0.8139, "learning_rate": 3.355706354173928e-05, "epoch": 0.3888, "percentage": 38.88, "elapsed_time": "4:31:07", "remaining_time": "7:06:12", "throughput": 800.09, "total_tokens": 13015440} {"current_steps": 2435, "total_steps": 6250, "loss": 0.6696, "learning_rate": 3.349799995305162e-05, "epoch": 0.3896, "percentage": 38.96, "elapsed_time": "4:31:28", "remaining_time": "7:05:19", "throughput": 800.5, "total_tokens": 13039008} {"current_steps": 2440, "total_steps": 6250, "loss": 0.7001, "learning_rate": 3.343888268637765e-05, "epoch": 0.3904, "percentage": 39.04, "elapsed_time": "4:31:51", "remaining_time": "7:04:29", "throughput": 801.14, "total_tokens": 13067648} {"current_steps": 2445, "total_steps": 6250, "loss": 0.8036, "learning_rate": 3.337971211513417e-05, "epoch": 0.3912, "percentage": 39.12, "elapsed_time": "4:32:12", "remaining_time": "7:03:37", "throughput": 801.45, "total_tokens": 13090064} {"current_steps": 2450, "total_steps": 6250, "loss": 0.7405, "learning_rate": 3.332048861307467e-05, "epoch": 0.392, "percentage": 39.2, "elapsed_time": "4:32:36", "remaining_time": "7:02:49", "throughput": 802.12, "total_tokens": 13119856} {"current_steps": 2455, "total_steps": 6250, "loss": 0.6975, "learning_rate": 3.3261212554286975e-05, "epoch": 0.3928, "percentage": 39.28, "elapsed_time": "4:32:58", "remaining_time": "7:01:58", "throughput": 802.77, "total_tokens": 13148288} {"current_steps": 2460, "total_steps": 6250, "loss": 0.6809, "learning_rate": 3.320188431319088e-05, "epoch": 0.3936, "percentage": 39.36, "elapsed_time": "4:33:21", "remaining_time": "7:01:08", "throughput": 803.33, "total_tokens": 13175616} {"current_steps": 2465, "total_steps": 6250, "loss": 0.7749, "learning_rate": 3.3142504264535804e-05, "epoch": 0.3944, "percentage": 39.44, "elapsed_time": "4:33:46", "remaining_time": "7:00:22", "throughput": 803.54, "total_tokens": 13199280} {"current_steps": 2470, "total_steps": 6250, "loss": 0.6873, "learning_rate": 3.3083072783398416e-05, "epoch": 0.3952, "percentage": 39.52, "elapsed_time": "4:34:08", "remaining_time": "6:59:32", "throughput": 803.98, "total_tokens": 13224640} {"current_steps": 2475, "total_steps": 6250, "loss": 0.7554, "learning_rate": 3.302359024518024e-05, "epoch": 0.396, "percentage": 39.6, "elapsed_time": "4:34:34", "remaining_time": "6:58:47", "throughput": 804.31, "total_tokens": 13250448} {"current_steps": 2480, "total_steps": 6250, "loss": 0.7112, "learning_rate": 3.296405702560532e-05, "epoch": 0.3968, "percentage": 39.68, "elapsed_time": "4:34:59", "remaining_time": "6:58:01", "throughput": 804.48, "total_tokens": 13273472} {"current_steps": 2485, "total_steps": 6250, "loss": 0.8207, "learning_rate": 3.2904473500717824e-05, "epoch": 0.3976, "percentage": 39.76, "elapsed_time": "4:35:26", "remaining_time": "6:57:19", "throughput": 804.79, "total_tokens": 13300608} {"current_steps": 2490, "total_steps": 6250, "loss": 0.693, "learning_rate": 3.2844840046879686e-05, "epoch": 0.3984, "percentage": 39.84, "elapsed_time": "4:35:50", "remaining_time": "6:56:31", "throughput": 805.23, "total_tokens": 13326976} {"current_steps": 2495, "total_steps": 6250, "loss": 0.6826, "learning_rate": 3.278515704076821e-05, "epoch": 0.3992, "percentage": 39.92, "elapsed_time": "4:36:19", "remaining_time": "6:55:51", "throughput": 805.74, "total_tokens": 13358528} {"current_steps": 2500, "total_steps": 6250, "loss": 0.6714, "learning_rate": 3.272542485937369e-05, "epoch": 0.4, "percentage": 40.0, "elapsed_time": "4:36:40", "remaining_time": "6:55:00", "throughput": 806.25, "total_tokens": 13384096} {"current_steps": 2505, "total_steps": 6250, "loss": 0.7387, "learning_rate": 3.2665643879997056e-05, "epoch": 0.4008, "percentage": 40.08, "elapsed_time": "4:37:11", "remaining_time": "6:54:24", "throughput": 806.72, "total_tokens": 13417120} {"current_steps": 2510, "total_steps": 6250, "loss": 0.6875, "learning_rate": 3.260581448024745e-05, "epoch": 0.4016, "percentage": 40.16, "elapsed_time": "4:37:38", "remaining_time": "6:53:41", "throughput": 807.09, "total_tokens": 13444832} {"current_steps": 2515, "total_steps": 6250, "loss": 0.834, "learning_rate": 3.25459370380399e-05, "epoch": 0.4024, "percentage": 40.24, "elapsed_time": "4:38:05", "remaining_time": "6:52:58", "throughput": 807.45, "total_tokens": 13472304} {"current_steps": 2520, "total_steps": 6250, "loss": 0.7144, "learning_rate": 3.248601193159287e-05, "epoch": 0.4032, "percentage": 40.32, "elapsed_time": "4:38:26", "remaining_time": "6:52:08", "throughput": 807.83, "total_tokens": 13495984} {"current_steps": 2525, "total_steps": 6250, "loss": 0.7171, "learning_rate": 3.2426039539425876e-05, "epoch": 0.404, "percentage": 40.4, "elapsed_time": "4:38:50", "remaining_time": "6:51:21", "throughput": 808.3, "total_tokens": 13523360} {"current_steps": 2530, "total_steps": 6250, "loss": 0.7197, "learning_rate": 3.236602024035716e-05, "epoch": 0.4048, "percentage": 40.48, "elapsed_time": "4:39:17", "remaining_time": "6:50:39", "throughput": 808.59, "total_tokens": 13550016} {"current_steps": 2535, "total_steps": 6250, "loss": 0.7997, "learning_rate": 3.230595441350125e-05, "epoch": 0.4056, "percentage": 40.56, "elapsed_time": "4:39:39", "remaining_time": "6:49:50", "throughput": 809.03, "total_tokens": 13575088} {"current_steps": 2540, "total_steps": 6250, "loss": 0.7847, "learning_rate": 3.2245842438266526e-05, "epoch": 0.4064, "percentage": 40.64, "elapsed_time": "4:40:04", "remaining_time": "6:49:05", "throughput": 809.34, "total_tokens": 13600832} {"current_steps": 2545, "total_steps": 6250, "loss": 0.7213, "learning_rate": 3.2185684694352916e-05, "epoch": 0.4072, "percentage": 40.72, "elapsed_time": "4:40:33", "remaining_time": "6:48:25", "throughput": 809.55, "total_tokens": 13627328} {"current_steps": 2550, "total_steps": 6250, "loss": 0.633, "learning_rate": 3.21254815617494e-05, "epoch": 0.408, "percentage": 40.8, "elapsed_time": "4:40:56", "remaining_time": "6:47:39", "throughput": 809.85, "total_tokens": 13651664} {"current_steps": 2555, "total_steps": 6250, "loss": 0.7512, "learning_rate": 3.206523342073172e-05, "epoch": 0.4088, "percentage": 40.88, "elapsed_time": "4:41:18", "remaining_time": "6:46:48", "throughput": 810.36, "total_tokens": 13677248} {"current_steps": 2560, "total_steps": 6250, "loss": 0.703, "learning_rate": 3.2004940651859844e-05, "epoch": 0.4096, "percentage": 40.96, "elapsed_time": "4:41:42", "remaining_time": "6:46:02", "throughput": 810.9, "total_tokens": 13705904} {"current_steps": 2565, "total_steps": 6250, "loss": 0.7212, "learning_rate": 3.194460363597569e-05, "epoch": 0.4104, "percentage": 41.04, "elapsed_time": "4:42:07", "remaining_time": "6:45:19", "throughput": 811.18, "total_tokens": 13731520} {"current_steps": 2570, "total_steps": 6250, "loss": 0.7009, "learning_rate": 3.1884222754200625e-05, "epoch": 0.4112, "percentage": 41.12, "elapsed_time": "4:42:32", "remaining_time": "6:44:34", "throughput": 811.33, "total_tokens": 13753840} {"current_steps": 2575, "total_steps": 6250, "loss": 0.718, "learning_rate": 3.1823798387933134e-05, "epoch": 0.412, "percentage": 41.2, "elapsed_time": "4:43:00", "remaining_time": "6:43:53", "throughput": 811.39, "total_tokens": 13777504} {"current_steps": 2580, "total_steps": 6250, "loss": 0.6796, "learning_rate": 3.176333091884635e-05, "epoch": 0.4128, "percentage": 41.28, "elapsed_time": "4:43:34", "remaining_time": "6:43:22", "throughput": 811.4, "total_tokens": 13805392} {"current_steps": 2585, "total_steps": 6250, "loss": 0.6632, "learning_rate": 3.170282072888566e-05, "epoch": 0.4136, "percentage": 41.36, "elapsed_time": "4:44:01", "remaining_time": "6:42:40", "throughput": 811.89, "total_tokens": 13835600} {"current_steps": 2590, "total_steps": 6250, "loss": 0.743, "learning_rate": 3.1642268200266317e-05, "epoch": 0.4144, "percentage": 41.44, "elapsed_time": "4:44:21", "remaining_time": "6:41:50", "throughput": 812.49, "total_tokens": 13862528} {"current_steps": 2595, "total_steps": 6250, "loss": 0.7091, "learning_rate": 3.1581673715471006e-05, "epoch": 0.4152, "percentage": 41.52, "elapsed_time": "4:44:43", "remaining_time": "6:41:01", "throughput": 813.08, "total_tokens": 13890272} {"current_steps": 2600, "total_steps": 6250, "loss": 0.8011, "learning_rate": 3.152103765724743e-05, "epoch": 0.416, "percentage": 41.6, "elapsed_time": "4:45:08", "remaining_time": "6:40:17", "throughput": 813.24, "total_tokens": 13913328} {"current_steps": 2605, "total_steps": 6250, "loss": 0.7569, "learning_rate": 3.1460360408605866e-05, "epoch": 0.4168, "percentage": 41.68, "elapsed_time": "4:45:34", "remaining_time": "6:39:35", "throughput": 813.74, "total_tokens": 13943040} {"current_steps": 2610, "total_steps": 6250, "loss": 0.6976, "learning_rate": 3.139964235281682e-05, "epoch": 0.4176, "percentage": 41.76, "elapsed_time": "4:46:00", "remaining_time": "6:38:52", "throughput": 814.2, "total_tokens": 13971872} {"current_steps": 2615, "total_steps": 6250, "loss": 0.7039, "learning_rate": 3.1338883873408516e-05, "epoch": 0.4184, "percentage": 41.84, "elapsed_time": "4:46:50", "remaining_time": "6:38:43", "throughput": 813.32, "total_tokens": 13997456} {"current_steps": 2620, "total_steps": 6250, "loss": 0.7153, "learning_rate": 3.127808535416454e-05, "epoch": 0.4192, "percentage": 41.92, "elapsed_time": "4:47:20", "remaining_time": "6:38:06", "throughput": 813.47, "total_tokens": 14024656} {"current_steps": 2625, "total_steps": 6250, "loss": 0.7317, "learning_rate": 3.121724717912138e-05, "epoch": 0.42, "percentage": 42.0, "elapsed_time": "4:47:47", "remaining_time": "6:37:26", "throughput": 813.86, "total_tokens": 14053680} {"current_steps": 2630, "total_steps": 6250, "loss": 0.6991, "learning_rate": 3.1156369732566006e-05, "epoch": 0.4208, "percentage": 42.08, "elapsed_time": "4:48:09", "remaining_time": "6:36:37", "throughput": 814.38, "total_tokens": 14080096} {"current_steps": 2635, "total_steps": 6250, "loss": 0.7442, "learning_rate": 3.1095453399033466e-05, "epoch": 0.4216, "percentage": 42.16, "elapsed_time": "4:48:35", "remaining_time": "6:35:54", "throughput": 814.79, "total_tokens": 14108080} {"current_steps": 2640, "total_steps": 6250, "loss": 0.7026, "learning_rate": 3.103449856330443e-05, "epoch": 0.4224, "percentage": 42.24, "elapsed_time": "4:48:57", "remaining_time": "6:35:08", "throughput": 815.12, "total_tokens": 14132448} {"current_steps": 2645, "total_steps": 6250, "loss": 0.6425, "learning_rate": 3.0973505610402765e-05, "epoch": 0.4232, "percentage": 42.32, "elapsed_time": "4:49:20", "remaining_time": "6:34:21", "throughput": 815.47, "total_tokens": 14157312} {"current_steps": 2650, "total_steps": 6250, "loss": 0.7421, "learning_rate": 3.091247492559312e-05, "epoch": 0.424, "percentage": 42.4, "elapsed_time": "4:49:43", "remaining_time": "6:33:35", "throughput": 815.95, "total_tokens": 14184288} {"current_steps": 2655, "total_steps": 6250, "loss": 0.7044, "learning_rate": 3.085140689437846e-05, "epoch": 0.4248, "percentage": 42.48, "elapsed_time": "4:50:05", "remaining_time": "6:32:48", "throughput": 816.28, "total_tokens": 14207920} {"current_steps": 2660, "total_steps": 6250, "loss": 0.6892, "learning_rate": 3.0790301902497666e-05, "epoch": 0.4256, "percentage": 42.56, "elapsed_time": "4:50:29", "remaining_time": "6:32:03", "throughput": 816.75, "total_tokens": 14235504} {"current_steps": 2665, "total_steps": 6250, "loss": 0.6595, "learning_rate": 3.072916033592307e-05, "epoch": 0.4264, "percentage": 42.64, "elapsed_time": "4:50:50", "remaining_time": "6:31:14", "throughput": 817.13, "total_tokens": 14259280} {"current_steps": 2670, "total_steps": 6250, "loss": 0.6948, "learning_rate": 3.0667982580858044e-05, "epoch": 0.4272, "percentage": 42.72, "elapsed_time": "4:51:19", "remaining_time": "6:30:37", "throughput": 817.32, "total_tokens": 14286592} {"current_steps": 2675, "total_steps": 6250, "loss": 0.7009, "learning_rate": 3.0606769023734536e-05, "epoch": 0.428, "percentage": 42.8, "elapsed_time": "4:51:47", "remaining_time": "6:29:57", "throughput": 817.34, "total_tokens": 14309280} {"current_steps": 2680, "total_steps": 6250, "loss": 0.6814, "learning_rate": 3.054552005121064e-05, "epoch": 0.4288, "percentage": 42.88, "elapsed_time": "4:52:14", "remaining_time": "6:29:17", "throughput": 817.59, "total_tokens": 14335984} {"current_steps": 2685, "total_steps": 6250, "loss": 0.7468, "learning_rate": 3.0484236050168153e-05, "epoch": 0.4296, "percentage": 42.96, "elapsed_time": "4:52:37", "remaining_time": "6:28:31", "throughput": 817.96, "total_tokens": 14361024} {"current_steps": 2690, "total_steps": 6250, "loss": 0.629, "learning_rate": 3.0422917407710137e-05, "epoch": 0.4304, "percentage": 43.04, "elapsed_time": "4:53:02", "remaining_time": "6:27:48", "throughput": 818.52, "total_tokens": 14391440} {"current_steps": 2695, "total_steps": 6250, "loss": 0.7106, "learning_rate": 3.0361564511158457e-05, "epoch": 0.4312, "percentage": 43.12, "elapsed_time": "4:53:30", "remaining_time": "6:27:09", "throughput": 818.72, "total_tokens": 14417952} {"current_steps": 2700, "total_steps": 6250, "loss": 0.7136, "learning_rate": 3.0300177748051373e-05, "epoch": 0.432, "percentage": 43.2, "elapsed_time": "4:53:54", "remaining_time": "6:26:26", "throughput": 819.21, "total_tokens": 14446752} {"current_steps": 2705, "total_steps": 6250, "loss": 0.6269, "learning_rate": 3.0238757506141012e-05, "epoch": 0.4328, "percentage": 43.28, "elapsed_time": "4:54:21", "remaining_time": "6:25:45", "throughput": 819.61, "total_tokens": 14475280} {"current_steps": 2710, "total_steps": 6250, "loss": 0.6517, "learning_rate": 3.0177304173391037e-05, "epoch": 0.4336, "percentage": 43.36, "elapsed_time": "4:54:42", "remaining_time": "6:24:58", "throughput": 819.89, "total_tokens": 14498112} {"current_steps": 2715, "total_steps": 6250, "loss": 0.6903, "learning_rate": 3.0115818137974067e-05, "epoch": 0.4344, "percentage": 43.44, "elapsed_time": "4:55:07", "remaining_time": "6:24:15", "throughput": 820.31, "total_tokens": 14525664} {"current_steps": 2720, "total_steps": 6250, "loss": 0.7302, "learning_rate": 3.005429978826934e-05, "epoch": 0.4352, "percentage": 43.52, "elapsed_time": "4:55:29", "remaining_time": "6:23:29", "throughput": 820.73, "total_tokens": 14551536} {"current_steps": 2725, "total_steps": 6250, "loss": 0.7126, "learning_rate": 2.9992749512860173e-05, "epoch": 0.436, "percentage": 43.6, "elapsed_time": "4:55:52", "remaining_time": "6:22:43", "throughput": 821.01, "total_tokens": 14574560} {"current_steps": 2730, "total_steps": 6250, "loss": 0.6701, "learning_rate": 2.9931167700531578e-05, "epoch": 0.4368, "percentage": 43.68, "elapsed_time": "4:56:16", "remaining_time": "6:22:00", "throughput": 821.46, "total_tokens": 14602384} {"current_steps": 2735, "total_steps": 6250, "loss": 0.5816, "learning_rate": 2.9869554740267724e-05, "epoch": 0.4376, "percentage": 43.76, "elapsed_time": "4:56:42", "remaining_time": "6:21:19", "throughput": 822.0, "total_tokens": 14633728} {"current_steps": 2740, "total_steps": 6250, "loss": 0.7965, "learning_rate": 2.9807911021249573e-05, "epoch": 0.4384, "percentage": 43.84, "elapsed_time": "4:57:08", "remaining_time": "6:20:39", "throughput": 822.41, "total_tokens": 14662752} {"current_steps": 2745, "total_steps": 6250, "loss": 0.6396, "learning_rate": 2.9746236932852355e-05, "epoch": 0.4392, "percentage": 43.92, "elapsed_time": "4:57:32", "remaining_time": "6:19:55", "throughput": 822.9, "total_tokens": 14690896} {"current_steps": 2750, "total_steps": 6250, "loss": 0.6914, "learning_rate": 2.9684532864643122e-05, "epoch": 0.44, "percentage": 44.0, "elapsed_time": "4:57:53", "remaining_time": "6:19:08", "throughput": 823.43, "total_tokens": 14717680} {"current_steps": 2755, "total_steps": 6250, "loss": 0.7188, "learning_rate": 2.9622799206378305e-05, "epoch": 0.4408, "percentage": 44.08, "elapsed_time": "4:58:16", "remaining_time": "6:18:24", "throughput": 823.84, "total_tokens": 14744176} {"current_steps": 2760, "total_steps": 6250, "loss": 0.6936, "learning_rate": 2.956103634800126e-05, "epoch": 0.4416, "percentage": 44.16, "elapsed_time": "4:58:42", "remaining_time": "6:17:42", "throughput": 824.25, "total_tokens": 14772464} {"current_steps": 2765, "total_steps": 6250, "loss": 0.709, "learning_rate": 2.949924467963975e-05, "epoch": 0.4424, "percentage": 44.24, "elapsed_time": "4:59:06", "remaining_time": "6:16:59", "throughput": 824.72, "total_tokens": 14800896} {"current_steps": 2770, "total_steps": 6250, "loss": 0.6361, "learning_rate": 2.943742459160354e-05, "epoch": 0.4432, "percentage": 44.32, "elapsed_time": "4:59:29", "remaining_time": "6:16:15", "throughput": 825.09, "total_tokens": 14826624} {"current_steps": 2775, "total_steps": 6250, "loss": 0.6062, "learning_rate": 2.9375576474381905e-05, "epoch": 0.444, "percentage": 44.4, "elapsed_time": "4:59:56", "remaining_time": "6:15:36", "throughput": 825.68, "total_tokens": 14859392} {"current_steps": 2780, "total_steps": 6250, "loss": 0.7882, "learning_rate": 2.9313700718641167e-05, "epoch": 0.4448, "percentage": 44.48, "elapsed_time": "5:00:18", "remaining_time": "6:14:51", "throughput": 825.93, "total_tokens": 14882336} {"current_steps": 2785, "total_steps": 6250, "loss": 0.7978, "learning_rate": 2.925179771522223e-05, "epoch": 0.4456, "percentage": 44.56, "elapsed_time": "5:00:42", "remaining_time": "6:14:08", "throughput": 826.44, "total_tokens": 14911312} {"current_steps": 2790, "total_steps": 6250, "loss": 0.6835, "learning_rate": 2.9189867855138103e-05, "epoch": 0.4464, "percentage": 44.64, "elapsed_time": "5:01:05", "remaining_time": "6:13:23", "throughput": 826.9, "total_tokens": 14938400} {"current_steps": 2795, "total_steps": 6250, "loss": 0.6566, "learning_rate": 2.912791152957145e-05, "epoch": 0.4472, "percentage": 44.72, "elapsed_time": "5:01:31", "remaining_time": "6:12:43", "throughput": 827.22, "total_tokens": 14965424} {"current_steps": 2800, "total_steps": 6250, "loss": 0.6616, "learning_rate": 2.9065929129872094e-05, "epoch": 0.448, "percentage": 44.8, "elapsed_time": "5:01:55", "remaining_time": "6:12:01", "throughput": 827.69, "total_tokens": 14994368} {"current_steps": 2805, "total_steps": 6250, "loss": 0.8051, "learning_rate": 2.900392104755455e-05, "epoch": 0.4488, "percentage": 44.88, "elapsed_time": "5:02:17", "remaining_time": "6:11:16", "throughput": 828.02, "total_tokens": 15018480} {"current_steps": 2810, "total_steps": 6250, "loss": 0.6961, "learning_rate": 2.894188767429557e-05, "epoch": 0.4496, "percentage": 44.96, "elapsed_time": "5:02:46", "remaining_time": "6:10:39", "throughput": 828.23, "total_tokens": 15045840} {"current_steps": 2815, "total_steps": 6250, "loss": 0.6898, "learning_rate": 2.8879829401931652e-05, "epoch": 0.4504, "percentage": 45.04, "elapsed_time": "5:03:06", "remaining_time": "6:09:52", "throughput": 828.67, "total_tokens": 15070832} {"current_steps": 2820, "total_steps": 6250, "loss": 0.6789, "learning_rate": 2.881774662245658e-05, "epoch": 0.4512, "percentage": 45.12, "elapsed_time": "5:03:29", "remaining_time": "6:09:08", "throughput": 829.07, "total_tokens": 15097008} {"current_steps": 2825, "total_steps": 6250, "loss": 0.6684, "learning_rate": 2.875563972801893e-05, "epoch": 0.452, "percentage": 45.2, "elapsed_time": "5:03:49", "remaining_time": "6:08:21", "throughput": 829.41, "total_tokens": 15120080} {"current_steps": 2830, "total_steps": 6250, "loss": 0.6577, "learning_rate": 2.8693509110919598e-05, "epoch": 0.4528, "percentage": 45.28, "elapsed_time": "5:04:14", "remaining_time": "6:07:40", "throughput": 829.64, "total_tokens": 15144976} {"current_steps": 2835, "total_steps": 6250, "loss": 0.7893, "learning_rate": 2.863135516360932e-05, "epoch": 0.4536, "percentage": 45.36, "elapsed_time": "5:04:37", "remaining_time": "6:06:56", "throughput": 830.24, "total_tokens": 15174640} {"current_steps": 2840, "total_steps": 6250, "loss": 0.7377, "learning_rate": 2.856917827868622e-05, "epoch": 0.4544, "percentage": 45.44, "elapsed_time": "5:04:58", "remaining_time": "6:06:11", "throughput": 830.55, "total_tokens": 15198128} {"current_steps": 2845, "total_steps": 6250, "loss": 0.821, "learning_rate": 2.8506978848893302e-05, "epoch": 0.4552, "percentage": 45.52, "elapsed_time": "5:05:19", "remaining_time": "6:05:25", "throughput": 830.94, "total_tokens": 15222224} {"current_steps": 2850, "total_steps": 6250, "loss": 0.695, "learning_rate": 2.844475726711595e-05, "epoch": 0.456, "percentage": 45.6, "elapsed_time": "5:05:41", "remaining_time": "6:04:40", "throughput": 831.28, "total_tokens": 15246640} {"current_steps": 2855, "total_steps": 6250, "loss": 0.7175, "learning_rate": 2.8382513926379504e-05, "epoch": 0.4568, "percentage": 45.68, "elapsed_time": "5:06:03", "remaining_time": "6:03:56", "throughput": 831.97, "total_tokens": 15277728} {"current_steps": 2860, "total_steps": 6250, "loss": 0.6505, "learning_rate": 2.832024921984674e-05, "epoch": 0.4576, "percentage": 45.76, "elapsed_time": "5:06:31", "remaining_time": "6:03:19", "throughput": 832.29, "total_tokens": 15307040} {"current_steps": 2865, "total_steps": 6250, "loss": 0.6686, "learning_rate": 2.825796354081537e-05, "epoch": 0.4584, "percentage": 45.84, "elapsed_time": "5:06:58", "remaining_time": "6:02:40", "throughput": 832.56, "total_tokens": 15334176} {"current_steps": 2870, "total_steps": 6250, "loss": 0.6365, "learning_rate": 2.8195657282715594e-05, "epoch": 0.4592, "percentage": 45.92, "elapsed_time": "5:07:21", "remaining_time": "6:01:58", "throughput": 832.95, "total_tokens": 15360496} {"current_steps": 2875, "total_steps": 6250, "loss": 0.6518, "learning_rate": 2.8133330839107608e-05, "epoch": 0.46, "percentage": 46.0, "elapsed_time": "5:07:42", "remaining_time": "6:01:13", "throughput": 833.11, "total_tokens": 15381328} {"current_steps": 2880, "total_steps": 6250, "loss": 0.6262, "learning_rate": 2.8070984603679107e-05, "epoch": 0.4608, "percentage": 46.08, "elapsed_time": "5:08:09", "remaining_time": "6:00:34", "throughput": 833.46, "total_tokens": 15409936} {"current_steps": 2885, "total_steps": 6250, "loss": 0.6684, "learning_rate": 2.800861897024279e-05, "epoch": 0.4616, "percentage": 46.16, "elapsed_time": "5:08:32", "remaining_time": "5:59:52", "throughput": 833.87, "total_tokens": 15436848} {"current_steps": 2890, "total_steps": 6250, "loss": 0.6978, "learning_rate": 2.79462343327339e-05, "epoch": 0.4624, "percentage": 46.24, "elapsed_time": "5:08:54", "remaining_time": "5:59:09", "throughput": 834.28, "total_tokens": 15463328} {"current_steps": 2895, "total_steps": 6250, "loss": 0.7062, "learning_rate": 2.7883831085207707e-05, "epoch": 0.4632, "percentage": 46.32, "elapsed_time": "5:09:16", "remaining_time": "5:58:24", "throughput": 834.72, "total_tokens": 15489232} {"current_steps": 2900, "total_steps": 6250, "loss": 0.6642, "learning_rate": 2.782140962183704e-05, "epoch": 0.464, "percentage": 46.4, "elapsed_time": "5:09:39", "remaining_time": "5:57:42", "throughput": 835.11, "total_tokens": 15516224} {"current_steps": 2905, "total_steps": 6250, "loss": 0.6287, "learning_rate": 2.7758970336909795e-05, "epoch": 0.4648, "percentage": 46.48, "elapsed_time": "5:10:04", "remaining_time": "5:57:02", "throughput": 835.58, "total_tokens": 15545584} {"current_steps": 2910, "total_steps": 6250, "loss": 0.6672, "learning_rate": 2.769651362482642e-05, "epoch": 0.4656, "percentage": 46.56, "elapsed_time": "5:10:27", "remaining_time": "5:56:20", "throughput": 835.91, "total_tokens": 15571216} {"current_steps": 2915, "total_steps": 6250, "loss": 0.737, "learning_rate": 2.763403988009746e-05, "epoch": 0.4664, "percentage": 46.64, "elapsed_time": "5:10:50", "remaining_time": "5:55:37", "throughput": 836.32, "total_tokens": 15597744} {"current_steps": 2920, "total_steps": 6250, "loss": 0.7715, "learning_rate": 2.7571549497341042e-05, "epoch": 0.4672, "percentage": 46.72, "elapsed_time": "5:11:14", "remaining_time": "5:54:56", "throughput": 836.57, "total_tokens": 15622496} {"current_steps": 2925, "total_steps": 6250, "loss": 0.7435, "learning_rate": 2.7509042871280372e-05, "epoch": 0.468, "percentage": 46.8, "elapsed_time": "5:11:39", "remaining_time": "5:54:17", "throughput": 836.76, "total_tokens": 15647344} {"current_steps": 2930, "total_steps": 6250, "loss": 0.6946, "learning_rate": 2.744652039674129e-05, "epoch": 0.4688, "percentage": 46.88, "elapsed_time": "5:12:03", "remaining_time": "5:53:35", "throughput": 837.07, "total_tokens": 15672672} {"current_steps": 2935, "total_steps": 6250, "loss": 0.7523, "learning_rate": 2.7383982468649714e-05, "epoch": 0.4696, "percentage": 46.96, "elapsed_time": "5:12:25", "remaining_time": "5:52:52", "throughput": 837.34, "total_tokens": 15696144} {"current_steps": 2940, "total_steps": 6250, "loss": 0.7218, "learning_rate": 2.73214294820292e-05, "epoch": 0.4704, "percentage": 47.04, "elapsed_time": "5:12:47", "remaining_time": "5:52:08", "throughput": 837.83, "total_tokens": 15723600} {"current_steps": 2945, "total_steps": 6250, "loss": 0.6736, "learning_rate": 2.7258861831998388e-05, "epoch": 0.4712, "percentage": 47.12, "elapsed_time": "5:13:10", "remaining_time": "5:51:27", "throughput": 838.17, "total_tokens": 15749680} {"current_steps": 2950, "total_steps": 6250, "loss": 0.6314, "learning_rate": 2.7196279913768584e-05, "epoch": 0.472, "percentage": 47.2, "elapsed_time": "5:13:35", "remaining_time": "5:50:48", "throughput": 838.49, "total_tokens": 15776768} {"current_steps": 2955, "total_steps": 6250, "loss": 0.7035, "learning_rate": 2.713368412264118e-05, "epoch": 0.4728, "percentage": 47.28, "elapsed_time": "5:14:02", "remaining_time": "5:50:10", "throughput": 838.6, "total_tokens": 15801376} {"current_steps": 2960, "total_steps": 6250, "loss": 0.6785, "learning_rate": 2.707107485400521e-05, "epoch": 0.4736, "percentage": 47.36, "elapsed_time": "5:14:28", "remaining_time": "5:49:32", "throughput": 838.87, "total_tokens": 15828416} {"current_steps": 2965, "total_steps": 6250, "loss": 0.7672, "learning_rate": 2.7008452503334858e-05, "epoch": 0.4744, "percentage": 47.44, "elapsed_time": "5:14:55", "remaining_time": "5:48:54", "throughput": 838.98, "total_tokens": 15852720} {"current_steps": 2970, "total_steps": 6250, "loss": 0.7723, "learning_rate": 2.6945817466186912e-05, "epoch": 0.4752, "percentage": 47.52, "elapsed_time": "5:15:24", "remaining_time": "5:48:20", "throughput": 839.15, "total_tokens": 15880624} {"current_steps": 2975, "total_steps": 6250, "loss": 0.6105, "learning_rate": 2.6883170138198323e-05, "epoch": 0.476, "percentage": 47.6, "elapsed_time": "5:15:56", "remaining_time": "5:47:48", "throughput": 839.38, "total_tokens": 15912176} {"current_steps": 2980, "total_steps": 6250, "loss": 0.6941, "learning_rate": 2.6820510915083648e-05, "epoch": 0.4768, "percentage": 47.68, "elapsed_time": "5:16:32", "remaining_time": "5:47:21", "throughput": 839.5, "total_tokens": 15944384} {"current_steps": 2985, "total_steps": 6250, "loss": 0.6669, "learning_rate": 2.6757840192632598e-05, "epoch": 0.4776, "percentage": 47.76, "elapsed_time": "5:16:57", "remaining_time": "5:46:41", "throughput": 839.72, "total_tokens": 15969680} {"current_steps": 2990, "total_steps": 6250, "loss": 0.6814, "learning_rate": 2.6695158366707522e-05, "epoch": 0.4784, "percentage": 47.84, "elapsed_time": "5:17:26", "remaining_time": "5:46:06", "throughput": 839.91, "total_tokens": 15997264} {"current_steps": 2995, "total_steps": 6250, "loss": 0.5641, "learning_rate": 2.6632465833240893e-05, "epoch": 0.4792, "percentage": 47.92, "elapsed_time": "5:17:58", "remaining_time": "5:45:34", "throughput": 840.21, "total_tokens": 16029664} {"current_steps": 3000, "total_steps": 6250, "loss": 0.7797, "learning_rate": 2.656976298823284e-05, "epoch": 0.48, "percentage": 48.0, "elapsed_time": "5:18:22", "remaining_time": "5:44:54", "throughput": 840.44, "total_tokens": 16054864} {"current_steps": 3005, "total_steps": 6250, "loss": 0.6778, "learning_rate": 2.650705022774859e-05, "epoch": 0.4808, "percentage": 48.08, "elapsed_time": "5:18:47", "remaining_time": "5:44:15", "throughput": 840.64, "total_tokens": 16079552} {"current_steps": 3010, "total_steps": 6250, "loss": 0.6806, "learning_rate": 2.6444327947916036e-05, "epoch": 0.4816, "percentage": 48.16, "elapsed_time": "5:19:13", "remaining_time": "5:43:37", "throughput": 840.86, "total_tokens": 16105632} {"current_steps": 3015, "total_steps": 6250, "loss": 0.7589, "learning_rate": 2.638159654492318e-05, "epoch": 0.4824, "percentage": 48.24, "elapsed_time": "5:19:39", "remaining_time": "5:42:59", "throughput": 841.24, "total_tokens": 16134688} {"current_steps": 3020, "total_steps": 6250, "loss": 0.677, "learning_rate": 2.6318856415015664e-05, "epoch": 0.4832, "percentage": 48.32, "elapsed_time": "5:20:02", "remaining_time": "5:42:17", "throughput": 841.72, "total_tokens": 16163152} {"current_steps": 3025, "total_steps": 6250, "loss": 0.6136, "learning_rate": 2.6256107954494242e-05, "epoch": 0.484, "percentage": 48.4, "elapsed_time": "5:20:26", "remaining_time": "5:41:37", "throughput": 842.04, "total_tokens": 16189248} {"current_steps": 3030, "total_steps": 6250, "loss": 0.6369, "learning_rate": 2.6193351559712292e-05, "epoch": 0.4848, "percentage": 48.48, "elapsed_time": "5:20:51", "remaining_time": "5:40:58", "throughput": 842.26, "total_tokens": 16214832} {"current_steps": 3035, "total_steps": 6250, "loss": 0.7202, "learning_rate": 2.6130587627073315e-05, "epoch": 0.4856, "percentage": 48.56, "elapsed_time": "5:21:19", "remaining_time": "5:40:23", "throughput": 842.57, "total_tokens": 16244736} {"current_steps": 3040, "total_steps": 6250, "loss": 0.7057, "learning_rate": 2.606781655302843e-05, "epoch": 0.4864, "percentage": 48.64, "elapsed_time": "5:21:43", "remaining_time": "5:39:42", "throughput": 842.98, "total_tokens": 16272064} {"current_steps": 3045, "total_steps": 6250, "loss": 0.6715, "learning_rate": 2.6005038734073833e-05, "epoch": 0.4872, "percentage": 48.72, "elapsed_time": "5:22:11", "remaining_time": "5:39:07", "throughput": 843.24, "total_tokens": 16301344} {"current_steps": 3050, "total_steps": 6250, "loss": 0.7479, "learning_rate": 2.594225456674837e-05, "epoch": 0.488, "percentage": 48.8, "elapsed_time": "5:22:35", "remaining_time": "5:38:27", "throughput": 843.46, "total_tokens": 16325872} {"current_steps": 3055, "total_steps": 6250, "loss": 0.6581, "learning_rate": 2.5879464447630946e-05, "epoch": 0.4888, "percentage": 48.88, "elapsed_time": "5:22:59", "remaining_time": "5:37:47", "throughput": 843.81, "total_tokens": 16352272} {"current_steps": 3060, "total_steps": 6250, "loss": 0.691, "learning_rate": 2.5816668773338098e-05, "epoch": 0.4896, "percentage": 48.96, "elapsed_time": "5:23:26", "remaining_time": "5:37:11", "throughput": 844.06, "total_tokens": 16380464} {"current_steps": 3065, "total_steps": 6250, "loss": 0.6606, "learning_rate": 2.575386794052142e-05, "epoch": 0.4904, "percentage": 49.04, "elapsed_time": "5:23:50", "remaining_time": "5:36:31", "throughput": 844.48, "total_tokens": 16408736} {"current_steps": 3070, "total_steps": 6250, "loss": 0.729, "learning_rate": 2.569106234586511e-05, "epoch": 0.4912, "percentage": 49.12, "elapsed_time": "5:24:12", "remaining_time": "5:35:49", "throughput": 844.93, "total_tokens": 16436352} {"current_steps": 3075, "total_steps": 6250, "loss": 0.7137, "learning_rate": 2.562825238608344e-05, "epoch": 0.492, "percentage": 49.2, "elapsed_time": "5:24:37", "remaining_time": "5:35:11", "throughput": 845.29, "total_tokens": 16464624} {"current_steps": 3080, "total_steps": 6250, "loss": 0.7238, "learning_rate": 2.5565438457918244e-05, "epoch": 0.4928, "percentage": 49.28, "elapsed_time": "5:25:07", "remaining_time": "5:34:37", "throughput": 845.67, "total_tokens": 16496720} {"current_steps": 3085, "total_steps": 6250, "loss": 0.7019, "learning_rate": 2.5502620958136443e-05, "epoch": 0.4936, "percentage": 49.36, "elapsed_time": "5:25:30", "remaining_time": "5:33:57", "throughput": 846.05, "total_tokens": 16524208} {"current_steps": 3090, "total_steps": 6250, "loss": 0.5851, "learning_rate": 2.5439800283527494e-05, "epoch": 0.4944, "percentage": 49.44, "elapsed_time": "5:25:55", "remaining_time": "5:33:18", "throughput": 846.4, "total_tokens": 16552192} {"current_steps": 3095, "total_steps": 6250, "loss": 0.7357, "learning_rate": 2.537697683090093e-05, "epoch": 0.4952, "percentage": 49.52, "elapsed_time": "5:26:21", "remaining_time": "5:32:40", "throughput": 846.64, "total_tokens": 16578144} {"current_steps": 3100, "total_steps": 6250, "loss": 0.6254, "learning_rate": 2.531415099708382e-05, "epoch": 0.496, "percentage": 49.6, "elapsed_time": "5:26:48", "remaining_time": "5:32:04", "throughput": 847.0, "total_tokens": 16608288} {"current_steps": 3105, "total_steps": 6250, "loss": 0.7284, "learning_rate": 2.5251323178918268e-05, "epoch": 0.4968, "percentage": 49.68, "elapsed_time": "5:27:13", "remaining_time": "5:31:26", "throughput": 847.35, "total_tokens": 16636176} {"current_steps": 3110, "total_steps": 6250, "loss": 0.8136, "learning_rate": 2.518849377325893e-05, "epoch": 0.4976, "percentage": 49.76, "elapsed_time": "5:27:37", "remaining_time": "5:30:46", "throughput": 847.48, "total_tokens": 16659168} {"current_steps": 3115, "total_steps": 6250, "loss": 0.7334, "learning_rate": 2.5125663176970476e-05, "epoch": 0.4984, "percentage": 49.84, "elapsed_time": "5:27:59", "remaining_time": "5:30:06", "throughput": 847.94, "total_tokens": 16687344} {"current_steps": 3120, "total_steps": 6250, "loss": 0.7599, "learning_rate": 2.5062831786925102e-05, "epoch": 0.4992, "percentage": 49.92, "elapsed_time": "5:28:24", "remaining_time": "5:29:27", "throughput": 848.26, "total_tokens": 16714496} {"current_steps": 3125, "total_steps": 6250, "loss": 0.6517, "learning_rate": 2.5e-05, "epoch": 0.5, "percentage": 50.0, "elapsed_time": "5:28:49", "remaining_time": "5:28:49", "throughput": 848.59, "total_tokens": 16742528} {"current_steps": 3130, "total_steps": 6250, "loss": 0.6778, "learning_rate": 2.4937168213074907e-05, "epoch": 0.5008, "percentage": 50.08, "elapsed_time": "5:29:14", "remaining_time": "5:28:11", "throughput": 848.99, "total_tokens": 16771248} {"current_steps": 3135, "total_steps": 6250, "loss": 0.6847, "learning_rate": 2.4874336823029526e-05, "epoch": 0.5016, "percentage": 50.16, "elapsed_time": "5:29:38", "remaining_time": "5:27:32", "throughput": 849.35, "total_tokens": 16799136} {"current_steps": 3140, "total_steps": 6250, "loss": 0.6638, "learning_rate": 2.481150622674108e-05, "epoch": 0.5024, "percentage": 50.24, "elapsed_time": "5:30:02", "remaining_time": "5:26:53", "throughput": 849.65, "total_tokens": 16825648} {"current_steps": 3145, "total_steps": 6250, "loss": 0.7139, "learning_rate": 2.4748676821081738e-05, "epoch": 0.5032, "percentage": 50.32, "elapsed_time": "5:30:27", "remaining_time": "5:26:15", "throughput": 849.95, "total_tokens": 16852240} {"current_steps": 3150, "total_steps": 6250, "loss": 0.7507, "learning_rate": 2.4685849002916183e-05, "epoch": 0.504, "percentage": 50.4, "elapsed_time": "5:30:50", "remaining_time": "5:25:35", "throughput": 850.3, "total_tokens": 16878624} {"current_steps": 3155, "total_steps": 6250, "loss": 0.6951, "learning_rate": 2.4623023169099073e-05, "epoch": 0.5048, "percentage": 50.48, "elapsed_time": "5:31:17", "remaining_time": "5:24:59", "throughput": 850.56, "total_tokens": 16906864} {"current_steps": 3160, "total_steps": 6250, "loss": 0.733, "learning_rate": 2.4560199716472508e-05, "epoch": 0.5056, "percentage": 50.56, "elapsed_time": "5:31:38", "remaining_time": "5:24:17", "throughput": 850.83, "total_tokens": 16930080} {"current_steps": 3165, "total_steps": 6250, "loss": 0.7517, "learning_rate": 2.449737904186357e-05, "epoch": 0.5064, "percentage": 50.64, "elapsed_time": "5:32:00", "remaining_time": "5:23:36", "throughput": 851.0, "total_tokens": 16952240} {"current_steps": 3170, "total_steps": 6250, "loss": 0.7472, "learning_rate": 2.4434561542081762e-05, "epoch": 0.5072, "percentage": 50.72, "elapsed_time": "5:32:27", "remaining_time": "5:23:01", "throughput": 851.5, "total_tokens": 16985408} {"current_steps": 3175, "total_steps": 6250, "loss": 0.7514, "learning_rate": 2.4371747613916566e-05, "epoch": 0.508, "percentage": 50.8, "elapsed_time": "5:32:53", "remaining_time": "5:22:24", "throughput": 851.8, "total_tokens": 17013776} {"current_steps": 3180, "total_steps": 6250, "loss": 0.7633, "learning_rate": 2.4308937654134893e-05, "epoch": 0.5088, "percentage": 50.88, "elapsed_time": "5:33:15", "remaining_time": "5:21:44", "throughput": 852.13, "total_tokens": 17039120} {"current_steps": 3185, "total_steps": 6250, "loss": 0.6606, "learning_rate": 2.4246132059478578e-05, "epoch": 0.5096, "percentage": 50.96, "elapsed_time": "5:33:40", "remaining_time": "5:21:05", "throughput": 852.4, "total_tokens": 17065296} {"current_steps": 3190, "total_steps": 6250, "loss": 0.764, "learning_rate": 2.418333122666191e-05, "epoch": 0.5104, "percentage": 51.04, "elapsed_time": "5:34:02", "remaining_time": "5:20:25", "throughput": 852.64, "total_tokens": 17089264} {"current_steps": 3195, "total_steps": 6250, "loss": 0.751, "learning_rate": 2.412053555236906e-05, "epoch": 0.5112, "percentage": 51.12, "elapsed_time": "5:34:30", "remaining_time": "5:19:51", "throughput": 852.86, "total_tokens": 17117488} {"current_steps": 3200, "total_steps": 6250, "loss": 0.7067, "learning_rate": 2.4057745433251635e-05, "epoch": 0.512, "percentage": 51.2, "elapsed_time": "5:34:54", "remaining_time": "5:19:12", "throughput": 853.02, "total_tokens": 17141232} {"current_steps": 3205, "total_steps": 6250, "loss": 0.6432, "learning_rate": 2.3994961265926166e-05, "epoch": 0.5128, "percentage": 51.28, "elapsed_time": "5:35:20", "remaining_time": "5:18:36", "throughput": 853.42, "total_tokens": 17171632} {"current_steps": 3210, "total_steps": 6250, "loss": 0.6373, "learning_rate": 2.3932183446971583e-05, "epoch": 0.5136, "percentage": 51.36, "elapsed_time": "5:35:46", "remaining_time": "5:17:59", "throughput": 853.66, "total_tokens": 17198640} {"current_steps": 3215, "total_steps": 6250, "loss": 0.7347, "learning_rate": 2.3869412372926687e-05, "epoch": 0.5144, "percentage": 51.44, "elapsed_time": "5:36:09", "remaining_time": "5:17:20", "throughput": 854.17, "total_tokens": 17228240} {"current_steps": 3220, "total_steps": 6250, "loss": 0.6789, "learning_rate": 2.3806648440287714e-05, "epoch": 0.5152, "percentage": 51.52, "elapsed_time": "5:36:34", "remaining_time": "5:16:42", "throughput": 854.67, "total_tokens": 17259392} {"current_steps": 3225, "total_steps": 6250, "loss": 0.7548, "learning_rate": 2.3743892045505764e-05, "epoch": 0.516, "percentage": 51.6, "elapsed_time": "5:36:58", "remaining_time": "5:16:05", "throughput": 855.03, "total_tokens": 17287808} {"current_steps": 3230, "total_steps": 6250, "loss": 0.7792, "learning_rate": 2.368114358498434e-05, "epoch": 0.5168, "percentage": 51.68, "elapsed_time": "5:37:20", "remaining_time": "5:15:24", "throughput": 855.28, "total_tokens": 17311520} {"current_steps": 3235, "total_steps": 6250, "loss": 0.6575, "learning_rate": 2.361840345507683e-05, "epoch": 0.5176, "percentage": 51.76, "elapsed_time": "5:37:45", "remaining_time": "5:14:47", "throughput": 855.67, "total_tokens": 17340816} {"current_steps": 3240, "total_steps": 6250, "loss": 0.6414, "learning_rate": 2.355567205208397e-05, "epoch": 0.5184, "percentage": 51.84, "elapsed_time": "5:38:07", "remaining_time": "5:14:07", "throughput": 855.86, "total_tokens": 17363408} {"current_steps": 3245, "total_steps": 6250, "loss": 0.7161, "learning_rate": 2.3492949772251414e-05, "epoch": 0.5192, "percentage": 51.92, "elapsed_time": "5:38:28", "remaining_time": "5:13:26", "throughput": 856.46, "total_tokens": 17393248} {"current_steps": 3250, "total_steps": 6250, "loss": 0.6957, "learning_rate": 2.3430237011767167e-05, "epoch": 0.52, "percentage": 52.0, "elapsed_time": "5:38:51", "remaining_time": "5:12:47", "throughput": 857.05, "total_tokens": 17425232} {"current_steps": 3255, "total_steps": 6250, "loss": 0.7615, "learning_rate": 2.3367534166759102e-05, "epoch": 0.5208, "percentage": 52.08, "elapsed_time": "5:39:13", "remaining_time": "5:12:07", "throughput": 857.2, "total_tokens": 17446864} {"current_steps": 3260, "total_steps": 6250, "loss": 0.6994, "learning_rate": 2.3304841633292487e-05, "epoch": 0.5216, "percentage": 52.16, "elapsed_time": "5:39:36", "remaining_time": "5:11:28", "throughput": 857.42, "total_tokens": 17470896} {"current_steps": 3265, "total_steps": 6250, "loss": 0.7116, "learning_rate": 2.3242159807367408e-05, "epoch": 0.5224, "percentage": 52.24, "elapsed_time": "5:40:00", "remaining_time": "5:10:50", "throughput": 857.91, "total_tokens": 17501488} {"current_steps": 3270, "total_steps": 6250, "loss": 0.7583, "learning_rate": 2.3179489084916358e-05, "epoch": 0.5232, "percentage": 52.32, "elapsed_time": "5:40:21", "remaining_time": "5:10:10", "throughput": 858.2, "total_tokens": 17526032} {"current_steps": 3275, "total_steps": 6250, "loss": 0.7302, "learning_rate": 2.3116829861801686e-05, "epoch": 0.524, "percentage": 52.4, "elapsed_time": "5:40:43", "remaining_time": "5:09:30", "throughput": 858.46, "total_tokens": 17550144} {"current_steps": 3280, "total_steps": 6250, "loss": 0.6794, "learning_rate": 2.3054182533813087e-05, "epoch": 0.5248, "percentage": 52.48, "elapsed_time": "5:41:06", "remaining_time": "5:08:52", "throughput": 858.73, "total_tokens": 17575600} {"current_steps": 3285, "total_steps": 6250, "loss": 0.7294, "learning_rate": 2.2991547496665148e-05, "epoch": 0.5256, "percentage": 52.56, "elapsed_time": "5:41:30", "remaining_time": "5:08:14", "throughput": 859.01, "total_tokens": 17601408} {"current_steps": 3290, "total_steps": 6250, "loss": 0.6333, "learning_rate": 2.2928925145994794e-05, "epoch": 0.5264, "percentage": 52.64, "elapsed_time": "5:41:50", "remaining_time": "5:07:33", "throughput": 859.28, "total_tokens": 17624752} {"current_steps": 3295, "total_steps": 6250, "loss": 0.7779, "learning_rate": 2.286631587735883e-05, "epoch": 0.5272, "percentage": 52.72, "elapsed_time": "5:42:13", "remaining_time": "5:06:54", "throughput": 859.64, "total_tokens": 17651040} {"current_steps": 3300, "total_steps": 6250, "loss": 0.7035, "learning_rate": 2.280372008623142e-05, "epoch": 0.528, "percentage": 52.8, "elapsed_time": "5:42:36", "remaining_time": "5:06:16", "throughput": 859.99, "total_tokens": 17678288} {"current_steps": 3305, "total_steps": 6250, "loss": 0.719, "learning_rate": 2.2741138168001608e-05, "epoch": 0.5288, "percentage": 52.88, "elapsed_time": "5:42:59", "remaining_time": "5:05:38", "throughput": 860.2, "total_tokens": 17702816} {"current_steps": 3310, "total_steps": 6250, "loss": 0.7134, "learning_rate": 2.267857051797081e-05, "epoch": 0.5296, "percentage": 52.96, "elapsed_time": "5:43:21", "remaining_time": "5:04:58", "throughput": 860.56, "total_tokens": 17728848} {"current_steps": 3315, "total_steps": 6250, "loss": 0.6916, "learning_rate": 2.2616017531350288e-05, "epoch": 0.5304, "percentage": 53.04, "elapsed_time": "5:43:44", "remaining_time": "5:04:20", "throughput": 860.92, "total_tokens": 17756240} {"current_steps": 3320, "total_steps": 6250, "loss": 0.6389, "learning_rate": 2.255347960325871e-05, "epoch": 0.5312, "percentage": 53.12, "elapsed_time": "5:44:06", "remaining_time": "5:03:41", "throughput": 861.21, "total_tokens": 17781104} {"current_steps": 3325, "total_steps": 6250, "loss": 0.6648, "learning_rate": 2.2490957128719624e-05, "epoch": 0.532, "percentage": 53.2, "elapsed_time": "5:44:28", "remaining_time": "5:03:02", "throughput": 861.64, "total_tokens": 17808816} {"current_steps": 3330, "total_steps": 6250, "loss": 0.6683, "learning_rate": 2.2428450502658967e-05, "epoch": 0.5328, "percentage": 53.28, "elapsed_time": "5:44:51", "remaining_time": "5:02:24", "throughput": 861.91, "total_tokens": 17834496} {"current_steps": 3335, "total_steps": 6250, "loss": 0.7686, "learning_rate": 2.2365960119902545e-05, "epoch": 0.5336, "percentage": 53.36, "elapsed_time": "5:45:13", "remaining_time": "5:01:45", "throughput": 862.37, "total_tokens": 17862880} {"current_steps": 3340, "total_steps": 6250, "loss": 0.7073, "learning_rate": 2.2303486375173585e-05, "epoch": 0.5344, "percentage": 53.44, "elapsed_time": "5:45:34", "remaining_time": "5:01:04", "throughput": 862.83, "total_tokens": 17890064} {"current_steps": 3345, "total_steps": 6250, "loss": 0.642, "learning_rate": 2.224102966309021e-05, "epoch": 0.5352, "percentage": 53.52, "elapsed_time": "5:45:56", "remaining_time": "5:00:26", "throughput": 863.26, "total_tokens": 17918144} {"current_steps": 3350, "total_steps": 6250, "loss": 0.7078, "learning_rate": 2.217859037816296e-05, "epoch": 0.536, "percentage": 53.6, "elapsed_time": "5:46:19", "remaining_time": "4:59:48", "throughput": 863.59, "total_tokens": 17945344} {"current_steps": 3355, "total_steps": 6250, "loss": 0.7437, "learning_rate": 2.2116168914792292e-05, "epoch": 0.5368, "percentage": 53.68, "elapsed_time": "5:46:39", "remaining_time": "4:59:08", "throughput": 863.95, "total_tokens": 17970096} {"current_steps": 3360, "total_steps": 6250, "loss": 0.7606, "learning_rate": 2.205376566726611e-05, "epoch": 0.5376, "percentage": 53.76, "elapsed_time": "5:47:01", "remaining_time": "4:58:28", "throughput": 864.38, "total_tokens": 17997328} {"current_steps": 3365, "total_steps": 6250, "loss": 0.6824, "learning_rate": 2.1991381029757215e-05, "epoch": 0.5384, "percentage": 53.84, "elapsed_time": "5:47:22", "remaining_time": "4:57:49", "throughput": 864.68, "total_tokens": 18022464} {"current_steps": 3370, "total_steps": 6250, "loss": 0.7262, "learning_rate": 2.19290153963209e-05, "epoch": 0.5392, "percentage": 53.92, "elapsed_time": "5:47:47", "remaining_time": "4:57:13", "throughput": 865.07, "total_tokens": 18052176} {"current_steps": 3375, "total_steps": 6250, "loss": 0.7491, "learning_rate": 2.186666916089239e-05, "epoch": 0.54, "percentage": 54.0, "elapsed_time": "5:48:11", "remaining_time": "4:56:36", "throughput": 865.39, "total_tokens": 18079008} {"current_steps": 3380, "total_steps": 6250, "loss": 0.6246, "learning_rate": 2.1804342717284415e-05, "epoch": 0.5408, "percentage": 54.08, "elapsed_time": "5:48:33", "remaining_time": "4:55:57", "throughput": 865.61, "total_tokens": 18102784} {"current_steps": 3385, "total_steps": 6250, "loss": 0.6712, "learning_rate": 2.174203645918464e-05, "epoch": 0.5416, "percentage": 54.16, "elapsed_time": "5:48:56", "remaining_time": "4:55:19", "throughput": 866.0, "total_tokens": 18130688} {"current_steps": 3390, "total_steps": 6250, "loss": 0.7238, "learning_rate": 2.1679750780153267e-05, "epoch": 0.5424, "percentage": 54.24, "elapsed_time": "5:49:18", "remaining_time": "4:54:41", "throughput": 866.45, "total_tokens": 18159200} {"current_steps": 3395, "total_steps": 6250, "loss": 0.663, "learning_rate": 2.1617486073620498e-05, "epoch": 0.5432, "percentage": 54.32, "elapsed_time": "5:49:45", "remaining_time": "4:54:08", "throughput": 866.71, "total_tokens": 18188736} {"current_steps": 3400, "total_steps": 6250, "loss": 0.6928, "learning_rate": 2.155524273288405e-05, "epoch": 0.544, "percentage": 54.4, "elapsed_time": "5:50:13", "remaining_time": "4:53:33", "throughput": 866.98, "total_tokens": 18217856} {"current_steps": 3405, "total_steps": 6250, "loss": 0.7373, "learning_rate": 2.1493021151106703e-05, "epoch": 0.5448, "percentage": 54.48, "elapsed_time": "5:50:39", "remaining_time": "4:52:59", "throughput": 867.3, "total_tokens": 18247616} {"current_steps": 3410, "total_steps": 6250, "loss": 0.7593, "learning_rate": 2.1430821721313782e-05, "epoch": 0.5456, "percentage": 54.56, "elapsed_time": "5:51:00", "remaining_time": "4:52:20", "throughput": 867.7, "total_tokens": 18274416} {"current_steps": 3415, "total_steps": 6250, "loss": 0.6718, "learning_rate": 2.1368644836390684e-05, "epoch": 0.5464, "percentage": 54.64, "elapsed_time": "5:51:21", "remaining_time": "4:51:40", "throughput": 868.02, "total_tokens": 18298720} {"current_steps": 3420, "total_steps": 6250, "loss": 0.7303, "learning_rate": 2.130649088908041e-05, "epoch": 0.5472, "percentage": 54.72, "elapsed_time": "5:51:42", "remaining_time": "4:51:01", "throughput": 868.44, "total_tokens": 18326160} {"current_steps": 3425, "total_steps": 6250, "loss": 0.74, "learning_rate": 2.1244360271981073e-05, "epoch": 0.548, "percentage": 54.8, "elapsed_time": "5:52:06", "remaining_time": "4:50:25", "throughput": 868.63, "total_tokens": 18351344} {"current_steps": 3430, "total_steps": 6250, "loss": 0.6448, "learning_rate": 2.1182253377543425e-05, "epoch": 0.5488, "percentage": 54.88, "elapsed_time": "5:52:28", "remaining_time": "4:49:47", "throughput": 868.83, "total_tokens": 18374752} {"current_steps": 3435, "total_steps": 6250, "loss": 0.6759, "learning_rate": 2.112017059806835e-05, "epoch": 0.5496, "percentage": 54.96, "elapsed_time": "5:52:53", "remaining_time": "4:49:11", "throughput": 869.14, "total_tokens": 18402432} {"current_steps": 3440, "total_steps": 6250, "loss": 0.7327, "learning_rate": 2.1058112325704436e-05, "epoch": 0.5504, "percentage": 55.04, "elapsed_time": "5:53:16", "remaining_time": "4:48:34", "throughput": 869.43, "total_tokens": 18428656} {"current_steps": 3445, "total_steps": 6250, "loss": 0.7214, "learning_rate": 2.0996078952445452e-05, "epoch": 0.5512, "percentage": 55.12, "elapsed_time": "5:53:38", "remaining_time": "4:47:56", "throughput": 869.62, "total_tokens": 18451744} {"current_steps": 3450, "total_steps": 6250, "loss": 0.7192, "learning_rate": 2.0934070870127912e-05, "epoch": 0.552, "percentage": 55.2, "elapsed_time": "5:54:00", "remaining_time": "4:47:18", "throughput": 869.89, "total_tokens": 18476960} {"current_steps": 3455, "total_steps": 6250, "loss": 0.6481, "learning_rate": 2.0872088470428553e-05, "epoch": 0.5528, "percentage": 55.28, "elapsed_time": "5:54:24", "remaining_time": "4:46:42", "throughput": 870.34, "total_tokens": 18507280} {"current_steps": 3460, "total_steps": 6250, "loss": 0.6906, "learning_rate": 2.08101321448619e-05, "epoch": 0.5536, "percentage": 55.36, "elapsed_time": "5:54:44", "remaining_time": "4:46:03", "throughput": 870.64, "total_tokens": 18531264} {"current_steps": 3465, "total_steps": 6250, "loss": 0.6691, "learning_rate": 2.0748202284777777e-05, "epoch": 0.5544, "percentage": 55.44, "elapsed_time": "5:55:08", "remaining_time": "4:45:26", "throughput": 871.0, "total_tokens": 18559552} {"current_steps": 3470, "total_steps": 6250, "loss": 0.743, "learning_rate": 2.0686299281358835e-05, "epoch": 0.5552, "percentage": 55.52, "elapsed_time": "5:55:34", "remaining_time": "4:44:51", "throughput": 871.25, "total_tokens": 18587408} {"current_steps": 3475, "total_steps": 6250, "loss": 0.6896, "learning_rate": 2.0624423525618098e-05, "epoch": 0.556, "percentage": 55.6, "elapsed_time": "5:56:01", "remaining_time": "4:44:18", "throughput": 871.49, "total_tokens": 18616384} {"current_steps": 3480, "total_steps": 6250, "loss": 0.7799, "learning_rate": 2.056257540839647e-05, "epoch": 0.5568, "percentage": 55.68, "elapsed_time": "5:56:22", "remaining_time": "4:43:40", "throughput": 871.75, "total_tokens": 18640432} {"current_steps": 3485, "total_steps": 6250, "loss": 0.6796, "learning_rate": 2.050075532036026e-05, "epoch": 0.5576, "percentage": 55.76, "elapsed_time": "5:56:45", "remaining_time": "4:43:02", "throughput": 871.84, "total_tokens": 18661696} {"current_steps": 3490, "total_steps": 6250, "loss": 0.6601, "learning_rate": 2.0438963651998747e-05, "epoch": 0.5584, "percentage": 55.84, "elapsed_time": "5:57:11", "remaining_time": "4:42:28", "throughput": 872.04, "total_tokens": 18689280} {"current_steps": 3495, "total_steps": 6250, "loss": 0.7247, "learning_rate": 2.037720079362169e-05, "epoch": 0.5592, "percentage": 55.92, "elapsed_time": "5:57:35", "remaining_time": "4:41:52", "throughput": 872.2, "total_tokens": 18713776} {"current_steps": 3500, "total_steps": 6250, "loss": 0.7113, "learning_rate": 2.031546713535688e-05, "epoch": 0.56, "percentage": 56.0, "elapsed_time": "5:58:00", "remaining_time": "4:41:17", "throughput": 872.39, "total_tokens": 18739632} {"current_steps": 3505, "total_steps": 6250, "loss": 0.604, "learning_rate": 2.0253763067147657e-05, "epoch": 0.5608, "percentage": 56.08, "elapsed_time": "5:58:26", "remaining_time": "4:40:42", "throughput": 872.66, "total_tokens": 18767504} {"current_steps": 3510, "total_steps": 6250, "loss": 0.6292, "learning_rate": 2.0192088978750433e-05, "epoch": 0.5616, "percentage": 56.16, "elapsed_time": "5:58:53", "remaining_time": "4:40:09", "throughput": 872.84, "total_tokens": 18794976} {"current_steps": 3515, "total_steps": 6250, "loss": 0.7227, "learning_rate": 2.0130445259732285e-05, "epoch": 0.5624, "percentage": 56.24, "elapsed_time": "5:59:16", "remaining_time": "4:39:32", "throughput": 873.22, "total_tokens": 18823456} {"current_steps": 3520, "total_steps": 6250, "loss": 0.6536, "learning_rate": 2.0068832299468428e-05, "epoch": 0.5632, "percentage": 56.32, "elapsed_time": "5:59:38", "remaining_time": "4:38:55", "throughput": 873.61, "total_tokens": 18851104} {"current_steps": 3525, "total_steps": 6250, "loss": 0.6729, "learning_rate": 2.000725048713983e-05, "epoch": 0.564, "percentage": 56.4, "elapsed_time": "6:00:05", "remaining_time": "4:38:21", "throughput": 873.97, "total_tokens": 18882096} {"current_steps": 3530, "total_steps": 6250, "loss": 0.8178, "learning_rate": 1.994570021173067e-05, "epoch": 0.5648, "percentage": 56.48, "elapsed_time": "6:00:24", "remaining_time": "4:37:42", "throughput": 874.16, "total_tokens": 18903520} {"current_steps": 3535, "total_steps": 6250, "loss": 0.6575, "learning_rate": 1.988418186202594e-05, "epoch": 0.5656, "percentage": 56.56, "elapsed_time": "6:00:52", "remaining_time": "4:37:09", "throughput": 874.6, "total_tokens": 18937200} {"current_steps": 3540, "total_steps": 6250, "loss": 0.7789, "learning_rate": 1.9822695826608972e-05, "epoch": 0.5664, "percentage": 56.64, "elapsed_time": "6:01:20", "remaining_time": "4:36:37", "throughput": 874.77, "total_tokens": 18965424} {"current_steps": 3545, "total_steps": 6250, "loss": 0.6699, "learning_rate": 1.9761242493858987e-05, "epoch": 0.5672, "percentage": 56.72, "elapsed_time": "6:01:44", "remaining_time": "4:36:01", "throughput": 874.92, "total_tokens": 18989456} {"current_steps": 3550, "total_steps": 6250, "loss": 0.7095, "learning_rate": 1.969982225194864e-05, "epoch": 0.568, "percentage": 56.8, "elapsed_time": "6:02:07", "remaining_time": "4:35:25", "throughput": 875.29, "total_tokens": 19017808} {"current_steps": 3555, "total_steps": 6250, "loss": 0.7191, "learning_rate": 1.9638435488841546e-05, "epoch": 0.5688, "percentage": 56.88, "elapsed_time": "6:02:35", "remaining_time": "4:34:52", "throughput": 875.5, "total_tokens": 19046496} {"current_steps": 3560, "total_steps": 6250, "loss": 0.7016, "learning_rate": 1.957708259228987e-05, "epoch": 0.5696, "percentage": 56.96, "elapsed_time": "6:02:58", "remaining_time": "4:34:16", "throughput": 875.74, "total_tokens": 19072128} {"current_steps": 3565, "total_steps": 6250, "loss": 0.6903, "learning_rate": 1.951576394983185e-05, "epoch": 0.5704, "percentage": 57.04, "elapsed_time": "6:03:19", "remaining_time": "4:33:38", "throughput": 876.0, "total_tokens": 19096528} {"current_steps": 3570, "total_steps": 6250, "loss": 0.6144, "learning_rate": 1.945447994878937e-05, "epoch": 0.5712, "percentage": 57.12, "elapsed_time": "6:03:43", "remaining_time": "4:33:02", "throughput": 876.41, "total_tokens": 19126240} {"current_steps": 3575, "total_steps": 6250, "loss": 0.6755, "learning_rate": 1.9393230976265473e-05, "epoch": 0.572, "percentage": 57.2, "elapsed_time": "6:04:07", "remaining_time": "4:32:27", "throughput": 876.67, "total_tokens": 19152752} {"current_steps": 3580, "total_steps": 6250, "loss": 0.748, "learning_rate": 1.9332017419141962e-05, "epoch": 0.5728, "percentage": 57.28, "elapsed_time": "6:04:29", "remaining_time": "4:31:50", "throughput": 877.0, "total_tokens": 19179296} {"current_steps": 3585, "total_steps": 6250, "loss": 0.7011, "learning_rate": 1.9270839664076936e-05, "epoch": 0.5736, "percentage": 57.36, "elapsed_time": "6:04:50", "remaining_time": "4:31:12", "throughput": 877.35, "total_tokens": 19205616} {"current_steps": 3590, "total_steps": 6250, "loss": 0.6672, "learning_rate": 1.920969809750234e-05, "epoch": 0.5744, "percentage": 57.44, "elapsed_time": "6:05:14", "remaining_time": "4:30:37", "throughput": 877.56, "total_tokens": 19231440} {"current_steps": 3595, "total_steps": 6250, "loss": 0.7261, "learning_rate": 1.914859310562154e-05, "epoch": 0.5752, "percentage": 57.52, "elapsed_time": "6:05:43", "remaining_time": "4:30:06", "throughput": 877.62, "total_tokens": 19258288} {"current_steps": 3600, "total_steps": 6250, "loss": 0.7838, "learning_rate": 1.908752507440689e-05, "epoch": 0.576, "percentage": 57.6, "elapsed_time": "6:06:13", "remaining_time": "4:29:34", "throughput": 877.63, "total_tokens": 19284464} {"current_steps": 3605, "total_steps": 6250, "loss": 0.6574, "learning_rate": 1.9026494389597238e-05, "epoch": 0.5768, "percentage": 57.68, "elapsed_time": "6:06:44", "remaining_time": "4:29:04", "throughput": 877.67, "total_tokens": 19312272} {"current_steps": 3610, "total_steps": 6250, "loss": 0.7692, "learning_rate": 1.8965501436695577e-05, "epoch": 0.5776, "percentage": 57.76, "elapsed_time": "6:07:12", "remaining_time": "4:28:32", "throughput": 877.57, "total_tokens": 19335408} {"current_steps": 3615, "total_steps": 6250, "loss": 0.7165, "learning_rate": 1.890454660096654e-05, "epoch": 0.5784, "percentage": 57.84, "elapsed_time": "6:07:34", "remaining_time": "4:27:55", "throughput": 877.87, "total_tokens": 19360768} {"current_steps": 3620, "total_steps": 6250, "loss": 0.8187, "learning_rate": 1.8843630267434e-05, "epoch": 0.5792, "percentage": 57.92, "elapsed_time": "6:07:59", "remaining_time": "4:27:20", "throughput": 878.02, "total_tokens": 19386016} {"current_steps": 3625, "total_steps": 6250, "loss": 0.6587, "learning_rate": 1.8782752820878634e-05, "epoch": 0.58, "percentage": 58.0, "elapsed_time": "6:08:24", "remaining_time": "4:26:47", "throughput": 878.02, "total_tokens": 19408560} {"current_steps": 3630, "total_steps": 6250, "loss": 0.6268, "learning_rate": 1.872191464583547e-05, "epoch": 0.5808, "percentage": 58.08, "elapsed_time": "6:08:58", "remaining_time": "4:26:18", "throughput": 877.95, "total_tokens": 19436592} {"current_steps": 3635, "total_steps": 6250, "loss": 0.6977, "learning_rate": 1.866111612659149e-05, "epoch": 0.5816, "percentage": 58.16, "elapsed_time": "6:09:29", "remaining_time": "4:25:48", "throughput": 877.94, "total_tokens": 19463440} {"current_steps": 3640, "total_steps": 6250, "loss": 0.6292, "learning_rate": 1.8600357647183185e-05, "epoch": 0.5824, "percentage": 58.24, "elapsed_time": "6:10:03", "remaining_time": "4:25:20", "throughput": 877.92, "total_tokens": 19493360} {"current_steps": 3645, "total_steps": 6250, "loss": 0.6547, "learning_rate": 1.8539639591394133e-05, "epoch": 0.5832, "percentage": 58.32, "elapsed_time": "6:10:37", "remaining_time": "4:24:52", "throughput": 877.87, "total_tokens": 19521392} {"current_steps": 3650, "total_steps": 6250, "loss": 0.6717, "learning_rate": 1.8478962342752583e-05, "epoch": 0.584, "percentage": 58.4, "elapsed_time": "6:11:02", "remaining_time": "4:24:18", "throughput": 878.17, "total_tokens": 19550336} {"current_steps": 3655, "total_steps": 6250, "loss": 0.7065, "learning_rate": 1.8418326284528996e-05, "epoch": 0.5848, "percentage": 58.48, "elapsed_time": "6:11:24", "remaining_time": "4:23:41", "throughput": 878.46, "total_tokens": 19575776} {"current_steps": 3660, "total_steps": 6250, "loss": 0.7029, "learning_rate": 1.8357731799733686e-05, "epoch": 0.5856, "percentage": 58.56, "elapsed_time": "6:11:45", "remaining_time": "4:23:04", "throughput": 878.63, "total_tokens": 19598128} {"current_steps": 3665, "total_steps": 6250, "loss": 0.7311, "learning_rate": 1.8297179271114346e-05, "epoch": 0.5864, "percentage": 58.64, "elapsed_time": "6:12:05", "remaining_time": "4:22:26", "throughput": 879.08, "total_tokens": 19625648} {"current_steps": 3670, "total_steps": 6250, "loss": 0.7296, "learning_rate": 1.8236669081153657e-05, "epoch": 0.5872, "percentage": 58.72, "elapsed_time": "6:12:26", "remaining_time": "4:21:49", "throughput": 879.32, "total_tokens": 19649952} {"current_steps": 3675, "total_steps": 6250, "loss": 0.7534, "learning_rate": 1.817620161206687e-05, "epoch": 0.588, "percentage": 58.8, "elapsed_time": "6:12:46", "remaining_time": "4:21:11", "throughput": 879.77, "total_tokens": 19677680} {"current_steps": 3680, "total_steps": 6250, "loss": 0.6995, "learning_rate": 1.811577724579938e-05, "epoch": 0.5888, "percentage": 58.88, "elapsed_time": "6:13:13", "remaining_time": "4:20:38", "throughput": 880.25, "total_tokens": 19711904} {"current_steps": 3685, "total_steps": 6250, "loss": 0.7517, "learning_rate": 1.8055396364024317e-05, "epoch": 0.5896, "percentage": 58.96, "elapsed_time": "6:13:33", "remaining_time": "4:20:00", "throughput": 880.48, "total_tokens": 19734272} {"current_steps": 3690, "total_steps": 6250, "loss": 0.7048, "learning_rate": 1.7995059348140165e-05, "epoch": 0.5904, "percentage": 59.04, "elapsed_time": "6:13:54", "remaining_time": "4:19:24", "throughput": 880.83, "total_tokens": 19761136} {"current_steps": 3695, "total_steps": 6250, "loss": 0.6385, "learning_rate": 1.7934766579268292e-05, "epoch": 0.5912, "percentage": 59.12, "elapsed_time": "6:14:15", "remaining_time": "4:18:47", "throughput": 881.06, "total_tokens": 19784880} {"current_steps": 3700, "total_steps": 6250, "loss": 0.8177, "learning_rate": 1.7874518438250597e-05, "epoch": 0.592, "percentage": 59.2, "elapsed_time": "6:14:35", "remaining_time": "4:18:10", "throughput": 881.45, "total_tokens": 19811456} {"current_steps": 3705, "total_steps": 6250, "loss": 0.7373, "learning_rate": 1.7814315305647093e-05, "epoch": 0.5928, "percentage": 59.28, "elapsed_time": "6:14:58", "remaining_time": "4:17:34", "throughput": 881.78, "total_tokens": 19839168} {"current_steps": 3710, "total_steps": 6250, "loss": 0.723, "learning_rate": 1.7754157561733476e-05, "epoch": 0.5936, "percentage": 59.36, "elapsed_time": "6:15:18", "remaining_time": "4:16:57", "throughput": 882.18, "total_tokens": 19865584} {"current_steps": 3715, "total_steps": 6250, "loss": 0.6315, "learning_rate": 1.7694045586498752e-05, "epoch": 0.5944, "percentage": 59.44, "elapsed_time": "6:15:38", "remaining_time": "4:16:19", "throughput": 882.62, "total_tokens": 19893232} {"current_steps": 3720, "total_steps": 6250, "loss": 0.6184, "learning_rate": 1.7633979759642844e-05, "epoch": 0.5952, "percentage": 59.52, "elapsed_time": "6:16:01", "remaining_time": "4:15:44", "throughput": 882.86, "total_tokens": 19918512} {"current_steps": 3725, "total_steps": 6250, "loss": 0.682, "learning_rate": 1.7573960460574133e-05, "epoch": 0.596, "percentage": 59.6, "elapsed_time": "6:16:22", "remaining_time": "4:15:07", "throughput": 883.17, "total_tokens": 19944544} {"current_steps": 3730, "total_steps": 6250, "loss": 0.6738, "learning_rate": 1.7513988068407146e-05, "epoch": 0.5968, "percentage": 59.68, "elapsed_time": "6:16:44", "remaining_time": "4:14:31", "throughput": 883.51, "total_tokens": 19971104} {"current_steps": 3735, "total_steps": 6250, "loss": 0.6895, "learning_rate": 1.74540629619601e-05, "epoch": 0.5976, "percentage": 59.76, "elapsed_time": "6:17:05", "remaining_time": "4:13:55", "throughput": 883.79, "total_tokens": 19996352} {"current_steps": 3740, "total_steps": 6250, "loss": 0.7436, "learning_rate": 1.7394185519752545e-05, "epoch": 0.5984, "percentage": 59.84, "elapsed_time": "6:17:29", "remaining_time": "4:13:20", "throughput": 883.99, "total_tokens": 20021744} {"current_steps": 3745, "total_steps": 6250, "loss": 0.7612, "learning_rate": 1.7334356120002957e-05, "epoch": 0.5992, "percentage": 59.92, "elapsed_time": "6:17:50", "remaining_time": "4:12:44", "throughput": 884.26, "total_tokens": 20046560} {"current_steps": 3750, "total_steps": 6250, "loss": 0.7139, "learning_rate": 1.7274575140626318e-05, "epoch": 0.6, "percentage": 60.0, "elapsed_time": "6:18:10", "remaining_time": "4:12:06", "throughput": 884.63, "total_tokens": 20072560} {"current_steps": 3755, "total_steps": 6250, "loss": 0.6556, "learning_rate": 1.7214842959231794e-05, "epoch": 0.6008, "percentage": 60.08, "elapsed_time": "6:18:35", "remaining_time": "4:11:33", "throughput": 885.0, "total_tokens": 20103488} {"current_steps": 3760, "total_steps": 6250, "loss": 0.6884, "learning_rate": 1.7155159953120313e-05, "epoch": 0.6016, "percentage": 60.16, "elapsed_time": "6:19:38", "remaining_time": "4:11:24", "throughput": 883.76, "total_tokens": 20130784} {"current_steps": 3765, "total_steps": 6250, "loss": 0.7729, "learning_rate": 1.7095526499282172e-05, "epoch": 0.6024, "percentage": 60.24, "elapsed_time": "6:20:30", "remaining_time": "4:11:08", "throughput": 882.99, "total_tokens": 20158720} {"current_steps": 3770, "total_steps": 6250, "loss": 0.7427, "learning_rate": 1.703594297439469e-05, "epoch": 0.6032, "percentage": 60.32, "elapsed_time": "6:20:49", "remaining_time": "4:10:31", "throughput": 883.19, "total_tokens": 20180736} {"current_steps": 3775, "total_steps": 6250, "loss": 0.6831, "learning_rate": 1.6976409754819767e-05, "epoch": 0.604, "percentage": 60.4, "elapsed_time": "6:21:15", "remaining_time": "4:09:57", "throughput": 883.2, "total_tokens": 20203744} {"current_steps": 3780, "total_steps": 6250, "loss": 0.6098, "learning_rate": 1.6916927216601593e-05, "epoch": 0.6048, "percentage": 60.48, "elapsed_time": "6:21:44", "remaining_time": "4:09:26", "throughput": 883.36, "total_tokens": 20232784} {"current_steps": 3785, "total_steps": 6250, "loss": 0.812, "learning_rate": 1.6857495735464195e-05, "epoch": 0.6056, "percentage": 60.56, "elapsed_time": "6:22:17", "remaining_time": "4:08:58", "throughput": 883.37, "total_tokens": 20262256} {"current_steps": 3790, "total_steps": 6250, "loss": 0.6337, "learning_rate": 1.6798115686809125e-05, "epoch": 0.6064, "percentage": 60.64, "elapsed_time": "6:22:38", "remaining_time": "4:08:22", "throughput": 883.78, "total_tokens": 20290720} {"current_steps": 3795, "total_steps": 6250, "loss": 0.7105, "learning_rate": 1.6738787445713037e-05, "epoch": 0.6072, "percentage": 60.72, "elapsed_time": "6:23:00", "remaining_time": "4:07:46", "throughput": 883.99, "total_tokens": 20314368} {"current_steps": 3800, "total_steps": 6250, "loss": 0.7776, "learning_rate": 1.6679511386925337e-05, "epoch": 0.608, "percentage": 60.8, "elapsed_time": "6:23:22", "remaining_time": "4:07:10", "throughput": 884.16, "total_tokens": 20337648} {"current_steps": 3805, "total_steps": 6250, "loss": 0.6626, "learning_rate": 1.662028788486583e-05, "epoch": 0.6088, "percentage": 60.88, "elapsed_time": "6:23:44", "remaining_time": "4:06:34", "throughput": 884.6, "total_tokens": 20367344} {"current_steps": 3810, "total_steps": 6250, "loss": 0.6983, "learning_rate": 1.656111731362236e-05, "epoch": 0.6096, "percentage": 60.96, "elapsed_time": "6:24:05", "remaining_time": "4:05:58", "throughput": 884.83, "total_tokens": 20391616} {"current_steps": 3815, "total_steps": 6250, "loss": 0.6948, "learning_rate": 1.650200004694839e-05, "epoch": 0.6104, "percentage": 61.04, "elapsed_time": "6:24:27", "remaining_time": "4:05:23", "throughput": 885.22, "total_tokens": 20419520} {"current_steps": 3820, "total_steps": 6250, "loss": 0.8154, "learning_rate": 1.644293645826072e-05, "epoch": 0.6112, "percentage": 61.12, "elapsed_time": "6:24:48", "remaining_time": "4:04:47", "throughput": 885.56, "total_tokens": 20446048} {"current_steps": 3825, "total_steps": 6250, "loss": 0.7234, "learning_rate": 1.6383926920637077e-05, "epoch": 0.612, "percentage": 61.2, "elapsed_time": "6:25:08", "remaining_time": "4:04:10", "throughput": 885.95, "total_tokens": 20472960} {"current_steps": 3830, "total_steps": 6250, "loss": 0.668, "learning_rate": 1.6324971806813767e-05, "epoch": 0.6128, "percentage": 61.28, "elapsed_time": "6:25:31", "remaining_time": "4:03:35", "throughput": 886.36, "total_tokens": 20502816} {"current_steps": 3835, "total_steps": 6250, "loss": 0.6936, "learning_rate": 1.6266071489183327e-05, "epoch": 0.6136, "percentage": 61.36, "elapsed_time": "6:25:52", "remaining_time": "4:02:59", "throughput": 886.68, "total_tokens": 20529056} {"current_steps": 3840, "total_steps": 6250, "loss": 0.7988, "learning_rate": 1.620722633979219e-05, "epoch": 0.6144, "percentage": 61.44, "elapsed_time": "6:26:13", "remaining_time": "4:02:23", "throughput": 887.03, "total_tokens": 20555392} {"current_steps": 3845, "total_steps": 6250, "loss": 0.7752, "learning_rate": 1.614843673033828e-05, "epoch": 0.6152, "percentage": 61.52, "elapsed_time": "6:26:36", "remaining_time": "4:01:48", "throughput": 887.38, "total_tokens": 20583888} {"current_steps": 3850, "total_steps": 6250, "loss": 0.6784, "learning_rate": 1.6089703032168733e-05, "epoch": 0.616, "percentage": 61.6, "elapsed_time": "6:26:58", "remaining_time": "4:01:13", "throughput": 887.74, "total_tokens": 20612112} {"current_steps": 3855, "total_steps": 6250, "loss": 0.6483, "learning_rate": 1.603102561627751e-05, "epoch": 0.6168, "percentage": 61.68, "elapsed_time": "6:27:20", "remaining_time": "4:00:38", "throughput": 888.09, "total_tokens": 20639296} {"current_steps": 3860, "total_steps": 6250, "loss": 0.6876, "learning_rate": 1.5972404853303062e-05, "epoch": 0.6176, "percentage": 61.76, "elapsed_time": "6:27:39", "remaining_time": "4:00:01", "throughput": 888.38, "total_tokens": 20663680} {"current_steps": 3865, "total_steps": 6250, "loss": 0.7651, "learning_rate": 1.5913841113525992e-05, "epoch": 0.6184, "percentage": 61.84, "elapsed_time": "6:28:02", "remaining_time": "3:59:26", "throughput": 888.69, "total_tokens": 20690592} {"current_steps": 3870, "total_steps": 6250, "loss": 0.6692, "learning_rate": 1.585533476686669e-05, "epoch": 0.6192, "percentage": 61.92, "elapsed_time": "6:28:25", "remaining_time": "3:58:52", "throughput": 888.92, "total_tokens": 20716944} {"current_steps": 3875, "total_steps": 6250, "loss": 0.708, "learning_rate": 1.5796886182883053e-05, "epoch": 0.62, "percentage": 62.0, "elapsed_time": "6:28:46", "remaining_time": "3:58:16", "throughput": 889.2, "total_tokens": 20742128} {"current_steps": 3880, "total_steps": 6250, "loss": 0.6734, "learning_rate": 1.5738495730768105e-05, "epoch": 0.6208, "percentage": 62.08, "elapsed_time": "6:29:07", "remaining_time": "3:57:41", "throughput": 889.57, "total_tokens": 20769344} {"current_steps": 3885, "total_steps": 6250, "loss": 0.7442, "learning_rate": 1.5680163779347667e-05, "epoch": 0.6216, "percentage": 62.16, "elapsed_time": "6:29:28", "remaining_time": "3:57:05", "throughput": 889.81, "total_tokens": 20793920} {"current_steps": 3890, "total_steps": 6250, "loss": 0.786, "learning_rate": 1.562189069707807e-05, "epoch": 0.6224, "percentage": 62.24, "elapsed_time": "6:29:48", "remaining_time": "3:56:29", "throughput": 890.15, "total_tokens": 20819616} {"current_steps": 3895, "total_steps": 6250, "loss": 0.6565, "learning_rate": 1.556367685204374e-05, "epoch": 0.6232, "percentage": 62.32, "elapsed_time": "6:30:09", "remaining_time": "3:55:53", "throughput": 890.36, "total_tokens": 20843056} {"current_steps": 3900, "total_steps": 6250, "loss": 0.8403, "learning_rate": 1.5505522611954975e-05, "epoch": 0.624, "percentage": 62.4, "elapsed_time": "6:30:33", "remaining_time": "3:55:20", "throughput": 890.63, "total_tokens": 20870320} {"current_steps": 3905, "total_steps": 6250, "loss": 0.717, "learning_rate": 1.5447428344145563e-05, "epoch": 0.6248, "percentage": 62.48, "elapsed_time": "6:30:53", "remaining_time": "3:54:44", "throughput": 890.88, "total_tokens": 20894448} {"current_steps": 3910, "total_steps": 6250, "loss": 0.6563, "learning_rate": 1.538939441557048e-05, "epoch": 0.6256, "percentage": 62.56, "elapsed_time": "6:31:19", "remaining_time": "3:54:11", "throughput": 891.29, "total_tokens": 20926800} {"current_steps": 3915, "total_steps": 6250, "loss": 0.7742, "learning_rate": 1.5331421192803565e-05, "epoch": 0.6264, "percentage": 62.64, "elapsed_time": "6:31:40", "remaining_time": "3:53:36", "throughput": 891.64, "total_tokens": 20954016} {"current_steps": 3920, "total_steps": 6250, "loss": 0.6654, "learning_rate": 1.5273509042035172e-05, "epoch": 0.6272, "percentage": 62.72, "elapsed_time": "6:32:04", "remaining_time": "3:53:02", "throughput": 891.94, "total_tokens": 20982512} {"current_steps": 3925, "total_steps": 6250, "loss": 0.6737, "learning_rate": 1.521565832906994e-05, "epoch": 0.628, "percentage": 62.8, "elapsed_time": "6:32:27", "remaining_time": "3:52:28", "throughput": 892.2, "total_tokens": 21008768} {"current_steps": 3930, "total_steps": 6250, "loss": 0.7259, "learning_rate": 1.515786941932441e-05, "epoch": 0.6288, "percentage": 62.88, "elapsed_time": "6:32:51", "remaining_time": "3:51:54", "throughput": 892.54, "total_tokens": 21038144} {"current_steps": 3935, "total_steps": 6250, "loss": 0.6793, "learning_rate": 1.5100142677824753e-05, "epoch": 0.6296, "percentage": 62.96, "elapsed_time": "6:33:13", "remaining_time": "3:51:20", "throughput": 892.83, "total_tokens": 21065120} {"current_steps": 3940, "total_steps": 6250, "loss": 0.6934, "learning_rate": 1.5042478469204435e-05, "epoch": 0.6304, "percentage": 63.04, "elapsed_time": "6:33:35", "remaining_time": "3:50:45", "throughput": 893.13, "total_tokens": 21091296} {"current_steps": 3945, "total_steps": 6250, "loss": 0.7746, "learning_rate": 1.4984877157701932e-05, "epoch": 0.6312, "percentage": 63.12, "elapsed_time": "6:33:56", "remaining_time": "3:50:10", "throughput": 893.44, "total_tokens": 21117568} {"current_steps": 3950, "total_steps": 6250, "loss": 0.6311, "learning_rate": 1.4927339107158437e-05, "epoch": 0.632, "percentage": 63.2, "elapsed_time": "6:34:18", "remaining_time": "3:49:35", "throughput": 893.82, "total_tokens": 21146640} {"current_steps": 3955, "total_steps": 6250, "loss": 0.7614, "learning_rate": 1.486986468101555e-05, "epoch": 0.6328, "percentage": 63.28, "elapsed_time": "6:34:39", "remaining_time": "3:49:00", "throughput": 894.01, "total_tokens": 21169680} {"current_steps": 3960, "total_steps": 6250, "loss": 0.7291, "learning_rate": 1.4812454242312979e-05, "epoch": 0.6336, "percentage": 63.36, "elapsed_time": "6:35:00", "remaining_time": "3:48:25", "throughput": 894.29, "total_tokens": 21195360} {"current_steps": 3965, "total_steps": 6250, "loss": 0.7421, "learning_rate": 1.4755108153686275e-05, "epoch": 0.6344, "percentage": 63.44, "elapsed_time": "6:35:20", "remaining_time": "3:47:49", "throughput": 894.54, "total_tokens": 21218896} {"current_steps": 3970, "total_steps": 6250, "loss": 0.7831, "learning_rate": 1.4697826777364477e-05, "epoch": 0.6352, "percentage": 63.52, "elapsed_time": "6:35:40", "remaining_time": "3:47:14", "throughput": 894.85, "total_tokens": 21244080} {"current_steps": 3975, "total_steps": 6250, "loss": 0.6907, "learning_rate": 1.4640610475167898e-05, "epoch": 0.636, "percentage": 63.6, "elapsed_time": "6:36:01", "remaining_time": "3:46:39", "throughput": 895.17, "total_tokens": 21271024} {"current_steps": 3980, "total_steps": 6250, "loss": 0.7001, "learning_rate": 1.4583459608505801e-05, "epoch": 0.6368, "percentage": 63.68, "elapsed_time": "6:36:23", "remaining_time": "3:46:04", "throughput": 895.55, "total_tokens": 21298992} {"current_steps": 3985, "total_steps": 6250, "loss": 0.6729, "learning_rate": 1.4526374538374132e-05, "epoch": 0.6376, "percentage": 63.76, "elapsed_time": "6:36:44", "remaining_time": "3:45:30", "throughput": 895.8, "total_tokens": 21324032} {"current_steps": 3990, "total_steps": 6250, "loss": 0.6636, "learning_rate": 1.4469355625353198e-05, "epoch": 0.6384, "percentage": 63.84, "elapsed_time": "6:37:11", "remaining_time": "3:44:58", "throughput": 896.07, "total_tokens": 21354256} {"current_steps": 3995, "total_steps": 6250, "loss": 0.6349, "learning_rate": 1.4412403229605454e-05, "epoch": 0.6392, "percentage": 63.92, "elapsed_time": "6:37:33", "remaining_time": "3:44:24", "throughput": 896.39, "total_tokens": 21382144} {"current_steps": 4000, "total_steps": 6250, "loss": 0.6892, "learning_rate": 1.4355517710873184e-05, "epoch": 0.64, "percentage": 64.0, "elapsed_time": "6:37:54", "remaining_time": "3:43:49", "throughput": 896.68, "total_tokens": 21408112} {"current_steps": 4005, "total_steps": 6250, "loss": 0.6602, "learning_rate": 1.4298699428476236e-05, "epoch": 0.6408, "percentage": 64.08, "elapsed_time": "6:38:16", "remaining_time": "3:43:15", "throughput": 897.15, "total_tokens": 21438800} {"current_steps": 4010, "total_steps": 6250, "loss": 0.6613, "learning_rate": 1.4241948741309782e-05, "epoch": 0.6416, "percentage": 64.16, "elapsed_time": "6:38:37", "remaining_time": "3:42:40", "throughput": 897.5, "total_tokens": 21466464} {"current_steps": 4015, "total_steps": 6250, "loss": 0.6821, "learning_rate": 1.418526600784198e-05, "epoch": 0.6424, "percentage": 64.24, "elapsed_time": "6:39:00", "remaining_time": "3:42:06", "throughput": 897.92, "total_tokens": 21496864} {"current_steps": 4020, "total_steps": 6250, "loss": 0.6698, "learning_rate": 1.412865158611179e-05, "epoch": 0.6432, "percentage": 64.32, "elapsed_time": "6:39:22", "remaining_time": "3:41:32", "throughput": 898.22, "total_tokens": 21523456} {"current_steps": 4025, "total_steps": 6250, "loss": 0.5917, "learning_rate": 1.4072105833726684e-05, "epoch": 0.644, "percentage": 64.4, "elapsed_time": "6:39:46", "remaining_time": "3:40:59", "throughput": 898.62, "total_tokens": 21554320} {"current_steps": 4030, "total_steps": 6250, "loss": 0.7332, "learning_rate": 1.401562910786034e-05, "epoch": 0.6448, "percentage": 64.48, "elapsed_time": "6:40:07", "remaining_time": "3:40:25", "throughput": 899.07, "total_tokens": 21584496} {"current_steps": 4035, "total_steps": 6250, "loss": 0.6826, "learning_rate": 1.3959221765250469e-05, "epoch": 0.6456, "percentage": 64.56, "elapsed_time": "6:40:30", "remaining_time": "3:39:51", "throughput": 899.5, "total_tokens": 21615104} {"current_steps": 4040, "total_steps": 6250, "loss": 0.7349, "learning_rate": 1.3902884162196508e-05, "epoch": 0.6464, "percentage": 64.64, "elapsed_time": "6:40:51", "remaining_time": "3:39:16", "throughput": 899.83, "total_tokens": 21642144} {"current_steps": 4045, "total_steps": 6250, "loss": 0.6341, "learning_rate": 1.3846616654557362e-05, "epoch": 0.6472, "percentage": 64.72, "elapsed_time": "6:41:15", "remaining_time": "3:38:43", "throughput": 900.14, "total_tokens": 21671408} {"current_steps": 4050, "total_steps": 6250, "loss": 0.7531, "learning_rate": 1.3790419597749199e-05, "epoch": 0.648, "percentage": 64.8, "elapsed_time": "6:41:39", "remaining_time": "3:38:11", "throughput": 900.39, "total_tokens": 21698880} {"current_steps": 4055, "total_steps": 6250, "loss": 0.6284, "learning_rate": 1.3734293346743168e-05, "epoch": 0.6488, "percentage": 64.88, "elapsed_time": "6:42:00", "remaining_time": "3:37:36", "throughput": 900.78, "total_tokens": 21727280} {"current_steps": 4060, "total_steps": 6250, "loss": 0.7148, "learning_rate": 1.367823825606319e-05, "epoch": 0.6496, "percentage": 64.96, "elapsed_time": "6:42:21", "remaining_time": "3:37:02", "throughput": 901.0, "total_tokens": 21751824} {"current_steps": 4065, "total_steps": 6250, "loss": 0.7022, "learning_rate": 1.3622254679783663e-05, "epoch": 0.6504, "percentage": 65.04, "elapsed_time": "6:42:43", "remaining_time": "3:36:28", "throughput": 901.46, "total_tokens": 21782080} {"current_steps": 4070, "total_steps": 6250, "loss": 0.7308, "learning_rate": 1.3566342971527291e-05, "epoch": 0.6512, "percentage": 65.12, "elapsed_time": "6:43:04", "remaining_time": "3:35:53", "throughput": 901.8, "total_tokens": 21809376} {"current_steps": 4075, "total_steps": 6250, "loss": 0.7338, "learning_rate": 1.3510503484462805e-05, "epoch": 0.652, "percentage": 65.2, "elapsed_time": "6:43:27", "remaining_time": "3:35:20", "throughput": 902.05, "total_tokens": 21836240} {"current_steps": 4080, "total_steps": 6250, "loss": 0.6941, "learning_rate": 1.3454736571302763e-05, "epoch": 0.6528, "percentage": 65.28, "elapsed_time": "6:43:57", "remaining_time": "3:34:51", "throughput": 902.02, "total_tokens": 21862768} {"current_steps": 4085, "total_steps": 6250, "loss": 0.7218, "learning_rate": 1.3399042584301298e-05, "epoch": 0.6536, "percentage": 65.36, "elapsed_time": "6:44:22", "remaining_time": "3:34:18", "throughput": 902.24, "total_tokens": 21890304} {"current_steps": 4090, "total_steps": 6250, "loss": 0.8144, "learning_rate": 1.3343421875251888e-05, "epoch": 0.6544, "percentage": 65.44, "elapsed_time": "6:44:46", "remaining_time": "3:33:45", "throughput": 902.25, "total_tokens": 21912192} {"current_steps": 4095, "total_steps": 6250, "loss": 0.8236, "learning_rate": 1.3287874795485167e-05, "epoch": 0.6552, "percentage": 65.52, "elapsed_time": "6:45:13", "remaining_time": "3:33:15", "throughput": 902.37, "total_tokens": 21939984} {"current_steps": 4100, "total_steps": 6250, "loss": 0.6512, "learning_rate": 1.3232401695866687e-05, "epoch": 0.656, "percentage": 65.6, "elapsed_time": "6:45:50", "remaining_time": "3:32:49", "throughput": 902.13, "total_tokens": 21967168} {"current_steps": 4105, "total_steps": 6250, "loss": 0.7271, "learning_rate": 1.3177002926794685e-05, "epoch": 0.6568, "percentage": 65.68, "elapsed_time": "6:46:25", "remaining_time": "3:32:22", "throughput": 902.17, "total_tokens": 21999904} {"current_steps": 4110, "total_steps": 6250, "loss": 0.635, "learning_rate": 1.3121678838197909e-05, "epoch": 0.6576, "percentage": 65.76, "elapsed_time": "6:46:54", "remaining_time": "3:31:52", "throughput": 902.27, "total_tokens": 22028272} {"current_steps": 4115, "total_steps": 6250, "loss": 0.6708, "learning_rate": 1.3066429779533351e-05, "epoch": 0.6584, "percentage": 65.84, "elapsed_time": "6:47:25", "remaining_time": "3:31:22", "throughput": 902.11, "total_tokens": 22052224} {"current_steps": 4120, "total_steps": 6250, "loss": 0.5916, "learning_rate": 1.3011256099784103e-05, "epoch": 0.6592, "percentage": 65.92, "elapsed_time": "6:48:06", "remaining_time": "3:30:59", "throughput": 901.79, "total_tokens": 22081360} {"current_steps": 4125, "total_steps": 6250, "loss": 0.7399, "learning_rate": 1.2956158147457115e-05, "epoch": 0.66, "percentage": 66.0, "elapsed_time": "6:48:43", "remaining_time": "3:30:33", "throughput": 901.67, "total_tokens": 22112080} {"current_steps": 4130, "total_steps": 6250, "loss": 0.6543, "learning_rate": 1.2901136270580993e-05, "epoch": 0.6608, "percentage": 66.08, "elapsed_time": "6:49:14", "remaining_time": "3:30:04", "throughput": 901.67, "total_tokens": 22139792} {"current_steps": 4135, "total_steps": 6250, "loss": 0.6808, "learning_rate": 1.2846190816703835e-05, "epoch": 0.6616, "percentage": 66.16, "elapsed_time": "6:49:43", "remaining_time": "3:29:34", "throughput": 901.54, "total_tokens": 22163136} {"current_steps": 4140, "total_steps": 6250, "loss": 0.6939, "learning_rate": 1.279132213289096e-05, "epoch": 0.6624, "percentage": 66.24, "elapsed_time": "6:50:16", "remaining_time": "3:29:06", "throughput": 901.53, "total_tokens": 22192464} {"current_steps": 4145, "total_steps": 6250, "loss": 0.6628, "learning_rate": 1.273653056572282e-05, "epoch": 0.6632, "percentage": 66.32, "elapsed_time": "6:50:50", "remaining_time": "3:28:38", "throughput": 901.37, "total_tokens": 22219424} {"current_steps": 4150, "total_steps": 6250, "loss": 0.686, "learning_rate": 1.2681816461292715e-05, "epoch": 0.664, "percentage": 66.4, "elapsed_time": "6:51:20", "remaining_time": "3:28:09", "throughput": 901.29, "total_tokens": 22244496} {"current_steps": 4155, "total_steps": 6250, "loss": 0.7278, "learning_rate": 1.2627180165204671e-05, "epoch": 0.6648, "percentage": 66.48, "elapsed_time": "6:51:55", "remaining_time": "3:27:41", "throughput": 901.12, "total_tokens": 22271600} {"current_steps": 4160, "total_steps": 6250, "loss": 0.6531, "learning_rate": 1.257262202257124e-05, "epoch": 0.6656, "percentage": 66.56, "elapsed_time": "6:52:23", "remaining_time": "3:27:11", "throughput": 901.17, "total_tokens": 22298080} {"current_steps": 4165, "total_steps": 6250, "loss": 0.5756, "learning_rate": 1.251814237801128e-05, "epoch": 0.6664, "percentage": 66.64, "elapsed_time": "6:52:46", "remaining_time": "3:26:38", "throughput": 901.4, "total_tokens": 22324832} {"current_steps": 4170, "total_steps": 6250, "loss": 0.647, "learning_rate": 1.246374157564785e-05, "epoch": 0.6672, "percentage": 66.72, "elapsed_time": "6:53:25", "remaining_time": "3:26:13", "throughput": 901.16, "total_tokens": 22353728} {"current_steps": 4175, "total_steps": 6250, "loss": 0.7024, "learning_rate": 1.2409419959105981e-05, "epoch": 0.668, "percentage": 66.8, "elapsed_time": "6:53:50", "remaining_time": "3:25:40", "throughput": 901.1, "total_tokens": 22374880} {"current_steps": 4180, "total_steps": 6250, "loss": 0.7661, "learning_rate": 1.2355177871510538e-05, "epoch": 0.6688, "percentage": 66.88, "elapsed_time": "6:54:28", "remaining_time": "3:25:15", "throughput": 900.84, "total_tokens": 22402288} {"current_steps": 4185, "total_steps": 6250, "loss": 0.6462, "learning_rate": 1.2301015655484006e-05, "epoch": 0.6696, "percentage": 66.96, "elapsed_time": "6:55:02", "remaining_time": "3:24:47", "throughput": 900.71, "total_tokens": 22430240} {"current_steps": 4190, "total_steps": 6250, "loss": 0.6487, "learning_rate": 1.2246933653144385e-05, "epoch": 0.6704, "percentage": 67.04, "elapsed_time": "6:55:33", "remaining_time": "3:24:18", "throughput": 900.58, "total_tokens": 22454800} {"current_steps": 4195, "total_steps": 6250, "loss": 0.7369, "learning_rate": 1.2192932206103e-05, "epoch": 0.6712, "percentage": 67.12, "elapsed_time": "6:56:06", "remaining_time": "3:23:50", "throughput": 900.49, "total_tokens": 22482528} {"current_steps": 4200, "total_steps": 6250, "loss": 0.6942, "learning_rate": 1.2139011655462337e-05, "epoch": 0.672, "percentage": 67.2, "elapsed_time": "6:56:44", "remaining_time": "3:23:24", "throughput": 900.21, "total_tokens": 22508976} {"current_steps": 4205, "total_steps": 6250, "loss": 0.7691, "learning_rate": 1.2085172341813911e-05, "epoch": 0.6728, "percentage": 67.28, "elapsed_time": "6:57:22", "remaining_time": "3:22:58", "throughput": 900.02, "total_tokens": 22538976} {"current_steps": 4210, "total_steps": 6250, "loss": 0.5865, "learning_rate": 1.2031414605236066e-05, "epoch": 0.6736, "percentage": 67.36, "elapsed_time": "6:57:58", "remaining_time": "3:22:32", "throughput": 899.82, "total_tokens": 22566368} {"current_steps": 4215, "total_steps": 6250, "loss": 0.6916, "learning_rate": 1.1977738785291895e-05, "epoch": 0.6744, "percentage": 67.44, "elapsed_time": "6:58:50", "remaining_time": "3:22:12", "throughput": 899.01, "total_tokens": 22592656} {"current_steps": 4220, "total_steps": 6250, "loss": 0.7436, "learning_rate": 1.1924145221027047e-05, "epoch": 0.6752, "percentage": 67.52, "elapsed_time": "6:59:23", "remaining_time": "3:21:44", "throughput": 898.92, "total_tokens": 22619872} {"current_steps": 4225, "total_steps": 6250, "loss": 0.6728, "learning_rate": 1.1870634250967605e-05, "epoch": 0.676, "percentage": 67.6, "elapsed_time": "7:00:01", "remaining_time": "3:21:18", "throughput": 898.77, "total_tokens": 22650320} {"current_steps": 4230, "total_steps": 6250, "loss": 0.728, "learning_rate": 1.1817206213117946e-05, "epoch": 0.6768, "percentage": 67.68, "elapsed_time": "7:00:27", "remaining_time": "3:20:47", "throughput": 898.88, "total_tokens": 22676896} {"current_steps": 4235, "total_steps": 6250, "loss": 0.6696, "learning_rate": 1.1763861444958573e-05, "epoch": 0.6776, "percentage": 67.76, "elapsed_time": "7:00:50", "remaining_time": "3:20:14", "throughput": 899.08, "total_tokens": 22702352} {"current_steps": 4240, "total_steps": 6250, "loss": 0.7827, "learning_rate": 1.1710600283444047e-05, "epoch": 0.6784, "percentage": 67.84, "elapsed_time": "7:01:15", "remaining_time": "3:19:42", "throughput": 899.22, "total_tokens": 22728288} {"current_steps": 4245, "total_steps": 6250, "loss": 0.7166, "learning_rate": 1.1657423065000811e-05, "epoch": 0.6792, "percentage": 67.92, "elapsed_time": "7:01:40", "remaining_time": "3:19:09", "throughput": 899.5, "total_tokens": 22757632} {"current_steps": 4250, "total_steps": 6250, "loss": 0.7143, "learning_rate": 1.1604330125525079e-05, "epoch": 0.68, "percentage": 68.0, "elapsed_time": "7:02:04", "remaining_time": "3:18:37", "throughput": 899.66, "total_tokens": 22783440} {"current_steps": 4255, "total_steps": 6250, "loss": 0.82, "learning_rate": 1.155132180038072e-05, "epoch": 0.6808, "percentage": 68.08, "elapsed_time": "7:02:29", "remaining_time": "3:18:05", "throughput": 899.81, "total_tokens": 22809616} {"current_steps": 4260, "total_steps": 6250, "loss": 0.7297, "learning_rate": 1.1498398424397106e-05, "epoch": 0.6816, "percentage": 68.16, "elapsed_time": "7:02:51", "remaining_time": "3:17:31", "throughput": 900.06, "total_tokens": 22835792} {"current_steps": 4265, "total_steps": 6250, "loss": 0.6956, "learning_rate": 1.1445560331867053e-05, "epoch": 0.6824, "percentage": 68.24, "elapsed_time": "7:03:17", "remaining_time": "3:17:00", "throughput": 900.27, "total_tokens": 22864560} {"current_steps": 4270, "total_steps": 6250, "loss": 0.7157, "learning_rate": 1.1392807856544683e-05, "epoch": 0.6832, "percentage": 68.32, "elapsed_time": "7:03:44", "remaining_time": "3:16:29", "throughput": 900.43, "total_tokens": 22892912} {"current_steps": 4275, "total_steps": 6250, "loss": 0.753, "learning_rate": 1.1340141331643276e-05, "epoch": 0.684, "percentage": 68.4, "elapsed_time": "7:04:07", "remaining_time": "3:15:56", "throughput": 900.38, "total_tokens": 22912640} {"current_steps": 4280, "total_steps": 6250, "loss": 0.7247, "learning_rate": 1.1287561089833248e-05, "epoch": 0.6848, "percentage": 68.48, "elapsed_time": "7:04:28", "remaining_time": "3:15:22", "throughput": 900.61, "total_tokens": 22937072} {"current_steps": 4285, "total_steps": 6250, "loss": 0.7671, "learning_rate": 1.1235067463239967e-05, "epoch": 0.6856, "percentage": 68.56, "elapsed_time": "7:04:49", "remaining_time": "3:14:48", "throughput": 900.82, "total_tokens": 22961104} {"current_steps": 4290, "total_steps": 6250, "loss": 0.6771, "learning_rate": 1.1182660783441718e-05, "epoch": 0.6864, "percentage": 68.64, "elapsed_time": "7:05:12", "remaining_time": "3:14:16", "throughput": 900.87, "total_tokens": 22983744} {"current_steps": 4295, "total_steps": 6250, "loss": 0.7179, "learning_rate": 1.1130341381467569e-05, "epoch": 0.6872, "percentage": 68.72, "elapsed_time": "7:05:37", "remaining_time": "3:13:44", "throughput": 901.04, "total_tokens": 23010208} {"current_steps": 4300, "total_steps": 6250, "loss": 0.5792, "learning_rate": 1.107810958779531e-05, "epoch": 0.688, "percentage": 68.8, "elapsed_time": "7:06:07", "remaining_time": "3:13:14", "throughput": 901.26, "total_tokens": 23043392} {"current_steps": 4305, "total_steps": 6250, "loss": 0.6574, "learning_rate": 1.1025965732349316e-05, "epoch": 0.6888, "percentage": 68.88, "elapsed_time": "7:06:38", "remaining_time": "3:12:45", "throughput": 901.43, "total_tokens": 23074928} {"current_steps": 4310, "total_steps": 6250, "loss": 0.6544, "learning_rate": 1.0973910144498534e-05, "epoch": 0.6896, "percentage": 68.96, "elapsed_time": "7:07:01", "remaining_time": "3:12:12", "throughput": 901.82, "total_tokens": 23105728} {"current_steps": 4315, "total_steps": 6250, "loss": 0.6503, "learning_rate": 1.0921943153054343e-05, "epoch": 0.6904, "percentage": 69.04, "elapsed_time": "7:07:22", "remaining_time": "3:11:39", "throughput": 902.12, "total_tokens": 23132768} {"current_steps": 4320, "total_steps": 6250, "loss": 0.6502, "learning_rate": 1.0870065086268505e-05, "epoch": 0.6912, "percentage": 69.12, "elapsed_time": "7:07:46", "remaining_time": "3:11:06", "throughput": 902.33, "total_tokens": 23160080} {"current_steps": 4325, "total_steps": 6250, "loss": 0.7114, "learning_rate": 1.0818276271831093e-05, "epoch": 0.692, "percentage": 69.2, "elapsed_time": "7:08:12", "remaining_time": "3:10:35", "throughput": 902.5, "total_tokens": 23187696} {"current_steps": 4330, "total_steps": 6250, "loss": 0.6546, "learning_rate": 1.0766577036868395e-05, "epoch": 0.6928, "percentage": 69.28, "elapsed_time": "7:08:34", "remaining_time": "3:10:02", "throughput": 902.7, "total_tokens": 23211904} {"current_steps": 4335, "total_steps": 6250, "loss": 0.6965, "learning_rate": 1.0714967707940875e-05, "epoch": 0.6936, "percentage": 69.36, "elapsed_time": "7:09:00", "remaining_time": "3:09:31", "throughput": 902.78, "total_tokens": 23238144} {"current_steps": 4340, "total_steps": 6250, "loss": 0.6232, "learning_rate": 1.0663448611041113e-05, "epoch": 0.6944, "percentage": 69.44, "elapsed_time": "7:09:25", "remaining_time": "3:08:59", "throughput": 903.04, "total_tokens": 23267104} {"current_steps": 4345, "total_steps": 6250, "loss": 0.6686, "learning_rate": 1.0612020071591722e-05, "epoch": 0.6952, "percentage": 69.52, "elapsed_time": "7:09:52", "remaining_time": "3:08:28", "throughput": 903.33, "total_tokens": 23298976} {"current_steps": 4350, "total_steps": 6250, "loss": 0.6975, "learning_rate": 1.0560682414443315e-05, "epoch": 0.696, "percentage": 69.6, "elapsed_time": "7:10:18", "remaining_time": "3:07:57", "throughput": 903.6, "total_tokens": 23329552} {"current_steps": 4355, "total_steps": 6250, "loss": 0.7017, "learning_rate": 1.0509435963872422e-05, "epoch": 0.6968, "percentage": 69.68, "elapsed_time": "7:10:42", "remaining_time": "3:07:24", "throughput": 903.93, "total_tokens": 23359664} {"current_steps": 4360, "total_steps": 6250, "loss": 0.6856, "learning_rate": 1.0458281043579482e-05, "epoch": 0.6976, "percentage": 69.76, "elapsed_time": "7:11:19", "remaining_time": "3:06:58", "throughput": 903.65, "total_tokens": 23386320} {"current_steps": 4365, "total_steps": 6250, "loss": 0.6739, "learning_rate": 1.0407217976686775e-05, "epoch": 0.6984, "percentage": 69.84, "elapsed_time": "7:11:47", "remaining_time": "3:06:28", "throughput": 903.84, "total_tokens": 23416512} {"current_steps": 4370, "total_steps": 6250, "loss": 0.6803, "learning_rate": 1.0356247085736386e-05, "epoch": 0.6992, "percentage": 69.92, "elapsed_time": "7:12:10", "remaining_time": "3:05:55", "throughput": 903.94, "total_tokens": 23439904} {"current_steps": 4375, "total_steps": 6250, "loss": 0.7111, "learning_rate": 1.0305368692688174e-05, "epoch": 0.7, "percentage": 70.0, "elapsed_time": "7:12:35", "remaining_time": "3:05:23", "throughput": 904.09, "total_tokens": 23466256} {"current_steps": 4380, "total_steps": 6250, "loss": 0.762, "learning_rate": 1.0254583118917698e-05, "epoch": 0.7008, "percentage": 70.08, "elapsed_time": "7:12:59", "remaining_time": "3:04:51", "throughput": 904.32, "total_tokens": 23493536} {"current_steps": 4385, "total_steps": 6250, "loss": 0.6206, "learning_rate": 1.020389068521426e-05, "epoch": 0.7016, "percentage": 70.16, "elapsed_time": "7:13:20", "remaining_time": "3:04:18", "throughput": 904.43, "total_tokens": 23515632} {"current_steps": 4390, "total_steps": 6250, "loss": 0.6711, "learning_rate": 1.0153291711778826e-05, "epoch": 0.7024, "percentage": 70.24, "elapsed_time": "7:13:44", "remaining_time": "3:03:46", "throughput": 904.56, "total_tokens": 23541152} {"current_steps": 4395, "total_steps": 6250, "loss": 0.7606, "learning_rate": 1.0102786518221997e-05, "epoch": 0.7032, "percentage": 70.32, "elapsed_time": "7:14:11", "remaining_time": "3:03:15", "throughput": 904.58, "total_tokens": 23565424} {"current_steps": 4400, "total_steps": 6250, "loss": 0.7306, "learning_rate": 1.0052375423562038e-05, "epoch": 0.704, "percentage": 70.4, "elapsed_time": "7:14:38", "remaining_time": "3:02:44", "throughput": 904.66, "total_tokens": 23592256} {"current_steps": 4405, "total_steps": 6250, "loss": 0.6121, "learning_rate": 1.0002058746222806e-05, "epoch": 0.7048, "percentage": 70.48, "elapsed_time": "7:15:03", "remaining_time": "3:02:13", "throughput": 904.93, "total_tokens": 23622240} {"current_steps": 4410, "total_steps": 6250, "loss": 0.6273, "learning_rate": 9.951836804031794e-06, "epoch": 0.7056, "percentage": 70.56, "elapsed_time": "7:15:35", "remaining_time": "3:01:44", "throughput": 904.92, "total_tokens": 23650544} {"current_steps": 4415, "total_steps": 6250, "loss": 0.7261, "learning_rate": 9.90170991421808e-06, "epoch": 0.7064, "percentage": 70.64, "elapsed_time": "7:15:57", "remaining_time": "3:01:11", "throughput": 905.12, "total_tokens": 23676016} {"current_steps": 4420, "total_steps": 6250, "loss": 0.8013, "learning_rate": 9.851678393410343e-06, "epoch": 0.7072, "percentage": 70.72, "elapsed_time": "7:16:21", "remaining_time": "3:00:39", "throughput": 905.28, "total_tokens": 23701232} {"current_steps": 4425, "total_steps": 6250, "loss": 0.7189, "learning_rate": 9.801742557634872e-06, "epoch": 0.708, "percentage": 70.8, "elapsed_time": "7:16:46", "remaining_time": "3:00:08", "throughput": 905.58, "total_tokens": 23731984} {"current_steps": 4430, "total_steps": 6250, "loss": 0.7397, "learning_rate": 9.751902722313527e-06, "epoch": 0.7088, "percentage": 70.88, "elapsed_time": "7:17:11", "remaining_time": "2:59:36", "throughput": 905.66, "total_tokens": 23756560} {"current_steps": 4435, "total_steps": 6250, "loss": 0.625, "learning_rate": 9.702159202261801e-06, "epoch": 0.7096, "percentage": 70.96, "elapsed_time": "7:17:33", "remaining_time": "2:59:04", "throughput": 906.0, "total_tokens": 23785504} {"current_steps": 4440, "total_steps": 6250, "loss": 0.7958, "learning_rate": 9.652512311686809e-06, "epoch": 0.7104, "percentage": 71.04, "elapsed_time": "7:17:55", "remaining_time": "2:58:31", "throughput": 906.25, "total_tokens": 23811840} {"current_steps": 4445, "total_steps": 6250, "loss": 0.7092, "learning_rate": 9.602962364185286e-06, "epoch": 0.7112, "percentage": 71.12, "elapsed_time": "7:18:17", "remaining_time": "2:57:58", "throughput": 906.36, "total_tokens": 23834688} {"current_steps": 4450, "total_steps": 6250, "loss": 0.6516, "learning_rate": 9.553509672741645e-06, "epoch": 0.712, "percentage": 71.2, "elapsed_time": "7:18:38", "remaining_time": "2:57:25", "throughput": 906.55, "total_tokens": 23858736} {"current_steps": 4455, "total_steps": 6250, "loss": 0.6276, "learning_rate": 9.504154549725943e-06, "epoch": 0.7128, "percentage": 71.28, "elapsed_time": "7:19:02", "remaining_time": "2:56:53", "throughput": 906.66, "total_tokens": 23883696} {"current_steps": 4460, "total_steps": 6250, "loss": 0.6741, "learning_rate": 9.454897306891972e-06, "epoch": 0.7136, "percentage": 71.36, "elapsed_time": "7:19:23", "remaining_time": "2:56:20", "throughput": 906.94, "total_tokens": 23909904} {"current_steps": 4465, "total_steps": 6250, "loss": 0.7054, "learning_rate": 9.405738255375244e-06, "epoch": 0.7144, "percentage": 71.44, "elapsed_time": "7:19:45", "remaining_time": "2:55:48", "throughput": 907.06, "total_tokens": 23933056} {"current_steps": 4470, "total_steps": 6250, "loss": 0.7593, "learning_rate": 9.356677705691058e-06, "epoch": 0.7152, "percentage": 71.52, "elapsed_time": "7:20:06", "remaining_time": "2:55:15", "throughput": 907.26, "total_tokens": 23957440} {"current_steps": 4475, "total_steps": 6250, "loss": 0.6264, "learning_rate": 9.307715967732491e-06, "epoch": 0.716, "percentage": 71.6, "elapsed_time": "7:20:29", "remaining_time": "2:54:43", "throughput": 907.52, "total_tokens": 23985088} {"current_steps": 4480, "total_steps": 6250, "loss": 0.6596, "learning_rate": 9.258853350768499e-06, "epoch": 0.7168, "percentage": 71.68, "elapsed_time": "7:20:50", "remaining_time": "2:54:10", "throughput": 907.74, "total_tokens": 24010448} {"current_steps": 4485, "total_steps": 6250, "loss": 0.7053, "learning_rate": 9.210090163441929e-06, "epoch": 0.7176, "percentage": 71.76, "elapsed_time": "7:21:10", "remaining_time": "2:53:37", "throughput": 907.98, "total_tokens": 24035040} {"current_steps": 4490, "total_steps": 6250, "loss": 0.6769, "learning_rate": 9.161426713767574e-06, "epoch": 0.7184, "percentage": 71.84, "elapsed_time": "7:21:34", "remaining_time": "2:53:05", "throughput": 908.04, "total_tokens": 24057872} {"current_steps": 4495, "total_steps": 6250, "loss": 0.7486, "learning_rate": 9.112863309130235e-06, "epoch": 0.7192, "percentage": 71.92, "elapsed_time": "7:21:58", "remaining_time": "2:52:33", "throughput": 907.98, "total_tokens": 24077920} {"current_steps": 4500, "total_steps": 6250, "loss": 0.765, "learning_rate": 9.064400256282757e-06, "epoch": 0.72, "percentage": 72.0, "elapsed_time": "7:22:19", "remaining_time": "2:52:01", "throughput": 908.23, "total_tokens": 24104320} {"current_steps": 4505, "total_steps": 6250, "loss": 0.653, "learning_rate": 9.016037861344129e-06, "epoch": 0.7208, "percentage": 72.08, "elapsed_time": "7:22:40", "remaining_time": "2:51:28", "throughput": 908.64, "total_tokens": 24134144} {"current_steps": 4510, "total_steps": 6250, "loss": 0.6412, "learning_rate": 8.967776429797528e-06, "epoch": 0.7216, "percentage": 72.16, "elapsed_time": "7:23:04", "remaining_time": "2:50:56", "throughput": 908.96, "total_tokens": 24164576} {"current_steps": 4515, "total_steps": 6250, "loss": 0.7113, "learning_rate": 8.919616266488373e-06, "epoch": 0.7224, "percentage": 72.24, "elapsed_time": "7:23:27", "remaining_time": "2:50:24", "throughput": 909.24, "total_tokens": 24192736} {"current_steps": 4520, "total_steps": 6250, "loss": 0.8171, "learning_rate": 8.871557675622441e-06, "epoch": 0.7232, "percentage": 72.32, "elapsed_time": "7:23:51", "remaining_time": "2:49:52", "throughput": 909.39, "total_tokens": 24218064} {"current_steps": 4525, "total_steps": 6250, "loss": 0.7845, "learning_rate": 8.8236009607639e-06, "epoch": 0.724, "percentage": 72.4, "elapsed_time": "7:24:14", "remaining_time": "2:49:21", "throughput": 909.59, "total_tokens": 24244832} {"current_steps": 4530, "total_steps": 6250, "loss": 0.7025, "learning_rate": 8.775746424833427e-06, "epoch": 0.7248, "percentage": 72.48, "elapsed_time": "7:24:37", "remaining_time": "2:48:49", "throughput": 909.85, "total_tokens": 24272848} {"current_steps": 4535, "total_steps": 6250, "loss": 0.868, "learning_rate": 8.727994370106288e-06, "epoch": 0.7256, "percentage": 72.56, "elapsed_time": "7:25:02", "remaining_time": "2:48:17", "throughput": 909.97, "total_tokens": 24298240} {"current_steps": 4540, "total_steps": 6250, "loss": 0.6285, "learning_rate": 8.680345098210408e-06, "epoch": 0.7264, "percentage": 72.64, "elapsed_time": "7:25:23", "remaining_time": "2:47:45", "throughput": 910.35, "total_tokens": 24327776} {"current_steps": 4545, "total_steps": 6250, "loss": 0.6583, "learning_rate": 8.632798910124492e-06, "epoch": 0.7272, "percentage": 72.72, "elapsed_time": "7:25:46", "remaining_time": "2:47:13", "throughput": 910.62, "total_tokens": 24355424} {"current_steps": 4550, "total_steps": 6250, "loss": 0.756, "learning_rate": 8.585356106176094e-06, "epoch": 0.728, "percentage": 72.8, "elapsed_time": "7:26:08", "remaining_time": "2:46:41", "throughput": 910.82, "total_tokens": 24381104} {"current_steps": 4555, "total_steps": 6250, "loss": 0.7739, "learning_rate": 8.538016986039754e-06, "epoch": 0.7288, "percentage": 72.88, "elapsed_time": "7:26:28", "remaining_time": "2:46:08", "throughput": 910.97, "total_tokens": 24403760} {"current_steps": 4560, "total_steps": 6250, "loss": 0.6998, "learning_rate": 8.49078184873508e-06, "epoch": 0.7296, "percentage": 72.96, "elapsed_time": "7:26:48", "remaining_time": "2:45:35", "throughput": 911.32, "total_tokens": 24431280} {"current_steps": 4565, "total_steps": 6250, "loss": 0.723, "learning_rate": 8.443650992624877e-06, "epoch": 0.7304, "percentage": 73.04, "elapsed_time": "7:27:09", "remaining_time": "2:45:03", "throughput": 911.64, "total_tokens": 24459120} {"current_steps": 4570, "total_steps": 6250, "loss": 0.7225, "learning_rate": 8.39662471541325e-06, "epoch": 0.7312, "percentage": 73.12, "elapsed_time": "7:27:31", "remaining_time": "2:44:31", "throughput": 911.87, "total_tokens": 24485152} {"current_steps": 4575, "total_steps": 6250, "loss": 0.5801, "learning_rate": 8.34970331414371e-06, "epoch": 0.732, "percentage": 73.2, "elapsed_time": "7:27:53", "remaining_time": "2:43:58", "throughput": 912.14, "total_tokens": 24512416} {"current_steps": 4580, "total_steps": 6250, "loss": 0.6043, "learning_rate": 8.302887085197341e-06, "epoch": 0.7328, "percentage": 73.28, "elapsed_time": "7:28:17", "remaining_time": "2:43:27", "throughput": 912.48, "total_tokens": 24543328} {"current_steps": 4585, "total_steps": 6250, "loss": 0.6533, "learning_rate": 8.256176324290885e-06, "epoch": 0.7336, "percentage": 73.36, "elapsed_time": "7:28:39", "remaining_time": "2:42:55", "throughput": 912.58, "total_tokens": 24566000} {"current_steps": 4590, "total_steps": 6250, "loss": 0.6906, "learning_rate": 8.209571326474896e-06, "epoch": 0.7344, "percentage": 73.44, "elapsed_time": "7:29:09", "remaining_time": "2:42:26", "throughput": 912.59, "total_tokens": 24594080} {"current_steps": 4595, "total_steps": 6250, "loss": 0.6661, "learning_rate": 8.163072386131876e-06, "epoch": 0.7352, "percentage": 73.52, "elapsed_time": "7:29:40", "remaining_time": "2:41:57", "throughput": 912.57, "total_tokens": 24621424} {"current_steps": 4600, "total_steps": 6250, "loss": 0.6663, "learning_rate": 8.116679796974392e-06, "epoch": 0.736, "percentage": 73.6, "elapsed_time": "7:30:01", "remaining_time": "2:41:25", "throughput": 912.7, "total_tokens": 24644288} {"current_steps": 4605, "total_steps": 6250, "loss": 0.7064, "learning_rate": 8.070393852043251e-06, "epoch": 0.7368, "percentage": 73.68, "elapsed_time": "7:30:23", "remaining_time": "2:40:53", "throughput": 913.06, "total_tokens": 24674048} {"current_steps": 4610, "total_steps": 6250, "loss": 0.6837, "learning_rate": 8.024214843705646e-06, "epoch": 0.7376, "percentage": 73.76, "elapsed_time": "7:30:45", "remaining_time": "2:40:21", "throughput": 913.12, "total_tokens": 24696320} {"current_steps": 4615, "total_steps": 6250, "loss": 0.5342, "learning_rate": 7.978143063653298e-06, "epoch": 0.7384, "percentage": 73.84, "elapsed_time": "7:31:13", "remaining_time": "2:39:51", "throughput": 913.42, "total_tokens": 24729280} {"current_steps": 4620, "total_steps": 6250, "loss": 0.6907, "learning_rate": 7.93217880290059e-06, "epoch": 0.7392, "percentage": 73.92, "elapsed_time": "7:31:36", "remaining_time": "2:39:20", "throughput": 913.7, "total_tokens": 24758080} {"current_steps": 4625, "total_steps": 6250, "loss": 0.6856, "learning_rate": 7.886322351782783e-06, "epoch": 0.74, "percentage": 74.0, "elapsed_time": "7:31:58", "remaining_time": "2:38:48", "throughput": 914.03, "total_tokens": 24787472} {"current_steps": 4630, "total_steps": 6250, "loss": 0.713, "learning_rate": 7.840573999954153e-06, "epoch": 0.7408, "percentage": 74.08, "elapsed_time": "7:32:24", "remaining_time": "2:38:17", "throughput": 914.2, "total_tokens": 24815936} {"current_steps": 4635, "total_steps": 6250, "loss": 0.7692, "learning_rate": 7.79493403638614e-06, "epoch": 0.7416, "percentage": 74.16, "elapsed_time": "7:32:45", "remaining_time": "2:37:45", "throughput": 914.39, "total_tokens": 24840096} {"current_steps": 4640, "total_steps": 6250, "loss": 0.7177, "learning_rate": 7.749402749365572e-06, "epoch": 0.7424, "percentage": 74.24, "elapsed_time": "7:33:09", "remaining_time": "2:37:14", "throughput": 914.56, "total_tokens": 24866480} {"current_steps": 4645, "total_steps": 6250, "loss": 0.7124, "learning_rate": 7.703980426492791e-06, "epoch": 0.7432, "percentage": 74.32, "elapsed_time": "7:33:29", "remaining_time": "2:36:41", "throughput": 914.74, "total_tokens": 24889456} {"current_steps": 4650, "total_steps": 6250, "loss": 0.7038, "learning_rate": 7.658667354679883e-06, "epoch": 0.744, "percentage": 74.4, "elapsed_time": "7:33:50", "remaining_time": "2:36:09", "throughput": 914.92, "total_tokens": 24913824} {"current_steps": 4655, "total_steps": 6250, "loss": 0.6662, "learning_rate": 7.613463820148831e-06, "epoch": 0.7448, "percentage": 74.48, "elapsed_time": "7:34:12", "remaining_time": "2:35:37", "throughput": 915.17, "total_tokens": 24940880} {"current_steps": 4660, "total_steps": 6250, "loss": 0.7949, "learning_rate": 7.568370108429732e-06, "epoch": 0.7456, "percentage": 74.56, "elapsed_time": "7:34:35", "remaining_time": "2:35:06", "throughput": 915.33, "total_tokens": 24965696} {"current_steps": 4665, "total_steps": 6250, "loss": 0.7146, "learning_rate": 7.523386504358984e-06, "epoch": 0.7464, "percentage": 74.64, "elapsed_time": "7:34:56", "remaining_time": "2:34:34", "throughput": 915.58, "total_tokens": 24992096} {"current_steps": 4670, "total_steps": 6250, "loss": 0.669, "learning_rate": 7.478513292077463e-06, "epoch": 0.7472, "percentage": 74.72, "elapsed_time": "7:35:22", "remaining_time": "2:34:03", "throughput": 915.9, "total_tokens": 25024320} {"current_steps": 4675, "total_steps": 6250, "loss": 0.7789, "learning_rate": 7.433750755028773e-06, "epoch": 0.748, "percentage": 74.8, "elapsed_time": "7:35:43", "remaining_time": "2:33:31", "throughput": 916.09, "total_tokens": 25049152} {"current_steps": 4680, "total_steps": 6250, "loss": 0.6992, "learning_rate": 7.389099175957429e-06, "epoch": 0.7488, "percentage": 74.88, "elapsed_time": "7:36:03", "remaining_time": "2:32:59", "throughput": 916.46, "total_tokens": 25077328} {"current_steps": 4685, "total_steps": 6250, "loss": 0.6421, "learning_rate": 7.344558836907067e-06, "epoch": 0.7496, "percentage": 74.96, "elapsed_time": "7:36:27", "remaining_time": "2:32:28", "throughput": 916.67, "total_tokens": 25105008} {"current_steps": 4690, "total_steps": 6250, "loss": 0.7656, "learning_rate": 7.300130019218687e-06, "epoch": 0.7504, "percentage": 75.04, "elapsed_time": "7:36:48", "remaining_time": "2:31:56", "throughput": 916.93, "total_tokens": 25131392} {"current_steps": 4695, "total_steps": 6250, "loss": 0.6506, "learning_rate": 7.255813003528833e-06, "epoch": 0.7512, "percentage": 75.12, "elapsed_time": "7:37:10", "remaining_time": "2:31:24", "throughput": 917.24, "total_tokens": 25159984} {"current_steps": 4700, "total_steps": 6250, "loss": 0.6253, "learning_rate": 7.211608069767867e-06, "epoch": 0.752, "percentage": 75.2, "elapsed_time": "7:37:35", "remaining_time": "2:30:54", "throughput": 917.41, "total_tokens": 25188192} {"current_steps": 4705, "total_steps": 6250, "loss": 0.6776, "learning_rate": 7.1675154971581785e-06, "epoch": 0.7528, "percentage": 75.28, "elapsed_time": "7:38:03", "remaining_time": "2:30:24", "throughput": 917.47, "total_tokens": 25215360} {"current_steps": 4710, "total_steps": 6250, "loss": 0.8286, "learning_rate": 7.123535564212422e-06, "epoch": 0.7536, "percentage": 75.36, "elapsed_time": "7:38:26", "remaining_time": "2:29:53", "throughput": 917.62, "total_tokens": 25240384} {"current_steps": 4715, "total_steps": 6250, "loss": 0.6152, "learning_rate": 7.079668548731758e-06, "epoch": 0.7544, "percentage": 75.44, "elapsed_time": "7:38:46", "remaining_time": "2:29:21", "throughput": 917.76, "total_tokens": 25263104} {"current_steps": 4720, "total_steps": 6250, "loss": 0.7227, "learning_rate": 7.035914727804085e-06, "epoch": 0.7552, "percentage": 75.52, "elapsed_time": "7:39:07", "remaining_time": "2:28:49", "throughput": 917.97, "total_tokens": 25288176} {"current_steps": 4725, "total_steps": 6250, "loss": 0.6808, "learning_rate": 6.992274377802327e-06, "epoch": 0.756, "percentage": 75.6, "elapsed_time": "7:39:30", "remaining_time": "2:28:18", "throughput": 918.13, "total_tokens": 25313536} {"current_steps": 4730, "total_steps": 6250, "loss": 0.7039, "learning_rate": 6.94874777438265e-06, "epoch": 0.7568, "percentage": 75.68, "elapsed_time": "7:39:54", "remaining_time": "2:27:47", "throughput": 918.29, "total_tokens": 25339744} {"current_steps": 4735, "total_steps": 6250, "loss": 0.7081, "learning_rate": 6.905335192482737e-06, "epoch": 0.7576, "percentage": 75.76, "elapsed_time": "7:40:20", "remaining_time": "2:27:17", "throughput": 918.44, "total_tokens": 25367440} {"current_steps": 4740, "total_steps": 6250, "loss": 0.6139, "learning_rate": 6.862036906320058e-06, "epoch": 0.7584, "percentage": 75.84, "elapsed_time": "7:40:41", "remaining_time": "2:26:45", "throughput": 918.75, "total_tokens": 25395952} {"current_steps": 4745, "total_steps": 6250, "loss": 0.8142, "learning_rate": 6.818853189390104e-06, "epoch": 0.7592, "percentage": 75.92, "elapsed_time": "7:41:02", "remaining_time": "2:26:13", "throughput": 919.0, "total_tokens": 25421744} {"current_steps": 4750, "total_steps": 6250, "loss": 0.6538, "learning_rate": 6.775784314464717e-06, "epoch": 0.76, "percentage": 76.0, "elapsed_time": "7:41:27", "remaining_time": "2:25:43", "throughput": 919.14, "total_tokens": 25448944} {"current_steps": 4755, "total_steps": 6250, "loss": 0.6409, "learning_rate": 6.732830553590305e-06, "epoch": 0.7608, "percentage": 76.08, "elapsed_time": "7:41:49", "remaining_time": "2:25:11", "throughput": 919.42, "total_tokens": 25476640} {"current_steps": 4760, "total_steps": 6250, "loss": 0.6814, "learning_rate": 6.689992178086174e-06, "epoch": 0.7616, "percentage": 76.16, "elapsed_time": "7:42:14", "remaining_time": "2:24:41", "throughput": 919.55, "total_tokens": 25503328} {"current_steps": 4765, "total_steps": 6250, "loss": 0.739, "learning_rate": 6.647269458542793e-06, "epoch": 0.7624, "percentage": 76.24, "elapsed_time": "7:42:38", "remaining_time": "2:24:10", "throughput": 919.74, "total_tokens": 25530384} {"current_steps": 4770, "total_steps": 6250, "loss": 0.6775, "learning_rate": 6.604662664820063e-06, "epoch": 0.7632, "percentage": 76.32, "elapsed_time": "7:43:02", "remaining_time": "2:23:40", "throughput": 919.96, "total_tokens": 25558880} {"current_steps": 4775, "total_steps": 6250, "loss": 0.8087, "learning_rate": 6.562172066045655e-06, "epoch": 0.764, "percentage": 76.4, "elapsed_time": "7:43:23", "remaining_time": "2:23:08", "throughput": 920.17, "total_tokens": 25584016} {"current_steps": 4780, "total_steps": 6250, "loss": 0.6836, "learning_rate": 6.519797930613289e-06, "epoch": 0.7648, "percentage": 76.48, "elapsed_time": "7:43:45", "remaining_time": "2:22:37", "throughput": 920.45, "total_tokens": 25611712} {"current_steps": 4785, "total_steps": 6250, "loss": 0.7174, "learning_rate": 6.4775405261810364e-06, "epoch": 0.7656, "percentage": 76.56, "elapsed_time": "7:44:10", "remaining_time": "2:22:06", "throughput": 920.67, "total_tokens": 25640928} {"current_steps": 4790, "total_steps": 6250, "loss": 0.6151, "learning_rate": 6.435400119669618e-06, "epoch": 0.7664, "percentage": 76.64, "elapsed_time": "7:44:30", "remaining_time": "2:21:34", "throughput": 920.95, "total_tokens": 25667376} {"current_steps": 4795, "total_steps": 6250, "loss": 0.7291, "learning_rate": 6.3933769772607535e-06, "epoch": 0.7672, "percentage": 76.72, "elapsed_time": "7:44:55", "remaining_time": "2:21:04", "throughput": 921.2, "total_tokens": 25697136} {"current_steps": 4800, "total_steps": 6250, "loss": 0.7215, "learning_rate": 6.3514713643954475e-06, "epoch": 0.768, "percentage": 76.8, "elapsed_time": "7:45:15", "remaining_time": "2:20:32", "throughput": 921.31, "total_tokens": 25718912} {"current_steps": 4805, "total_steps": 6250, "loss": 0.7092, "learning_rate": 6.309683545772327e-06, "epoch": 0.7688, "percentage": 76.88, "elapsed_time": "7:45:37", "remaining_time": "2:20:01", "throughput": 921.56, "total_tokens": 25746400} {"current_steps": 4810, "total_steps": 6250, "loss": 0.6675, "learning_rate": 6.268013785345969e-06, "epoch": 0.7696, "percentage": 76.96, "elapsed_time": "7:46:00", "remaining_time": "2:19:30", "throughput": 921.73, "total_tokens": 25772192} {"current_steps": 4815, "total_steps": 6250, "loss": 0.7428, "learning_rate": 6.226462346325221e-06, "epoch": 0.7704, "percentage": 77.04, "elapsed_time": "7:46:24", "remaining_time": "2:19:00", "throughput": 922.02, "total_tokens": 25802256} {"current_steps": 4820, "total_steps": 6250, "loss": 0.7039, "learning_rate": 6.185029491171554e-06, "epoch": 0.7712, "percentage": 77.12, "elapsed_time": "7:46:45", "remaining_time": "2:18:28", "throughput": 922.32, "total_tokens": 25829952} {"current_steps": 4825, "total_steps": 6250, "loss": 0.6733, "learning_rate": 6.143715481597404e-06, "epoch": 0.772, "percentage": 77.2, "elapsed_time": "7:47:07", "remaining_time": "2:17:57", "throughput": 922.49, "total_tokens": 25854752} {"current_steps": 4830, "total_steps": 6250, "loss": 0.7872, "learning_rate": 6.102520578564508e-06, "epoch": 0.7728, "percentage": 77.28, "elapsed_time": "7:47:27", "remaining_time": "2:17:25", "throughput": 922.77, "total_tokens": 25881264} {"current_steps": 4835, "total_steps": 6250, "loss": 0.7586, "learning_rate": 6.061445042282271e-06, "epoch": 0.7736, "percentage": 77.36, "elapsed_time": "7:47:46", "remaining_time": "2:16:53", "throughput": 923.01, "total_tokens": 25906064} {"current_steps": 4840, "total_steps": 6250, "loss": 0.7269, "learning_rate": 6.020489132206089e-06, "epoch": 0.7744, "percentage": 77.44, "elapsed_time": "7:48:06", "remaining_time": "2:16:22", "throughput": 923.25, "total_tokens": 25931280} {"current_steps": 4845, "total_steps": 6250, "loss": 0.6304, "learning_rate": 5.979653107035757e-06, "epoch": 0.7752, "percentage": 77.52, "elapsed_time": "7:48:30", "remaining_time": "2:15:51", "throughput": 923.47, "total_tokens": 25958880} {"current_steps": 4850, "total_steps": 6250, "loss": 0.6855, "learning_rate": 5.9389372247138e-06, "epoch": 0.776, "percentage": 77.6, "elapsed_time": "7:48:50", "remaining_time": "2:15:20", "throughput": 923.72, "total_tokens": 25984528} {"current_steps": 4855, "total_steps": 6250, "loss": 0.7141, "learning_rate": 5.898341742423865e-06, "epoch": 0.7768, "percentage": 77.68, "elapsed_time": "7:49:12", "remaining_time": "2:14:49", "throughput": 924.04, "total_tokens": 26014272} {"current_steps": 4860, "total_steps": 6250, "loss": 0.668, "learning_rate": 5.857866916589089e-06, "epoch": 0.7776, "percentage": 77.76, "elapsed_time": "7:49:36", "remaining_time": "2:14:18", "throughput": 924.37, "total_tokens": 26045888} {"current_steps": 4865, "total_steps": 6250, "loss": 0.7404, "learning_rate": 5.81751300287045e-06, "epoch": 0.7784, "percentage": 77.84, "elapsed_time": "7:50:01", "remaining_time": "2:13:48", "throughput": 924.4, "total_tokens": 26069232} {"current_steps": 4870, "total_steps": 6250, "loss": 0.633, "learning_rate": 5.777280256165218e-06, "epoch": 0.7792, "percentage": 77.92, "elapsed_time": "7:50:24", "remaining_time": "2:13:17", "throughput": 924.59, "total_tokens": 26095936} {"current_steps": 4875, "total_steps": 6250, "loss": 0.6365, "learning_rate": 5.737168930605272e-06, "epoch": 0.78, "percentage": 78.0, "elapsed_time": "7:50:47", "remaining_time": "2:12:47", "throughput": 924.71, "total_tokens": 26121184} {"current_steps": 4880, "total_steps": 6250, "loss": 0.6427, "learning_rate": 5.6971792795555505e-06, "epoch": 0.7808, "percentage": 78.08, "elapsed_time": "7:51:09", "remaining_time": "2:12:16", "throughput": 924.93, "total_tokens": 26147504} {"current_steps": 4885, "total_steps": 6250, "loss": 0.6509, "learning_rate": 5.6573115556124325e-06, "epoch": 0.7816, "percentage": 78.16, "elapsed_time": "7:51:31", "remaining_time": "2:11:45", "throughput": 925.16, "total_tokens": 26174208} {"current_steps": 4890, "total_steps": 6250, "loss": 0.7382, "learning_rate": 5.617566010602113e-06, "epoch": 0.7824, "percentage": 78.24, "elapsed_time": "7:51:51", "remaining_time": "2:11:13", "throughput": 925.43, "total_tokens": 26200112} {"current_steps": 4895, "total_steps": 6250, "loss": 0.7537, "learning_rate": 5.577942895579064e-06, "epoch": 0.7832, "percentage": 78.32, "elapsed_time": "7:52:14", "remaining_time": "2:10:43", "throughput": 925.65, "total_tokens": 26227952} {"current_steps": 4900, "total_steps": 6250, "loss": 0.673, "learning_rate": 5.538442460824417e-06, "epoch": 0.784, "percentage": 78.4, "elapsed_time": "7:52:41", "remaining_time": "2:10:13", "throughput": 925.89, "total_tokens": 26259392} {"current_steps": 4905, "total_steps": 6250, "loss": 0.6684, "learning_rate": 5.499064955844382e-06, "epoch": 0.7848, "percentage": 78.48, "elapsed_time": "7:53:02", "remaining_time": "2:09:42", "throughput": 926.11, "total_tokens": 26285456} {"current_steps": 4910, "total_steps": 6250, "loss": 0.7051, "learning_rate": 5.4598106293686916e-06, "epoch": 0.7856, "percentage": 78.56, "elapsed_time": "7:53:26", "remaining_time": "2:09:12", "throughput": 926.43, "total_tokens": 26316544} {"current_steps": 4915, "total_steps": 6250, "loss": 0.6481, "learning_rate": 5.420679729348993e-06, "epoch": 0.7864, "percentage": 78.64, "elapsed_time": "7:53:47", "remaining_time": "2:08:41", "throughput": 926.63, "total_tokens": 26341840} {"current_steps": 4920, "total_steps": 6250, "loss": 0.7953, "learning_rate": 5.381672502957324e-06, "epoch": 0.7872, "percentage": 78.72, "elapsed_time": "7:54:08", "remaining_time": "2:08:10", "throughput": 926.97, "total_tokens": 26371008} {"current_steps": 4925, "total_steps": 6250, "loss": 0.6966, "learning_rate": 5.342789196584527e-06, "epoch": 0.788, "percentage": 78.8, "elapsed_time": "7:54:32", "remaining_time": "2:07:40", "throughput": 927.22, "total_tokens": 26400048} {"current_steps": 4930, "total_steps": 6250, "loss": 0.6804, "learning_rate": 5.304030055838705e-06, "epoch": 0.7888, "percentage": 78.88, "elapsed_time": "7:54:54", "remaining_time": "2:07:09", "throughput": 927.39, "total_tokens": 26425408} {"current_steps": 4935, "total_steps": 6250, "loss": 0.6282, "learning_rate": 5.26539532554364e-06, "epoch": 0.7896, "percentage": 78.96, "elapsed_time": "7:55:17", "remaining_time": "2:06:38", "throughput": 927.58, "total_tokens": 26452352} {"current_steps": 4940, "total_steps": 6250, "loss": 0.588, "learning_rate": 5.226885249737293e-06, "epoch": 0.7904, "percentage": 79.04, "elapsed_time": "7:55:39", "remaining_time": "2:06:08", "throughput": 927.81, "total_tokens": 26479456} {"current_steps": 4945, "total_steps": 6250, "loss": 0.738, "learning_rate": 5.1885000716702355e-06, "epoch": 0.7912, "percentage": 79.12, "elapsed_time": "7:56:01", "remaining_time": "2:05:37", "throughput": 928.01, "total_tokens": 26504912} {"current_steps": 4950, "total_steps": 6250, "loss": 0.661, "learning_rate": 5.150240033804116e-06, "epoch": 0.792, "percentage": 79.2, "elapsed_time": "7:56:24", "remaining_time": "2:05:07", "throughput": 928.05, "total_tokens": 26528320} {"current_steps": 4955, "total_steps": 6250, "loss": 0.8033, "learning_rate": 5.112105377810128e-06, "epoch": 0.7928, "percentage": 79.28, "elapsed_time": "7:56:48", "remaining_time": "2:04:36", "throughput": 928.19, "total_tokens": 26553984} {"current_steps": 4960, "total_steps": 6250, "loss": 0.6161, "learning_rate": 5.074096344567475e-06, "epoch": 0.7936, "percentage": 79.36, "elapsed_time": "7:57:11", "remaining_time": "2:04:06", "throughput": 928.44, "total_tokens": 26582768} {"current_steps": 4965, "total_steps": 6250, "loss": 0.7286, "learning_rate": 5.036213174161877e-06, "epoch": 0.7944, "percentage": 79.44, "elapsed_time": "7:57:33", "remaining_time": "2:03:35", "throughput": 928.7, "total_tokens": 26610272} {"current_steps": 4970, "total_steps": 6250, "loss": 0.7065, "learning_rate": 4.998456105884025e-06, "epoch": 0.7952, "percentage": 79.52, "elapsed_time": "7:57:55", "remaining_time": "2:03:05", "throughput": 928.9, "total_tokens": 26636352} {"current_steps": 4975, "total_steps": 6250, "loss": 0.6842, "learning_rate": 4.960825378228082e-06, "epoch": 0.796, "percentage": 79.6, "elapsed_time": "7:58:18", "remaining_time": "2:02:34", "throughput": 929.23, "total_tokens": 26667824} {"current_steps": 4980, "total_steps": 6250, "loss": 0.7069, "learning_rate": 4.9233212288901845e-06, "epoch": 0.7968, "percentage": 79.68, "elapsed_time": "7:58:45", "remaining_time": "2:02:05", "throughput": 929.43, "total_tokens": 26698272} {"current_steps": 4985, "total_steps": 6250, "loss": 0.5942, "learning_rate": 4.885943894766909e-06, "epoch": 0.7976, "percentage": 79.76, "elapsed_time": "7:59:12", "remaining_time": "2:01:36", "throughput": 929.53, "total_tokens": 26725984} {"current_steps": 4990, "total_steps": 6250, "loss": 0.8419, "learning_rate": 4.848693611953825e-06, "epoch": 0.7984, "percentage": 79.84, "elapsed_time": "7:59:35", "remaining_time": "2:01:05", "throughput": 929.66, "total_tokens": 26751360} {"current_steps": 4995, "total_steps": 6250, "loss": 0.5888, "learning_rate": 4.811570615743952e-06, "epoch": 0.7992, "percentage": 79.92, "elapsed_time": "8:00:01", "remaining_time": "2:00:36", "throughput": 929.91, "total_tokens": 26782672} {"current_steps": 5000, "total_steps": 6250, "loss": 0.6504, "learning_rate": 4.7745751406263165e-06, "epoch": 0.8, "percentage": 80.0, "elapsed_time": "8:00:28", "remaining_time": "2:00:07", "throughput": 929.97, "total_tokens": 26809120} {"current_steps": 5005, "total_steps": 6250, "loss": 0.6603, "learning_rate": 4.737707420284451e-06, "epoch": 0.8008, "percentage": 80.08, "elapsed_time": "8:00:54", "remaining_time": "1:59:37", "throughput": 930.16, "total_tokens": 26839552} {"current_steps": 5010, "total_steps": 6250, "loss": 0.627, "learning_rate": 4.700967687594901e-06, "epoch": 0.8016, "percentage": 80.16, "elapsed_time": "8:01:28", "remaining_time": "1:59:10", "throughput": 929.94, "total_tokens": 26864416} {"current_steps": 5015, "total_steps": 6250, "loss": 0.6509, "learning_rate": 4.664356174625795e-06, "epoch": 0.8024, "percentage": 80.24, "elapsed_time": "8:02:34", "remaining_time": "1:58:50", "throughput": 928.73, "total_tokens": 26890368} {"current_steps": 5020, "total_steps": 6250, "loss": 0.6673, "learning_rate": 4.627873112635345e-06, "epoch": 0.8032, "percentage": 80.32, "elapsed_time": "8:03:20", "remaining_time": "1:58:25", "throughput": 928.11, "total_tokens": 26916064} {"current_steps": 5025, "total_steps": 6250, "loss": 0.7972, "learning_rate": 4.591518732070402e-06, "epoch": 0.804, "percentage": 80.4, "elapsed_time": "8:04:02", "remaining_time": "1:57:59", "throughput": 927.64, "total_tokens": 26940528} {"current_steps": 5030, "total_steps": 6250, "loss": 0.6977, "learning_rate": 4.5552932625649944e-06, "epoch": 0.8048, "percentage": 80.48, "elapsed_time": "8:04:36", "remaining_time": "1:57:32", "throughput": 927.38, "total_tokens": 26965296} {"current_steps": 5035, "total_steps": 6250, "loss": 0.8094, "learning_rate": 4.5191969329388625e-06, "epoch": 0.8056, "percentage": 80.56, "elapsed_time": "8:05:09", "remaining_time": "1:57:04", "throughput": 927.12, "total_tokens": 26988240} {"current_steps": 5040, "total_steps": 6250, "loss": 0.7441, "learning_rate": 4.483229971196054e-06, "epoch": 0.8064, "percentage": 80.64, "elapsed_time": "8:05:36", "remaining_time": "1:56:35", "throughput": 927.22, "total_tokens": 27015632} {"current_steps": 5045, "total_steps": 6250, "loss": 0.6618, "learning_rate": 4.44739260452344e-06, "epoch": 0.8072, "percentage": 80.72, "elapsed_time": "8:06:19", "remaining_time": "1:56:09", "throughput": 926.71, "total_tokens": 27040528} {"current_steps": 5050, "total_steps": 6250, "loss": 0.7527, "learning_rate": 4.411685059289314e-06, "epoch": 0.808, "percentage": 80.8, "elapsed_time": "8:06:54", "remaining_time": "1:55:42", "throughput": 926.46, "total_tokens": 27066560} {"current_steps": 5055, "total_steps": 6250, "loss": 0.7844, "learning_rate": 4.376107561041937e-06, "epoch": 0.8088, "percentage": 80.88, "elapsed_time": "8:07:17", "remaining_time": "1:55:11", "throughput": 926.52, "total_tokens": 27089408} {"current_steps": 5060, "total_steps": 6250, "loss": 0.7598, "learning_rate": 4.340660334508115e-06, "epoch": 0.8096, "percentage": 80.96, "elapsed_time": "8:07:40", "remaining_time": "1:54:41", "throughput": 926.67, "total_tokens": 27114832} {"current_steps": 5065, "total_steps": 6250, "loss": 0.6645, "learning_rate": 4.305343603591802e-06, "epoch": 0.8104, "percentage": 81.04, "elapsed_time": "8:08:02", "remaining_time": "1:54:10", "throughput": 926.86, "total_tokens": 27140320} {"current_steps": 5070, "total_steps": 6250, "loss": 0.7065, "learning_rate": 4.270157591372667e-06, "epoch": 0.8112, "percentage": 81.12, "elapsed_time": "8:08:27", "remaining_time": "1:53:40", "throughput": 927.12, "total_tokens": 27171200} {"current_steps": 5075, "total_steps": 6250, "loss": 0.7481, "learning_rate": 4.235102520104681e-06, "epoch": 0.812, "percentage": 81.2, "elapsed_time": "8:08:49", "remaining_time": "1:53:10", "throughput": 927.23, "total_tokens": 27195056} {"current_steps": 5080, "total_steps": 6250, "loss": 0.6154, "learning_rate": 4.200178611214736e-06, "epoch": 0.8128, "percentage": 81.28, "elapsed_time": "8:09:12", "remaining_time": "1:52:40", "throughput": 927.39, "total_tokens": 27220816} {"current_steps": 5085, "total_steps": 6250, "loss": 0.6661, "learning_rate": 4.165386085301212e-06, "epoch": 0.8136, "percentage": 81.36, "elapsed_time": "8:09:33", "remaining_time": "1:52:09", "throughput": 927.58, "total_tokens": 27246400} {"current_steps": 5090, "total_steps": 6250, "loss": 0.7043, "learning_rate": 4.130725162132612e-06, "epoch": 0.8144, "percentage": 81.44, "elapsed_time": "8:09:54", "remaining_time": "1:51:38", "throughput": 927.73, "total_tokens": 27269936} {"current_steps": 5095, "total_steps": 6250, "loss": 0.8173, "learning_rate": 4.096196060646168e-06, "epoch": 0.8152, "percentage": 81.52, "elapsed_time": "8:10:19", "remaining_time": "1:51:09", "throughput": 927.72, "total_tokens": 27293488} {"current_steps": 5100, "total_steps": 6250, "loss": 0.7154, "learning_rate": 4.061798998946459e-06, "epoch": 0.816, "percentage": 81.6, "elapsed_time": "8:10:49", "remaining_time": "1:50:40", "throughput": 927.65, "total_tokens": 27318592} {"current_steps": 5105, "total_steps": 6250, "loss": 0.6336, "learning_rate": 4.027534194304005e-06, "epoch": 0.8168, "percentage": 81.68, "elapsed_time": "8:11:14", "remaining_time": "1:50:10", "throughput": 927.71, "total_tokens": 27343616} {"current_steps": 5110, "total_steps": 6250, "loss": 0.7355, "learning_rate": 3.99340186315395e-06, "epoch": 0.8176, "percentage": 81.76, "elapsed_time": "8:11:36", "remaining_time": "1:49:40", "throughput": 927.88, "total_tokens": 27369216} {"current_steps": 5115, "total_steps": 6250, "loss": 0.6034, "learning_rate": 3.959402221094635e-06, "epoch": 0.8184, "percentage": 81.84, "elapsed_time": "8:12:01", "remaining_time": "1:49:10", "throughput": 928.1, "total_tokens": 27398704} {"current_steps": 5120, "total_steps": 6250, "loss": 0.7962, "learning_rate": 3.925535482886286e-06, "epoch": 0.8192, "percentage": 81.92, "elapsed_time": "8:12:26", "remaining_time": "1:48:40", "throughput": 928.18, "total_tokens": 27424176} {"current_steps": 5125, "total_steps": 6250, "loss": 0.7289, "learning_rate": 3.891801862449629e-06, "epoch": 0.82, "percentage": 82.0, "elapsed_time": "8:12:53", "remaining_time": "1:48:11", "throughput": 928.29, "total_tokens": 27452656} {"current_steps": 5130, "total_steps": 6250, "loss": 0.6644, "learning_rate": 3.858201572864537e-06, "epoch": 0.8208, "percentage": 82.08, "elapsed_time": "8:13:20", "remaining_time": "1:47:42", "throughput": 928.31, "total_tokens": 27478656} {"current_steps": 5135, "total_steps": 6250, "loss": 0.7519, "learning_rate": 3.824734826368703e-06, "epoch": 0.8216, "percentage": 82.16, "elapsed_time": "8:13:45", "remaining_time": "1:47:12", "throughput": 928.5, "total_tokens": 27507184} {"current_steps": 5140, "total_steps": 6250, "loss": 0.7611, "learning_rate": 3.7914018343562895e-06, "epoch": 0.8224, "percentage": 82.24, "elapsed_time": "8:14:06", "remaining_time": "1:46:42", "throughput": 928.82, "total_tokens": 27536112} {"current_steps": 5145, "total_steps": 6250, "loss": 0.6713, "learning_rate": 3.75820280737659e-06, "epoch": 0.8232, "percentage": 82.32, "elapsed_time": "8:14:28", "remaining_time": "1:46:12", "throughput": 929.04, "total_tokens": 27563728} {"current_steps": 5150, "total_steps": 6250, "loss": 0.6522, "learning_rate": 3.725137955132707e-06, "epoch": 0.824, "percentage": 82.4, "elapsed_time": "8:14:53", "remaining_time": "1:45:42", "throughput": 929.07, "total_tokens": 27587120} {"current_steps": 5155, "total_steps": 6250, "loss": 0.7707, "learning_rate": 3.692207486480209e-06, "epoch": 0.8248, "percentage": 82.48, "elapsed_time": "8:15:15", "remaining_time": "1:45:12", "throughput": 929.08, "total_tokens": 27608240} {"current_steps": 5160, "total_steps": 6250, "loss": 0.6148, "learning_rate": 3.6594116094258337e-06, "epoch": 0.8256, "percentage": 82.56, "elapsed_time": "8:15:42", "remaining_time": "1:44:42", "throughput": 929.24, "total_tokens": 27637840} {"current_steps": 5165, "total_steps": 6250, "loss": 0.6884, "learning_rate": 3.626750531126169e-06, "epoch": 0.8264, "percentage": 82.64, "elapsed_time": "8:16:06", "remaining_time": "1:44:13", "throughput": 929.29, "total_tokens": 27662144} {"current_steps": 5170, "total_steps": 6250, "loss": 0.6954, "learning_rate": 3.594224457886336e-06, "epoch": 0.8272, "percentage": 82.72, "elapsed_time": "8:16:46", "remaining_time": "1:43:46", "throughput": 929.04, "total_tokens": 27691184} {"current_steps": 5175, "total_steps": 6250, "loss": 0.6736, "learning_rate": 3.561833595158698e-06, "epoch": 0.828, "percentage": 82.8, "elapsed_time": "8:17:07", "remaining_time": "1:43:16", "throughput": 929.32, "total_tokens": 27719376} {"current_steps": 5180, "total_steps": 6250, "loss": 0.7575, "learning_rate": 3.529578147541532e-06, "epoch": 0.8288, "percentage": 82.88, "elapsed_time": "8:17:35", "remaining_time": "1:42:46", "throughput": 929.46, "total_tokens": 27749248} {"current_steps": 5185, "total_steps": 6250, "loss": 0.6607, "learning_rate": 3.4974583187777852e-06, "epoch": 0.8296, "percentage": 82.96, "elapsed_time": "8:17:58", "remaining_time": "1:42:17", "throughput": 929.74, "total_tokens": 27779136} {"current_steps": 5190, "total_steps": 6250, "loss": 0.844, "learning_rate": 3.4654743117537524e-06, "epoch": 0.8304, "percentage": 83.04, "elapsed_time": "8:18:18", "remaining_time": "1:41:46", "throughput": 929.89, "total_tokens": 27802592} {"current_steps": 5195, "total_steps": 6250, "loss": 0.6596, "learning_rate": 3.433626328497805e-06, "epoch": 0.8312, "percentage": 83.12, "elapsed_time": "8:18:40", "remaining_time": "1:41:16", "throughput": 930.04, "total_tokens": 27826864} {"current_steps": 5200, "total_steps": 6250, "loss": 0.7834, "learning_rate": 3.4019145701791184e-06, "epoch": 0.832, "percentage": 83.2, "elapsed_time": "8:19:01", "remaining_time": "1:40:45", "throughput": 930.21, "total_tokens": 27851680} {"current_steps": 5205, "total_steps": 6250, "loss": 0.6874, "learning_rate": 3.3703392371063845e-06, "epoch": 0.8328, "percentage": 83.28, "elapsed_time": "8:19:25", "remaining_time": "1:40:16", "throughput": 930.41, "total_tokens": 27880208} {"current_steps": 5210, "total_steps": 6250, "loss": 0.6468, "learning_rate": 3.338900528726571e-06, "epoch": 0.8336, "percentage": 83.36, "elapsed_time": "8:19:47", "remaining_time": "1:39:45", "throughput": 930.64, "total_tokens": 27907392} {"current_steps": 5215, "total_steps": 6250, "loss": 0.6675, "learning_rate": 3.3075986436236493e-06, "epoch": 0.8344, "percentage": 83.44, "elapsed_time": "8:20:12", "remaining_time": "1:39:16", "throughput": 930.75, "total_tokens": 27934560} {"current_steps": 5220, "total_steps": 6250, "loss": 0.6704, "learning_rate": 3.2764337795173435e-06, "epoch": 0.8352, "percentage": 83.52, "elapsed_time": "8:20:38", "remaining_time": "1:38:47", "throughput": 930.91, "total_tokens": 27963248} {"current_steps": 5225, "total_steps": 6250, "loss": 0.6903, "learning_rate": 3.245406133261858e-06, "epoch": 0.836, "percentage": 83.6, "elapsed_time": "8:21:03", "remaining_time": "1:38:17", "throughput": 931.04, "total_tokens": 27989872} {"current_steps": 5230, "total_steps": 6250, "loss": 0.7441, "learning_rate": 3.2145159008446807e-06, "epoch": 0.8368, "percentage": 83.68, "elapsed_time": "8:21:24", "remaining_time": "1:37:47", "throughput": 931.12, "total_tokens": 28012208} {"current_steps": 5235, "total_steps": 6250, "loss": 0.6636, "learning_rate": 3.1837632773853098e-06, "epoch": 0.8376, "percentage": 83.76, "elapsed_time": "8:21:53", "remaining_time": "1:37:18", "throughput": 931.2, "total_tokens": 28041200} {"current_steps": 5240, "total_steps": 6250, "loss": 0.7246, "learning_rate": 3.15314845713402e-06, "epoch": 0.8384, "percentage": 83.84, "elapsed_time": "8:22:17", "remaining_time": "1:36:49", "throughput": 931.33, "total_tokens": 28068272} {"current_steps": 5245, "total_steps": 6250, "loss": 0.6583, "learning_rate": 3.122671633470664e-06, "epoch": 0.8392, "percentage": 83.92, "elapsed_time": "8:22:40", "remaining_time": "1:36:19", "throughput": 931.44, "total_tokens": 28092768} {"current_steps": 5250, "total_steps": 6250, "loss": 0.6823, "learning_rate": 3.0923329989034132e-06, "epoch": 0.84, "percentage": 84.0, "elapsed_time": "8:23:05", "remaining_time": "1:35:49", "throughput": 931.69, "total_tokens": 28122944} {"current_steps": 5255, "total_steps": 6250, "loss": 0.7467, "learning_rate": 3.062132745067581e-06, "epoch": 0.8408, "percentage": 84.08, "elapsed_time": "8:23:27", "remaining_time": "1:35:19", "throughput": 931.93, "total_tokens": 28151424} {"current_steps": 5260, "total_steps": 6250, "loss": 0.7541, "learning_rate": 3.0320710627243813e-06, "epoch": 0.8416, "percentage": 84.16, "elapsed_time": "8:23:54", "remaining_time": "1:34:50", "throughput": 931.94, "total_tokens": 28176752} {"current_steps": 5265, "total_steps": 6250, "loss": 0.6829, "learning_rate": 3.002148141759739e-06, "epoch": 0.8424, "percentage": 84.24, "elapsed_time": "8:24:47", "remaining_time": "1:34:26", "throughput": 931.26, "total_tokens": 28205456} {"current_steps": 5270, "total_steps": 6250, "loss": 0.692, "learning_rate": 2.97236417118309e-06, "epoch": 0.8432, "percentage": 84.32, "elapsed_time": "8:25:29", "remaining_time": "1:33:59", "throughput": 930.8, "total_tokens": 28230304} {"current_steps": 5275, "total_steps": 6250, "loss": 0.7628, "learning_rate": 2.942719339126171e-06, "epoch": 0.844, "percentage": 84.4, "elapsed_time": "8:25:51", "remaining_time": "1:33:30", "throughput": 930.94, "total_tokens": 28255536} {"current_steps": 5280, "total_steps": 6250, "loss": 0.6972, "learning_rate": 2.9132138328418573e-06, "epoch": 0.8448, "percentage": 84.48, "elapsed_time": "8:26:13", "remaining_time": "1:33:00", "throughput": 931.06, "total_tokens": 28279600} {"current_steps": 5285, "total_steps": 6250, "loss": 0.6801, "learning_rate": 2.8838478387029606e-06, "epoch": 0.8456, "percentage": 84.56, "elapsed_time": "8:26:38", "remaining_time": "1:32:30", "throughput": 931.12, "total_tokens": 28304688} {"current_steps": 5290, "total_steps": 6250, "loss": 0.6697, "learning_rate": 2.8546215422010638e-06, "epoch": 0.8464, "percentage": 84.64, "elapsed_time": "8:27:09", "remaining_time": "1:32:02", "throughput": 931.06, "total_tokens": 28331584} {"current_steps": 5295, "total_steps": 6250, "loss": 0.6816, "learning_rate": 2.8255351279453446e-06, "epoch": 0.8472, "percentage": 84.72, "elapsed_time": "8:27:43", "remaining_time": "1:31:34", "throughput": 930.97, "total_tokens": 28360256} {"current_steps": 5300, "total_steps": 6250, "loss": 0.7763, "learning_rate": 2.7965887796613884e-06, "epoch": 0.848, "percentage": 84.8, "elapsed_time": "8:28:14", "remaining_time": "1:31:06", "throughput": 930.82, "total_tokens": 28385168} {"current_steps": 5305, "total_steps": 6250, "loss": 0.7837, "learning_rate": 2.767782680190073e-06, "epoch": 0.8488, "percentage": 84.88, "elapsed_time": "8:28:46", "remaining_time": "1:30:37", "throughput": 930.58, "total_tokens": 28407248} {"current_steps": 5310, "total_steps": 6250, "loss": 0.6975, "learning_rate": 2.739117011486378e-06, "epoch": 0.8496, "percentage": 84.96, "elapsed_time": "8:29:19", "remaining_time": "1:30:09", "throughput": 930.47, "total_tokens": 28434304} {"current_steps": 5315, "total_steps": 6250, "loss": 0.7119, "learning_rate": 2.710591954618247e-06, "epoch": 0.8504, "percentage": 85.04, "elapsed_time": "8:29:55", "remaining_time": "1:29:42", "throughput": 930.39, "total_tokens": 28465424} {"current_steps": 5320, "total_steps": 6250, "loss": 0.7644, "learning_rate": 2.6822076897654452e-06, "epoch": 0.8512, "percentage": 85.12, "elapsed_time": "8:30:31", "remaining_time": "1:29:14", "throughput": 930.22, "total_tokens": 28494416} {"current_steps": 5325, "total_steps": 6250, "loss": 0.644, "learning_rate": 2.6539643962184057e-06, "epoch": 0.852, "percentage": 85.2, "elapsed_time": "8:31:04", "remaining_time": "1:28:46", "throughput": 930.05, "total_tokens": 28519552} {"current_steps": 5330, "total_steps": 6250, "loss": 0.7378, "learning_rate": 2.6258622523771287e-06, "epoch": 0.8528, "percentage": 85.28, "elapsed_time": "8:31:35", "remaining_time": "1:28:18", "throughput": 929.95, "total_tokens": 28545632} {"current_steps": 5335, "total_steps": 6250, "loss": 0.7267, "learning_rate": 2.5979014357500248e-06, "epoch": 0.8536, "percentage": 85.36, "elapsed_time": "8:32:09", "remaining_time": "1:27:50", "throughput": 929.77, "total_tokens": 28571440} {"current_steps": 5340, "total_steps": 6250, "loss": 0.6015, "learning_rate": 2.570082122952816e-06, "epoch": 0.8544, "percentage": 85.44, "elapsed_time": "8:32:41", "remaining_time": "1:27:22", "throughput": 929.71, "total_tokens": 28599472} {"current_steps": 5345, "total_steps": 6250, "loss": 0.6327, "learning_rate": 2.5424044897073895e-06, "epoch": 0.8552, "percentage": 85.52, "elapsed_time": "8:33:15", "remaining_time": "1:26:54", "throughput": 929.65, "total_tokens": 28629136} {"current_steps": 5350, "total_steps": 6250, "loss": 0.739, "learning_rate": 2.514868710840723e-06, "epoch": 0.856, "percentage": 85.6, "elapsed_time": "8:33:46", "remaining_time": "1:26:25", "throughput": 929.36, "total_tokens": 28648928} {"current_steps": 5355, "total_steps": 6250, "loss": 0.7279, "learning_rate": 2.4874749602837697e-06, "epoch": 0.8568, "percentage": 85.68, "elapsed_time": "8:34:18", "remaining_time": "1:25:57", "throughput": 929.23, "total_tokens": 28675056} {"current_steps": 5360, "total_steps": 6250, "loss": 0.726, "learning_rate": 2.4602234110703364e-06, "epoch": 0.8576, "percentage": 85.76, "elapsed_time": "8:34:50", "remaining_time": "1:25:29", "throughput": 929.04, "total_tokens": 28698416} {"current_steps": 5365, "total_steps": 6250, "loss": 0.7046, "learning_rate": 2.43311423533602e-06, "epoch": 0.8584, "percentage": 85.84, "elapsed_time": "8:35:25", "remaining_time": "1:25:01", "throughput": 929.0, "total_tokens": 28729856} {"current_steps": 5370, "total_steps": 6250, "loss": 0.6922, "learning_rate": 2.406147604317119e-06, "epoch": 0.8592, "percentage": 85.92, "elapsed_time": "8:35:59", "remaining_time": "1:24:33", "throughput": 928.87, "total_tokens": 28757360} {"current_steps": 5375, "total_steps": 6250, "loss": 0.6664, "learning_rate": 2.379323688349516e-06, "epoch": 0.86, "percentage": 86.0, "elapsed_time": "8:36:30", "remaining_time": "1:24:04", "throughput": 928.69, "total_tokens": 28780624} {"current_steps": 5380, "total_steps": 6250, "loss": 0.6532, "learning_rate": 2.3526426568676483e-06, "epoch": 0.8608, "percentage": 86.08, "elapsed_time": "8:37:04", "remaining_time": "1:23:36", "throughput": 928.49, "total_tokens": 28805616} {"current_steps": 5385, "total_steps": 6250, "loss": 0.6678, "learning_rate": 2.326104678403415e-06, "epoch": 0.8616, "percentage": 86.16, "elapsed_time": "8:37:36", "remaining_time": "1:23:08", "throughput": 928.41, "total_tokens": 28833504} {"current_steps": 5390, "total_steps": 6250, "loss": 0.6152, "learning_rate": 2.299709920585108e-06, "epoch": 0.8624, "percentage": 86.24, "elapsed_time": "8:38:10", "remaining_time": "1:22:40", "throughput": 928.35, "total_tokens": 28862704} {"current_steps": 5395, "total_steps": 6250, "loss": 0.7131, "learning_rate": 2.2734585501363673e-06, "epoch": 0.8632, "percentage": 86.32, "elapsed_time": "8:38:41", "remaining_time": "1:22:12", "throughput": 928.17, "total_tokens": 28886224} {"current_steps": 5400, "total_steps": 6250, "loss": 0.735, "learning_rate": 2.2473507328751086e-06, "epoch": 0.864, "percentage": 86.4, "elapsed_time": "8:39:13", "remaining_time": "1:21:43", "throughput": 928.05, "total_tokens": 28911760} {"current_steps": 5405, "total_steps": 6250, "loss": 0.6706, "learning_rate": 2.2213866337125022e-06, "epoch": 0.8648, "percentage": 86.48, "elapsed_time": "8:39:48", "remaining_time": "1:21:15", "throughput": 927.95, "total_tokens": 28941360} {"current_steps": 5410, "total_steps": 6250, "loss": 0.7683, "learning_rate": 2.1955664166519036e-06, "epoch": 0.8656, "percentage": 86.56, "elapsed_time": "8:40:20", "remaining_time": "1:20:47", "throughput": 927.76, "total_tokens": 28965568} {"current_steps": 5415, "total_steps": 6250, "loss": 0.623, "learning_rate": 2.1698902447878477e-06, "epoch": 0.8664, "percentage": 86.64, "elapsed_time": "8:40:52", "remaining_time": "1:20:19", "throughput": 927.76, "total_tokens": 28994432} {"current_steps": 5420, "total_steps": 6250, "loss": 0.7774, "learning_rate": 2.1443582803049755e-06, "epoch": 0.8672, "percentage": 86.72, "elapsed_time": "8:41:24", "remaining_time": "1:19:50", "throughput": 927.5, "total_tokens": 29016560} {"current_steps": 5425, "total_steps": 6250, "loss": 0.6332, "learning_rate": 2.118970684477062e-06, "epoch": 0.868, "percentage": 86.8, "elapsed_time": "8:41:57", "remaining_time": "1:19:22", "throughput": 927.41, "total_tokens": 29043920} {"current_steps": 5430, "total_steps": 6250, "loss": 0.6658, "learning_rate": 2.093727617665955e-06, "epoch": 0.8688, "percentage": 86.88, "elapsed_time": "8:42:29", "remaining_time": "1:18:54", "throughput": 927.4, "total_tokens": 29073840} {"current_steps": 5435, "total_steps": 6250, "loss": 0.7078, "learning_rate": 2.068629239320588e-06, "epoch": 0.8696, "percentage": 86.96, "elapsed_time": "8:43:04", "remaining_time": "1:18:26", "throughput": 927.29, "total_tokens": 29102752} {"current_steps": 5440, "total_steps": 6250, "loss": 0.7049, "learning_rate": 2.043675707975959e-06, "epoch": 0.8704, "percentage": 87.04, "elapsed_time": "8:43:37", "remaining_time": "1:17:57", "throughput": 927.09, "total_tokens": 29126576} {"current_steps": 5445, "total_steps": 6250, "loss": 0.7931, "learning_rate": 2.0188671812521292e-06, "epoch": 0.8712, "percentage": 87.12, "elapsed_time": "8:44:08", "remaining_time": "1:17:29", "throughput": 927.02, "total_tokens": 29153120} {"current_steps": 5450, "total_steps": 6250, "loss": 0.8394, "learning_rate": 1.9942038158532407e-06, "epoch": 0.872, "percentage": 87.2, "elapsed_time": "8:44:40", "remaining_time": "1:17:01", "throughput": 926.98, "total_tokens": 29182192} {"current_steps": 5455, "total_steps": 6250, "loss": 0.6915, "learning_rate": 1.969685767566512e-06, "epoch": 0.8728, "percentage": 87.28, "elapsed_time": "8:45:11", "remaining_time": "1:16:32", "throughput": 926.83, "total_tokens": 29206368} {"current_steps": 5460, "total_steps": 6250, "loss": 0.6627, "learning_rate": 1.9453131912612694e-06, "epoch": 0.8736, "percentage": 87.36, "elapsed_time": "8:45:47", "remaining_time": "1:16:04", "throughput": 926.73, "total_tokens": 29235984} {"current_steps": 5465, "total_steps": 6250, "loss": 0.6671, "learning_rate": 1.921086240887937e-06, "epoch": 0.8744, "percentage": 87.44, "elapsed_time": "8:46:19", "remaining_time": "1:15:36", "throughput": 926.57, "total_tokens": 29260672} {"current_steps": 5470, "total_steps": 6250, "loss": 0.665, "learning_rate": 1.8970050694771064e-06, "epoch": 0.8752, "percentage": 87.52, "elapsed_time": "8:46:52", "remaining_time": "1:15:07", "throughput": 926.48, "total_tokens": 29287792} {"current_steps": 5475, "total_steps": 6250, "loss": 0.663, "learning_rate": 1.8730698291385518e-06, "epoch": 0.876, "percentage": 87.6, "elapsed_time": "8:47:25", "remaining_time": "1:14:39", "throughput": 926.34, "total_tokens": 29314656} {"current_steps": 5480, "total_steps": 6250, "loss": 0.7054, "learning_rate": 1.8492806710602496e-06, "epoch": 0.8768, "percentage": 87.68, "elapsed_time": "8:47:56", "remaining_time": "1:14:10", "throughput": 926.19, "total_tokens": 29338976} {"current_steps": 5485, "total_steps": 6250, "loss": 0.6905, "learning_rate": 1.8256377455074525e-06, "epoch": 0.8776, "percentage": 87.76, "elapsed_time": "8:48:30", "remaining_time": "1:13:42", "throughput": 926.03, "total_tokens": 29364912} {"current_steps": 5490, "total_steps": 6250, "loss": 0.7641, "learning_rate": 1.802141201821736e-06, "epoch": 0.8784, "percentage": 87.84, "elapsed_time": "8:49:04", "remaining_time": "1:13:14", "throughput": 925.93, "total_tokens": 29392960} {"current_steps": 5495, "total_steps": 6250, "loss": 0.6918, "learning_rate": 1.7787911884200314e-06, "epoch": 0.8792, "percentage": 87.92, "elapsed_time": "8:49:36", "remaining_time": "1:12:46", "throughput": 925.73, "total_tokens": 29416848} {"current_steps": 5500, "total_steps": 6250, "loss": 0.6281, "learning_rate": 1.7555878527937164e-06, "epoch": 0.88, "percentage": 88.0, "elapsed_time": "8:50:10", "remaining_time": "1:12:17", "throughput": 925.66, "total_tokens": 29445856} {"current_steps": 5505, "total_steps": 6250, "loss": 0.7199, "learning_rate": 1.7325313415076705e-06, "epoch": 0.8808, "percentage": 88.08, "elapsed_time": "8:50:46", "remaining_time": "1:11:49", "throughput": 925.52, "total_tokens": 29474400} {"current_steps": 5510, "total_steps": 6250, "loss": 0.7022, "learning_rate": 1.7096218001993513e-06, "epoch": 0.8816, "percentage": 88.16, "elapsed_time": "8:51:19", "remaining_time": "1:11:21", "throughput": 925.39, "total_tokens": 29501312} {"current_steps": 5515, "total_steps": 6250, "loss": 0.635, "learning_rate": 1.686859373577876e-06, "epoch": 0.8824, "percentage": 88.24, "elapsed_time": "8:51:52", "remaining_time": "1:10:53", "throughput": 925.34, "total_tokens": 29530160} {"current_steps": 5520, "total_steps": 6250, "loss": 0.6752, "learning_rate": 1.6642442054230934e-06, "epoch": 0.8832, "percentage": 88.32, "elapsed_time": "8:52:24", "remaining_time": "1:10:24", "throughput": 925.25, "total_tokens": 29557168} {"current_steps": 5525, "total_steps": 6250, "loss": 0.7824, "learning_rate": 1.6417764385846996e-06, "epoch": 0.884, "percentage": 88.4, "elapsed_time": "8:52:57", "remaining_time": "1:09:56", "throughput": 925.19, "total_tokens": 29584832} {"current_steps": 5530, "total_steps": 6250, "loss": 0.6823, "learning_rate": 1.6194562149813242e-06, "epoch": 0.8848, "percentage": 88.48, "elapsed_time": "8:53:28", "remaining_time": "1:09:27", "throughput": 925.05, "total_tokens": 29609504} {"current_steps": 5535, "total_steps": 6250, "loss": 0.6777, "learning_rate": 1.5972836755996285e-06, "epoch": 0.8856, "percentage": 88.56, "elapsed_time": "8:54:02", "remaining_time": "1:08:59", "throughput": 924.92, "total_tokens": 29636768} {"current_steps": 5540, "total_steps": 6250, "loss": 0.7372, "learning_rate": 1.5752589604934255e-06, "epoch": 0.8864, "percentage": 88.64, "elapsed_time": "8:54:35", "remaining_time": "1:08:30", "throughput": 924.7, "total_tokens": 29660496} {"current_steps": 5545, "total_steps": 6250, "loss": 0.7126, "learning_rate": 1.5533822087827805e-06, "epoch": 0.8872, "percentage": 88.72, "elapsed_time": "8:55:09", "remaining_time": "1:08:02", "throughput": 924.55, "total_tokens": 29686928} {"current_steps": 5550, "total_steps": 6250, "loss": 0.6564, "learning_rate": 1.5316535586531483e-06, "epoch": 0.888, "percentage": 88.8, "elapsed_time": "8:55:44", "remaining_time": "1:07:34", "throughput": 924.41, "total_tokens": 29714800} {"current_steps": 5555, "total_steps": 6250, "loss": 0.8006, "learning_rate": 1.5100731473544933e-06, "epoch": 0.8888, "percentage": 88.88, "elapsed_time": "8:56:17", "remaining_time": "1:07:05", "throughput": 924.3, "total_tokens": 29741808} {"current_steps": 5560, "total_steps": 6250, "loss": 0.7322, "learning_rate": 1.4886411112004255e-06, "epoch": 0.8896, "percentage": 88.96, "elapsed_time": "8:56:48", "remaining_time": "1:06:37", "throughput": 924.08, "total_tokens": 29763088} {"current_steps": 5565, "total_steps": 6250, "loss": 0.7243, "learning_rate": 1.4673575855673277e-06, "epoch": 0.8904, "percentage": 89.04, "elapsed_time": "8:57:22", "remaining_time": "1:06:08", "throughput": 923.99, "total_tokens": 29791520} {"current_steps": 5570, "total_steps": 6250, "loss": 0.6955, "learning_rate": 1.4462227048935183e-06, "epoch": 0.8912, "percentage": 89.12, "elapsed_time": "8:57:53", "remaining_time": "1:05:40", "throughput": 923.9, "total_tokens": 29817600} {"current_steps": 5575, "total_steps": 6250, "loss": 0.6658, "learning_rate": 1.425236602678387e-06, "epoch": 0.892, "percentage": 89.2, "elapsed_time": "8:58:25", "remaining_time": "1:05:11", "throughput": 923.79, "total_tokens": 29843136} {"current_steps": 5580, "total_steps": 6250, "loss": 0.7943, "learning_rate": 1.4043994114815661e-06, "epoch": 0.8928, "percentage": 89.28, "elapsed_time": "8:58:56", "remaining_time": "1:04:42", "throughput": 923.57, "total_tokens": 29864864} {"current_steps": 5585, "total_steps": 6250, "loss": 0.7734, "learning_rate": 1.38371126292208e-06, "epoch": 0.8936, "percentage": 89.36, "elapsed_time": "8:59:28", "remaining_time": "1:04:14", "throughput": 923.44, "total_tokens": 29890416} {"current_steps": 5590, "total_steps": 6250, "loss": 0.7008, "learning_rate": 1.3631722876775138e-06, "epoch": 0.8944, "percentage": 89.44, "elapsed_time": "9:00:01", "remaining_time": "1:03:45", "throughput": 923.29, "total_tokens": 29916400} {"current_steps": 5595, "total_steps": 6250, "loss": 0.6434, "learning_rate": 1.3427826154832042e-06, "epoch": 0.8952, "percentage": 89.52, "elapsed_time": "9:00:33", "remaining_time": "1:03:16", "throughput": 923.25, "total_tokens": 29944304} {"current_steps": 5600, "total_steps": 6250, "loss": 0.6952, "learning_rate": 1.3225423751313942e-06, "epoch": 0.896, "percentage": 89.6, "elapsed_time": "9:01:05", "remaining_time": "1:02:48", "throughput": 923.05, "total_tokens": 29967648} {"current_steps": 5605, "total_steps": 6250, "loss": 0.6331, "learning_rate": 1.3024516944704496e-06, "epoch": 0.8968, "percentage": 89.68, "elapsed_time": "9:01:39", "remaining_time": "1:02:19", "throughput": 922.75, "total_tokens": 29989312} {"current_steps": 5610, "total_steps": 6250, "loss": 0.7894, "learning_rate": 1.2825107004040272e-06, "epoch": 0.8976, "percentage": 89.76, "elapsed_time": "9:02:12", "remaining_time": "1:01:51", "throughput": 922.53, "total_tokens": 30012384} {"current_steps": 5615, "total_steps": 6250, "loss": 0.6819, "learning_rate": 1.2627195188902791e-06, "epoch": 0.8984, "percentage": 89.84, "elapsed_time": "9:02:47", "remaining_time": "1:01:23", "throughput": 922.46, "total_tokens": 30042656} {"current_steps": 5620, "total_steps": 6250, "loss": 0.8208, "learning_rate": 1.2430782749410673e-06, "epoch": 0.8992, "percentage": 89.92, "elapsed_time": "9:03:20", "remaining_time": "1:00:54", "throughput": 922.34, "total_tokens": 30068464} {"current_steps": 5625, "total_steps": 6250, "loss": 0.7203, "learning_rate": 1.2235870926211619e-06, "epoch": 0.9, "percentage": 90.0, "elapsed_time": "9:03:53", "remaining_time": "1:00:25", "throughput": 922.15, "total_tokens": 30093216} {"current_steps": 5630, "total_steps": 6250, "loss": 0.7368, "learning_rate": 1.2042460950474648e-06, "epoch": 0.9008, "percentage": 90.08, "elapsed_time": "9:04:25", "remaining_time": "0:59:57", "throughput": 922.01, "total_tokens": 30117488} {"current_steps": 5635, "total_steps": 6250, "loss": 0.7681, "learning_rate": 1.1850554043882328e-06, "epoch": 0.9016, "percentage": 90.16, "elapsed_time": "9:04:57", "remaining_time": "0:59:28", "throughput": 921.9, "total_tokens": 30144016} {"current_steps": 5640, "total_steps": 6250, "loss": 0.6962, "learning_rate": 1.1660151418622922e-06, "epoch": 0.9024, "percentage": 90.24, "elapsed_time": "9:05:35", "remaining_time": "0:59:00", "throughput": 921.86, "total_tokens": 30177184} {"current_steps": 5645, "total_steps": 6250, "loss": 0.7056, "learning_rate": 1.1471254277382881e-06, "epoch": 0.9032, "percentage": 90.32, "elapsed_time": "9:06:11", "remaining_time": "0:58:32", "throughput": 921.71, "total_tokens": 30206048} {"current_steps": 5650, "total_steps": 6250, "loss": 0.7089, "learning_rate": 1.1283863813339263e-06, "epoch": 0.904, "percentage": 90.4, "elapsed_time": "9:06:44", "remaining_time": "0:58:03", "throughput": 921.52, "total_tokens": 30229936} {"current_steps": 5655, "total_steps": 6250, "loss": 0.7794, "learning_rate": 1.1097981210152043e-06, "epoch": 0.9048, "percentage": 90.48, "elapsed_time": "9:07:17", "remaining_time": "0:57:35", "throughput": 921.43, "total_tokens": 30257760} {"current_steps": 5660, "total_steps": 6250, "loss": 0.77, "learning_rate": 1.0913607641956841e-06, "epoch": 0.9056, "percentage": 90.56, "elapsed_time": "9:07:52", "remaining_time": "0:57:06", "throughput": 921.32, "total_tokens": 30286464} {"current_steps": 5665, "total_steps": 6250, "loss": 0.708, "learning_rate": 1.0730744273357213e-06, "epoch": 0.9064, "percentage": 90.64, "elapsed_time": "9:08:26", "remaining_time": "0:56:38", "throughput": 921.31, "total_tokens": 30317040} {"current_steps": 5670, "total_steps": 6250, "loss": 0.6423, "learning_rate": 1.0549392259417646e-06, "epoch": 0.9072, "percentage": 90.72, "elapsed_time": "9:08:59", "remaining_time": "0:56:09", "throughput": 921.17, "total_tokens": 30342672} {"current_steps": 5675, "total_steps": 6250, "loss": 0.8176, "learning_rate": 1.0369552745656013e-06, "epoch": 0.908, "percentage": 90.8, "elapsed_time": "9:09:31", "remaining_time": "0:55:40", "throughput": 921.1, "total_tokens": 30369952} {"current_steps": 5680, "total_steps": 6250, "loss": 0.6924, "learning_rate": 1.0191226868036418e-06, "epoch": 0.9088, "percentage": 90.88, "elapsed_time": "9:10:07", "remaining_time": "0:55:12", "throughput": 921.02, "total_tokens": 30400800} {"current_steps": 5685, "total_steps": 6250, "loss": 0.576, "learning_rate": 1.001441575296208e-06, "epoch": 0.9096, "percentage": 90.96, "elapsed_time": "9:10:44", "remaining_time": "0:54:44", "throughput": 921.07, "total_tokens": 30436240} {"current_steps": 5690, "total_steps": 6250, "loss": 0.6206, "learning_rate": 9.839120517267985e-07, "epoch": 0.9104, "percentage": 91.04, "elapsed_time": "9:11:16", "remaining_time": "0:54:15", "throughput": 921.04, "total_tokens": 30465232} {"current_steps": 5695, "total_steps": 6250, "loss": 0.7424, "learning_rate": 9.665342268214166e-07, "epoch": 0.9112, "percentage": 91.12, "elapsed_time": "9:11:49", "remaining_time": "0:53:46", "throughput": 920.87, "total_tokens": 30489776} {"current_steps": 5700, "total_steps": 6250, "loss": 0.6868, "learning_rate": 9.493082103478517e-07, "epoch": 0.912, "percentage": 91.2, "elapsed_time": "9:12:22", "remaining_time": "0:53:17", "throughput": 920.71, "total_tokens": 30514592} {"current_steps": 5705, "total_steps": 6250, "loss": 0.7017, "learning_rate": 9.322341111149852e-07, "epoch": 0.9128, "percentage": 91.28, "elapsed_time": "9:12:57", "remaining_time": "0:52:49", "throughput": 920.64, "total_tokens": 30544112} {"current_steps": 5710, "total_steps": 6250, "loss": 0.6429, "learning_rate": 9.153120369721046e-07, "epoch": 0.9136, "percentage": 91.36, "elapsed_time": "9:13:34", "remaining_time": "0:52:21", "throughput": 920.6, "total_tokens": 30577440} {"current_steps": 5715, "total_steps": 6250, "loss": 0.6507, "learning_rate": 8.985420948082329e-07, "epoch": 0.9144, "percentage": 91.44, "elapsed_time": "9:14:08", "remaining_time": "0:51:52", "throughput": 920.42, "total_tokens": 30602704} {"current_steps": 5720, "total_steps": 6250, "loss": 0.7508, "learning_rate": 8.819243905514308e-07, "epoch": 0.9152, "percentage": 91.52, "elapsed_time": "9:14:40", "remaining_time": "0:51:23", "throughput": 920.29, "total_tokens": 30627360} {"current_steps": 5725, "total_steps": 6250, "loss": 0.6506, "learning_rate": 8.65459029168153e-07, "epoch": 0.916, "percentage": 91.6, "elapsed_time": "9:15:12", "remaining_time": "0:50:54", "throughput": 920.29, "total_tokens": 30657216} {"current_steps": 5730, "total_steps": 6250, "loss": 0.6426, "learning_rate": 8.491461146625773e-07, "epoch": 0.9168, "percentage": 91.68, "elapsed_time": "9:15:43", "remaining_time": "0:50:25", "throughput": 920.21, "total_tokens": 30683472} {"current_steps": 5735, "total_steps": 6250, "loss": 0.6227, "learning_rate": 8.329857500759292e-07, "epoch": 0.9176, "percentage": 91.76, "elapsed_time": "9:16:16", "remaining_time": "0:49:57", "throughput": 920.03, "total_tokens": 30707392} {"current_steps": 5740, "total_steps": 6250, "loss": 0.839, "learning_rate": 8.169780374858577e-07, "epoch": 0.9184, "percentage": 91.84, "elapsed_time": "9:16:49", "remaining_time": "0:49:28", "throughput": 919.87, "total_tokens": 30732160} {"current_steps": 5745, "total_steps": 6250, "loss": 0.6817, "learning_rate": 8.011230780057749e-07, "epoch": 0.9192, "percentage": 91.92, "elapsed_time": "9:17:21", "remaining_time": "0:48:59", "throughput": 919.82, "total_tokens": 30760336} {"current_steps": 5750, "total_steps": 6250, "loss": 0.7016, "learning_rate": 7.854209717842231e-07, "epoch": 0.92, "percentage": 92.0, "elapsed_time": "9:17:54", "remaining_time": "0:48:30", "throughput": 919.78, "total_tokens": 30788800} {"current_steps": 5755, "total_steps": 6250, "loss": 0.702, "learning_rate": 7.698718180042392e-07, "epoch": 0.9208, "percentage": 92.08, "elapsed_time": "9:18:25", "remaining_time": "0:48:01", "throughput": 919.66, "total_tokens": 30813632} {"current_steps": 5760, "total_steps": 6250, "loss": 0.7203, "learning_rate": 7.544757148827297e-07, "epoch": 0.9216, "percentage": 92.16, "elapsed_time": "9:18:58", "remaining_time": "0:47:33", "throughput": 919.55, "total_tokens": 30840816} {"current_steps": 5765, "total_steps": 6250, "loss": 0.6873, "learning_rate": 7.392327596698473e-07, "epoch": 0.9224, "percentage": 92.24, "elapsed_time": "9:19:31", "remaining_time": "0:47:04", "throughput": 919.29, "total_tokens": 30861664} {"current_steps": 5770, "total_steps": 6250, "loss": 0.6975, "learning_rate": 7.241430486483819e-07, "epoch": 0.9232, "percentage": 92.32, "elapsed_time": "9:20:04", "remaining_time": "0:46:35", "throughput": 919.09, "total_tokens": 30886064} {"current_steps": 5775, "total_steps": 6250, "loss": 0.6058, "learning_rate": 7.092066771331507e-07, "epoch": 0.924, "percentage": 92.4, "elapsed_time": "9:20:36", "remaining_time": "0:46:06", "throughput": 918.96, "total_tokens": 30910608} {"current_steps": 5780, "total_steps": 6250, "loss": 0.8128, "learning_rate": 6.944237394703984e-07, "epoch": 0.9248, "percentage": 92.48, "elapsed_time": "9:21:09", "remaining_time": "0:45:37", "throughput": 918.8, "total_tokens": 30935008} {"current_steps": 5785, "total_steps": 6250, "loss": 0.7329, "learning_rate": 6.797943290371839e-07, "epoch": 0.9256, "percentage": 92.56, "elapsed_time": "9:21:40", "remaining_time": "0:45:08", "throughput": 918.68, "total_tokens": 30959792} {"current_steps": 5790, "total_steps": 6250, "loss": 0.673, "learning_rate": 6.653185382408194e-07, "epoch": 0.9264, "percentage": 92.64, "elapsed_time": "9:22:12", "remaining_time": "0:44:39", "throughput": 918.57, "total_tokens": 30985856} {"current_steps": 5795, "total_steps": 6250, "loss": 0.7395, "learning_rate": 6.509964585182687e-07, "epoch": 0.9272, "percentage": 92.72, "elapsed_time": "9:22:47", "remaining_time": "0:44:11", "throughput": 918.45, "total_tokens": 31013888} {"current_steps": 5800, "total_steps": 6250, "loss": 0.753, "learning_rate": 6.368281803355691e-07, "epoch": 0.928, "percentage": 92.8, "elapsed_time": "9:23:19", "remaining_time": "0:43:42", "throughput": 918.31, "total_tokens": 31038352} {"current_steps": 5805, "total_steps": 6250, "loss": 0.7573, "learning_rate": 6.228137931872713e-07, "epoch": 0.9288, "percentage": 92.88, "elapsed_time": "9:23:53", "remaining_time": "0:43:13", "throughput": 918.23, "total_tokens": 31066624} {"current_steps": 5810, "total_steps": 6250, "loss": 0.759, "learning_rate": 6.089533855958507e-07, "epoch": 0.9296, "percentage": 92.96, "elapsed_time": "9:24:25", "remaining_time": "0:42:44", "throughput": 918.13, "total_tokens": 31093184} {"current_steps": 5815, "total_steps": 6250, "loss": 0.7482, "learning_rate": 5.95247045111183e-07, "epoch": 0.9304, "percentage": 93.04, "elapsed_time": "9:24:58", "remaining_time": "0:42:15", "throughput": 918.0, "total_tokens": 31118352} {"current_steps": 5820, "total_steps": 6250, "loss": 0.6295, "learning_rate": 5.816948583099613e-07, "epoch": 0.9312, "percentage": 93.12, "elapsed_time": "9:25:30", "remaining_time": "0:41:46", "throughput": 917.92, "total_tokens": 31145616} {"current_steps": 5825, "total_steps": 6250, "loss": 0.7596, "learning_rate": 5.68296910795163e-07, "epoch": 0.932, "percentage": 93.2, "elapsed_time": "9:26:01", "remaining_time": "0:41:17", "throughput": 917.73, "total_tokens": 31167088} {"current_steps": 5830, "total_steps": 6250, "loss": 0.689, "learning_rate": 5.550532871955061e-07, "epoch": 0.9328, "percentage": 93.28, "elapsed_time": "9:26:33", "remaining_time": "0:40:48", "throughput": 917.61, "total_tokens": 31192672} {"current_steps": 5835, "total_steps": 6250, "loss": 0.6387, "learning_rate": 5.419640711649188e-07, "epoch": 0.9336, "percentage": 93.36, "elapsed_time": "9:27:09", "remaining_time": "0:40:20", "throughput": 917.56, "total_tokens": 31224016} {"current_steps": 5840, "total_steps": 6250, "loss": 0.7316, "learning_rate": 5.290293453819955e-07, "epoch": 0.9344, "percentage": 93.44, "elapsed_time": "9:27:41", "remaining_time": "0:39:51", "throughput": 917.36, "total_tokens": 31247008} {"current_steps": 5845, "total_steps": 6250, "loss": 0.7255, "learning_rate": 5.162491915495005e-07, "epoch": 0.9352, "percentage": 93.52, "elapsed_time": "9:28:13", "remaining_time": "0:39:22", "throughput": 917.27, "total_tokens": 31273232} {"current_steps": 5850, "total_steps": 6250, "loss": 0.7188, "learning_rate": 5.036236903938285e-07, "epoch": 0.936, "percentage": 93.6, "elapsed_time": "9:28:45", "remaining_time": "0:38:53", "throughput": 917.19, "total_tokens": 31299504} {"current_steps": 5855, "total_steps": 6250, "loss": 0.6763, "learning_rate": 4.911529216645088e-07, "epoch": 0.9368, "percentage": 93.68, "elapsed_time": "9:29:17", "remaining_time": "0:38:24", "throughput": 917.09, "total_tokens": 31325792} {"current_steps": 5860, "total_steps": 6250, "loss": 0.6109, "learning_rate": 4.788369641336943e-07, "epoch": 0.9376, "percentage": 93.76, "elapsed_time": "9:29:50", "remaining_time": "0:37:55", "throughput": 916.96, "total_tokens": 31351216} {"current_steps": 5865, "total_steps": 6250, "loss": 0.7778, "learning_rate": 4.666758955956613e-07, "epoch": 0.9384, "percentage": 93.84, "elapsed_time": "9:30:23", "remaining_time": "0:37:26", "throughput": 916.81, "total_tokens": 31376464} {"current_steps": 5870, "total_steps": 6250, "loss": 0.6315, "learning_rate": 4.546697928663357e-07, "epoch": 0.9392, "percentage": 93.92, "elapsed_time": "9:30:58", "remaining_time": "0:36:57", "throughput": 916.82, "total_tokens": 31408832} {"current_steps": 5875, "total_steps": 6250, "loss": 0.7918, "learning_rate": 4.4281873178278475e-07, "epoch": 0.94, "percentage": 94.0, "elapsed_time": "9:31:30", "remaining_time": "0:36:28", "throughput": 916.65, "total_tokens": 31432352} {"current_steps": 5880, "total_steps": 6250, "loss": 0.6983, "learning_rate": 4.311227872027479e-07, "epoch": 0.9408, "percentage": 94.08, "elapsed_time": "9:32:05", "remaining_time": "0:35:59", "throughput": 916.46, "total_tokens": 31457392} {"current_steps": 5885, "total_steps": 6250, "loss": 0.7233, "learning_rate": 4.1958203300417054e-07, "epoch": 0.9416, "percentage": 94.16, "elapsed_time": "9:32:36", "remaining_time": "0:35:30", "throughput": 916.36, "total_tokens": 31482704} {"current_steps": 5890, "total_steps": 6250, "loss": 0.6402, "learning_rate": 4.0819654208472947e-07, "epoch": 0.9424, "percentage": 94.24, "elapsed_time": "9:33:09", "remaining_time": "0:35:01", "throughput": 916.32, "total_tokens": 31512368} {"current_steps": 5895, "total_steps": 6250, "loss": 0.6942, "learning_rate": 3.9696638636137206e-07, "epoch": 0.9432, "percentage": 94.32, "elapsed_time": "9:33:44", "remaining_time": "0:34:33", "throughput": 916.18, "total_tokens": 31539040} {"current_steps": 5900, "total_steps": 6250, "loss": 0.7119, "learning_rate": 3.8589163676986674e-07, "epoch": 0.944, "percentage": 94.4, "elapsed_time": "9:34:15", "remaining_time": "0:34:03", "throughput": 916.07, "total_tokens": 31563712} {"current_steps": 5905, "total_steps": 6250, "loss": 0.6575, "learning_rate": 3.7497236326434757e-07, "epoch": 0.9448, "percentage": 94.48, "elapsed_time": "9:34:48", "remaining_time": "0:33:34", "throughput": 915.89, "total_tokens": 31587760} {"current_steps": 5910, "total_steps": 6250, "loss": 0.704, "learning_rate": 3.6420863481688437e-07, "epoch": 0.9456, "percentage": 94.56, "elapsed_time": "9:35:19", "remaining_time": "0:33:05", "throughput": 915.8, "total_tokens": 31612976} {"current_steps": 5915, "total_steps": 6250, "loss": 0.7876, "learning_rate": 3.536005194170328e-07, "epoch": 0.9464, "percentage": 94.64, "elapsed_time": "9:35:52", "remaining_time": "0:32:36", "throughput": 915.68, "total_tokens": 31639472} {"current_steps": 5920, "total_steps": 6250, "loss": 0.7033, "learning_rate": 3.431480840714152e-07, "epoch": 0.9472, "percentage": 94.72, "elapsed_time": "9:36:27", "remaining_time": "0:32:08", "throughput": 915.67, "total_tokens": 31670768} {"current_steps": 5925, "total_steps": 6250, "loss": 0.7095, "learning_rate": 3.328513948032991e-07, "epoch": 0.948, "percentage": 94.8, "elapsed_time": "9:36:58", "remaining_time": "0:31:38", "throughput": 915.6, "total_tokens": 31696624} {"current_steps": 5930, "total_steps": 6250, "loss": 0.6629, "learning_rate": 3.227105166521638e-07, "epoch": 0.9488, "percentage": 94.88, "elapsed_time": "9:37:29", "remaining_time": "0:31:09", "throughput": 915.57, "total_tokens": 31723840} {"current_steps": 5935, "total_steps": 6250, "loss": 0.591, "learning_rate": 3.127255136733093e-07, "epoch": 0.9496, "percentage": 94.96, "elapsed_time": "9:38:02", "remaining_time": "0:30:40", "throughput": 915.52, "total_tokens": 31752736} {"current_steps": 5940, "total_steps": 6250, "loss": 0.6641, "learning_rate": 3.0289644893744527e-07, "epoch": 0.9504, "percentage": 95.04, "elapsed_time": "9:38:35", "remaining_time": "0:30:11", "throughput": 915.38, "total_tokens": 31777760} {"current_steps": 5945, "total_steps": 6250, "loss": 0.6156, "learning_rate": 2.9322338453028066e-07, "epoch": 0.9512, "percentage": 95.12, "elapsed_time": "9:39:08", "remaining_time": "0:29:42", "throughput": 915.29, "total_tokens": 31805264} {"current_steps": 5950, "total_steps": 6250, "loss": 0.7834, "learning_rate": 2.8370638155215123e-07, "epoch": 0.952, "percentage": 95.2, "elapsed_time": "9:39:39", "remaining_time": "0:29:13", "throughput": 915.15, "total_tokens": 31828656} {"current_steps": 5955, "total_steps": 6250, "loss": 0.6998, "learning_rate": 2.743455001176176e-07, "epoch": 0.9528, "percentage": 95.28, "elapsed_time": "9:40:11", "remaining_time": "0:28:44", "throughput": 915.08, "total_tokens": 31855424} {"current_steps": 5960, "total_steps": 6250, "loss": 0.7458, "learning_rate": 2.6514079935509584e-07, "epoch": 0.9536, "percentage": 95.36, "elapsed_time": "9:40:42", "remaining_time": "0:28:15", "throughput": 914.94, "total_tokens": 31879168} {"current_steps": 5965, "total_steps": 6250, "loss": 0.7061, "learning_rate": 2.560923374064772e-07, "epoch": 0.9544, "percentage": 95.44, "elapsed_time": "9:41:15", "remaining_time": "0:27:46", "throughput": 914.78, "total_tokens": 31903824} {"current_steps": 5970, "total_steps": 6250, "loss": 0.8603, "learning_rate": 2.472001714267674e-07, "epoch": 0.9552, "percentage": 95.52, "elapsed_time": "9:41:46", "remaining_time": "0:27:17", "throughput": 914.64, "total_tokens": 31927184} {"current_steps": 5975, "total_steps": 6250, "loss": 0.6273, "learning_rate": 2.384643575837203e-07, "epoch": 0.956, "percentage": 95.6, "elapsed_time": "9:42:19", "remaining_time": "0:26:48", "throughput": 914.59, "total_tokens": 31955104} {"current_steps": 5980, "total_steps": 6250, "loss": 0.714, "learning_rate": 2.298849510574824e-07, "epoch": 0.9568, "percentage": 95.68, "elapsed_time": "9:42:54", "remaining_time": "0:26:19", "throughput": 914.55, "total_tokens": 31985888} {"current_steps": 5985, "total_steps": 6250, "loss": 0.6899, "learning_rate": 2.2146200604024613e-07, "epoch": 0.9576, "percentage": 95.76, "elapsed_time": "9:43:29", "remaining_time": "0:25:50", "throughput": 914.43, "total_tokens": 32013520} {"current_steps": 5990, "total_steps": 6250, "loss": 0.677, "learning_rate": 2.1319557573591108e-07, "epoch": 0.9584, "percentage": 95.84, "elapsed_time": "9:44:01", "remaining_time": "0:25:20", "throughput": 914.32, "total_tokens": 32038880} {"current_steps": 5995, "total_steps": 6250, "loss": 0.7033, "learning_rate": 2.050857123597455e-07, "epoch": 0.9592, "percentage": 95.92, "elapsed_time": "9:44:32", "remaining_time": "0:24:51", "throughput": 914.17, "total_tokens": 32062160} {"current_steps": 6000, "total_steps": 6250, "loss": 0.6431, "learning_rate": 1.9713246713805588e-07, "epoch": 0.96, "percentage": 96.0, "elapsed_time": "9:45:05", "remaining_time": "0:24:22", "throughput": 913.97, "total_tokens": 32085712} {"current_steps": 6005, "total_steps": 6250, "loss": 0.683, "learning_rate": 1.8933589030785682e-07, "epoch": 0.9608, "percentage": 96.08, "elapsed_time": "9:45:39", "remaining_time": "0:23:53", "throughput": 913.93, "total_tokens": 32115232} {"current_steps": 6010, "total_steps": 6250, "loss": 0.751, "learning_rate": 1.8169603111656552e-07, "epoch": 0.9616, "percentage": 96.16, "elapsed_time": "9:46:12", "remaining_time": "0:23:24", "throughput": 913.86, "total_tokens": 32142992} {"current_steps": 6015, "total_steps": 6250, "loss": 0.5808, "learning_rate": 1.7421293782168835e-07, "epoch": 0.9624, "percentage": 96.24, "elapsed_time": "9:46:47", "remaining_time": "0:22:55", "throughput": 913.9, "total_tokens": 32176176} {"current_steps": 6020, "total_steps": 6250, "loss": 0.6852, "learning_rate": 1.6688665769050703e-07, "epoch": 0.9632, "percentage": 96.32, "elapsed_time": "9:47:21", "remaining_time": "0:22:26", "throughput": 913.84, "total_tokens": 32204992} {"current_steps": 6025, "total_steps": 6250, "loss": 0.6778, "learning_rate": 1.5971723699979013e-07, "epoch": 0.964, "percentage": 96.4, "elapsed_time": "9:47:54", "remaining_time": "0:21:57", "throughput": 913.77, "total_tokens": 32232960} {"current_steps": 6030, "total_steps": 6250, "loss": 0.7036, "learning_rate": 1.5270472103549315e-07, "epoch": 0.9648, "percentage": 96.48, "elapsed_time": "9:48:28", "remaining_time": "0:21:28", "throughput": 913.74, "total_tokens": 32262672} {"current_steps": 6035, "total_steps": 6250, "loss": 0.655, "learning_rate": 1.4584915409248112e-07, "epoch": 0.9656, "percentage": 96.56, "elapsed_time": "9:48:59", "remaining_time": "0:20:58", "throughput": 913.59, "total_tokens": 32285504} {"current_steps": 6040, "total_steps": 6250, "loss": 0.7324, "learning_rate": 1.3915057947423705e-07, "epoch": 0.9664, "percentage": 96.64, "elapsed_time": "9:49:31", "remaining_time": "0:20:29", "throughput": 913.51, "total_tokens": 32312288} {"current_steps": 6045, "total_steps": 6250, "loss": 0.7166, "learning_rate": 1.3260903949260107e-07, "epoch": 0.9672, "percentage": 96.72, "elapsed_time": "9:50:03", "remaining_time": "0:20:00", "throughput": 913.44, "total_tokens": 32339424} {"current_steps": 6050, "total_steps": 6250, "loss": 0.7, "learning_rate": 1.2622457546749567e-07, "epoch": 0.968, "percentage": 96.8, "elapsed_time": "9:50:35", "remaining_time": "0:19:31", "throughput": 913.28, "total_tokens": 32362848} {"current_steps": 6055, "total_steps": 6250, "loss": 0.7519, "learning_rate": 1.1999722772666476e-07, "epoch": 0.9688, "percentage": 96.88, "elapsed_time": "9:51:12", "remaining_time": "0:19:02", "throughput": 913.2, "total_tokens": 32393264} {"current_steps": 6060, "total_steps": 6250, "loss": 0.7524, "learning_rate": 1.1392703560542117e-07, "epoch": 0.9696, "percentage": 96.96, "elapsed_time": "9:51:45", "remaining_time": "0:18:33", "throughput": 913.05, "total_tokens": 32418464} {"current_steps": 6065, "total_steps": 6250, "loss": 0.5829, "learning_rate": 1.080140374463967e-07, "epoch": 0.9704, "percentage": 97.04, "elapsed_time": "9:52:17", "remaining_time": "0:18:04", "throughput": 913.09, "total_tokens": 32449248} {"current_steps": 6070, "total_steps": 6250, "loss": 0.7017, "learning_rate": 1.0225827059930083e-07, "epoch": 0.9712, "percentage": 97.12, "elapsed_time": "9:52:48", "remaining_time": "0:17:34", "throughput": 913.09, "total_tokens": 32477312} {"current_steps": 6075, "total_steps": 6250, "loss": 0.6852, "learning_rate": 9.665977142068738e-08, "epoch": 0.972, "percentage": 97.2, "elapsed_time": "9:53:22", "remaining_time": "0:17:05", "throughput": 913.0, "total_tokens": 32505024} {"current_steps": 6080, "total_steps": 6250, "loss": 0.733, "learning_rate": 9.121857527372158e-08, "epoch": 0.9728, "percentage": 97.28, "elapsed_time": "9:53:55", "remaining_time": "0:16:36", "throughput": 912.85, "total_tokens": 32530080} {"current_steps": 6085, "total_steps": 6250, "loss": 0.6721, "learning_rate": 8.593471652794949e-08, "epoch": 0.9736, "percentage": 97.36, "elapsed_time": "9:54:30", "remaining_time": "0:16:07", "throughput": 912.73, "total_tokens": 32557488} {"current_steps": 6090, "total_steps": 6250, "loss": 0.6572, "learning_rate": 8.080822855909831e-08, "epoch": 0.9744, "percentage": 97.44, "elapsed_time": "9:55:04", "remaining_time": "0:15:38", "throughput": 912.76, "total_tokens": 32589072} {"current_steps": 6095, "total_steps": 6250, "loss": 0.7535, "learning_rate": 7.583914374885426e-08, "epoch": 0.9752, "percentage": 97.52, "elapsed_time": "9:55:34", "remaining_time": "0:15:08", "throughput": 912.64, "total_tokens": 32613296} {"current_steps": 6100, "total_steps": 6250, "loss": 0.639, "learning_rate": 7.102749348465165e-08, "epoch": 0.976, "percentage": 97.6, "elapsed_time": "9:56:08", "remaining_time": "0:14:39", "throughput": 912.61, "total_tokens": 32642512} {"current_steps": 6105, "total_steps": 6250, "loss": 0.7558, "learning_rate": 6.637330815949527e-08, "epoch": 0.9768, "percentage": 97.68, "elapsed_time": "9:56:39", "remaining_time": "0:14:10", "throughput": 912.46, "total_tokens": 32666064} {"current_steps": 6110, "total_steps": 6250, "loss": 0.7228, "learning_rate": 6.187661717174386e-08, "epoch": 0.9776, "percentage": 97.76, "elapsed_time": "9:57:10", "remaining_time": "0:13:40", "throughput": 912.35, "total_tokens": 32690016} {"current_steps": 6115, "total_steps": 6250, "loss": 0.7079, "learning_rate": 5.753744892494639e-08, "epoch": 0.9784, "percentage": 97.84, "elapsed_time": "9:57:42", "remaining_time": "0:13:11", "throughput": 912.26, "total_tokens": 32716240} {"current_steps": 6120, "total_steps": 6250, "loss": 0.7692, "learning_rate": 5.335583082764495e-08, "epoch": 0.9792, "percentage": 97.92, "elapsed_time": "9:58:14", "remaining_time": "0:12:42", "throughput": 912.15, "total_tokens": 32741648} {"current_steps": 6125, "total_steps": 6250, "loss": 0.6285, "learning_rate": 4.9331789293211026e-08, "epoch": 0.98, "percentage": 98.0, "elapsed_time": "9:58:50", "remaining_time": "0:12:13", "throughput": 912.04, "total_tokens": 32770224} {"current_steps": 6130, "total_steps": 6250, "loss": 0.7464, "learning_rate": 4.546534973968175e-08, "epoch": 0.9808, "percentage": 98.08, "elapsed_time": "9:59:23", "remaining_time": "0:11:44", "throughput": 912.02, "total_tokens": 32798864} {"current_steps": 6135, "total_steps": 6250, "loss": 0.6632, "learning_rate": 4.1756536589585004e-08, "epoch": 0.9816, "percentage": 98.16, "elapsed_time": "9:59:57", "remaining_time": "0:11:14", "throughput": 911.98, "total_tokens": 32829136} {"current_steps": 6140, "total_steps": 6250, "loss": 0.7378, "learning_rate": 3.820537326980622e-08, "epoch": 0.9824, "percentage": 98.24, "elapsed_time": "10:00:29", "remaining_time": "0:10:45", "throughput": 911.99, "total_tokens": 32858976} {"current_steps": 6145, "total_steps": 6250, "loss": 0.7125, "learning_rate": 3.481188221142184e-08, "epoch": 0.9832, "percentage": 98.32, "elapsed_time": "10:01:02", "remaining_time": "0:10:16", "throughput": 911.91, "total_tokens": 32886208} {"current_steps": 6150, "total_steps": 6250, "loss": 0.7723, "learning_rate": 3.157608484956332e-08, "epoch": 0.984, "percentage": 98.4, "elapsed_time": "10:01:35", "remaining_time": "0:09:46", "throughput": 911.84, "total_tokens": 32912960} {"current_steps": 6155, "total_steps": 6250, "loss": 0.6472, "learning_rate": 2.8498001623286642e-08, "epoch": 0.9848, "percentage": 98.48, "elapsed_time": "10:02:08", "remaining_time": "0:09:17", "throughput": 911.77, "total_tokens": 32941072} {"current_steps": 6160, "total_steps": 6250, "loss": 0.7462, "learning_rate": 2.557765197543638e-08, "epoch": 0.9856, "percentage": 98.56, "elapsed_time": "10:02:40", "remaining_time": "0:08:48", "throughput": 911.72, "total_tokens": 32968304} {"current_steps": 6165, "total_steps": 6250, "loss": 0.7079, "learning_rate": 2.281505435253184e-08, "epoch": 0.9864, "percentage": 98.64, "elapsed_time": "10:03:13", "remaining_time": "0:08:19", "throughput": 911.56, "total_tokens": 32993008} {"current_steps": 6170, "total_steps": 6250, "loss": 0.7058, "learning_rate": 2.0210226204639414e-08, "epoch": 0.9872, "percentage": 98.72, "elapsed_time": "10:03:46", "remaining_time": "0:07:49", "throughput": 911.45, "total_tokens": 33018128} {"current_steps": 6175, "total_steps": 6250, "loss": 0.5942, "learning_rate": 1.7763183985269883e-08, "epoch": 0.988, "percentage": 98.8, "elapsed_time": "10:04:21", "remaining_time": "0:07:20", "throughput": 911.37, "total_tokens": 33047968} {"current_steps": 6180, "total_steps": 6250, "loss": 0.7738, "learning_rate": 1.5473943151270153e-08, "epoch": 0.9888, "percentage": 98.88, "elapsed_time": "10:04:55", "remaining_time": "0:06:51", "throughput": 911.21, "total_tokens": 33072560} {"current_steps": 6185, "total_steps": 6250, "loss": 0.781, "learning_rate": 1.3342518162728912e-08, "epoch": 0.9896, "percentage": 98.96, "elapsed_time": "10:05:27", "remaining_time": "0:06:21", "throughput": 911.07, "total_tokens": 33096928} {"current_steps": 6190, "total_steps": 6250, "loss": 0.6607, "learning_rate": 1.136892248288779e-08, "epoch": 0.9904, "percentage": 99.04, "elapsed_time": "10:06:02", "remaining_time": "0:05:52", "throughput": 910.94, "total_tokens": 33123808} {"current_steps": 6195, "total_steps": 6250, "loss": 0.7506, "learning_rate": 9.553168578049775e-09, "epoch": 0.9912, "percentage": 99.12, "elapsed_time": "10:06:34", "remaining_time": "0:05:23", "throughput": 910.81, "total_tokens": 33148688} {"current_steps": 6200, "total_steps": 6250, "loss": 0.6521, "learning_rate": 7.895267917501504e-09, "epoch": 0.992, "percentage": 99.2, "elapsed_time": "10:07:06", "remaining_time": "0:04:53", "throughput": 910.77, "total_tokens": 33176624} {"current_steps": 6205, "total_steps": 6250, "loss": 0.709, "learning_rate": 6.395230973443856e-09, "epoch": 0.9928, "percentage": 99.28, "elapsed_time": "10:07:38", "remaining_time": "0:04:24", "throughput": 910.58, "total_tokens": 33198160} {"current_steps": 6210, "total_steps": 6250, "loss": 0.6685, "learning_rate": 5.053067220925356e-09, "epoch": 0.9936, "percentage": 99.36, "elapsed_time": "10:08:12", "remaining_time": "0:03:55", "throughput": 910.49, "total_tokens": 33226336} {"current_steps": 6215, "total_steps": 6250, "loss": 0.6672, "learning_rate": 3.868785137786657e-09, "epoch": 0.9944, "percentage": 99.44, "elapsed_time": "10:08:43", "remaining_time": "0:03:25", "throughput": 910.25, "total_tokens": 33245824} {"current_steps": 6220, "total_steps": 6250, "loss": 0.7053, "learning_rate": 2.842392204591149e-09, "epoch": 0.9952, "percentage": 99.52, "elapsed_time": "10:09:15", "remaining_time": "0:02:56", "throughput": 910.23, "total_tokens": 33274176} {"current_steps": 6225, "total_steps": 6250, "loss": 0.7184, "learning_rate": 1.973894904597207e-09, "epoch": 0.996, "percentage": 99.6, "elapsed_time": "10:09:49", "remaining_time": "0:02:26", "throughput": 910.17, "total_tokens": 33302528} {"current_steps": 6230, "total_steps": 6250, "loss": 0.7092, "learning_rate": 1.2632987237054528e-09, "epoch": 0.9968, "percentage": 99.68, "elapsed_time": "10:10:21", "remaining_time": "0:01:57", "throughput": 910.13, "total_tokens": 33330384} {"current_steps": 6235, "total_steps": 6250, "loss": 0.6142, "learning_rate": 7.106081504254514e-10, "epoch": 0.9976, "percentage": 99.76, "elapsed_time": "10:10:53", "remaining_time": "0:01:28", "throughput": 910.1, "total_tokens": 33357968} {"current_steps": 6240, "total_steps": 6250, "loss": 0.7147, "learning_rate": 3.158266758562789e-10, "epoch": 0.9984, "percentage": 99.84, "elapsed_time": "10:11:27", "remaining_time": "0:00:58", "throughput": 909.9, "total_tokens": 33381536} {"current_steps": 6245, "total_steps": 6250, "loss": 0.7005, "learning_rate": 7.89567936476665e-11, "epoch": 0.9992, "percentage": 99.92, "elapsed_time": "10:11:59", "remaining_time": "0:00:29", "throughput": 909.88, "total_tokens": 33409984} {"current_steps": 6250, "total_steps": 6250, "loss": 0.7516, "learning_rate": 0.0, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "10:12:31", "remaining_time": "0:00:00", "throughput": 909.84, "total_tokens": 33437856} {"current_steps": 6250, "total_steps": 6250, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "10:12:31", "remaining_time": "0:00:00", "throughput": 909.83, "total_tokens": 33437856}