s1K_llama3.1_8b_32kcontext / trainer_log.jsonl
sedrickkeh's picture
Training in progress, epoch 5
bfb46ab verified
{"current_steps": 1, "total_steps": 315, "loss": 0.4365, "lr": 6.25e-07, "epoch": 0.015873015873015872, "percentage": 0.32, "elapsed_time": "0:00:14", "remaining_time": "1:13:40"}
{"current_steps": 2, "total_steps": 315, "loss": 0.4611, "lr": 1.25e-06, "epoch": 0.031746031746031744, "percentage": 0.63, "elapsed_time": "0:00:18", "remaining_time": "0:49:23"}
{"current_steps": 3, "total_steps": 315, "loss": 0.4612, "lr": 1.8750000000000003e-06, "epoch": 0.047619047619047616, "percentage": 0.95, "elapsed_time": "0:00:24", "remaining_time": "0:41:43"}
{"current_steps": 4, "total_steps": 315, "loss": 0.4394, "lr": 2.5e-06, "epoch": 0.06349206349206349, "percentage": 1.27, "elapsed_time": "0:00:28", "remaining_time": "0:37:03"}
{"current_steps": 5, "total_steps": 315, "loss": 0.5477, "lr": 3.125e-06, "epoch": 0.07936507936507936, "percentage": 1.59, "elapsed_time": "0:00:32", "remaining_time": "0:33:59"}
{"current_steps": 6, "total_steps": 315, "loss": 0.4767, "lr": 3.7500000000000005e-06, "epoch": 0.09523809523809523, "percentage": 1.9, "elapsed_time": "0:00:37", "remaining_time": "0:31:50"}
{"current_steps": 7, "total_steps": 315, "loss": 0.4885, "lr": 4.3750000000000005e-06, "epoch": 0.1111111111111111, "percentage": 2.22, "elapsed_time": "0:00:41", "remaining_time": "0:30:41"}
{"current_steps": 8, "total_steps": 315, "loss": 0.4022, "lr": 5e-06, "epoch": 0.12698412698412698, "percentage": 2.54, "elapsed_time": "0:00:46", "remaining_time": "0:29:45"}
{"current_steps": 9, "total_steps": 315, "loss": 0.5179, "lr": 5.625e-06, "epoch": 0.14285714285714285, "percentage": 2.86, "elapsed_time": "0:00:50", "remaining_time": "0:28:45"}
{"current_steps": 10, "total_steps": 315, "loss": 0.5245, "lr": 6.25e-06, "epoch": 0.15873015873015872, "percentage": 3.17, "elapsed_time": "0:00:54", "remaining_time": "0:27:55"}
{"current_steps": 11, "total_steps": 315, "loss": 0.4668, "lr": 6.875e-06, "epoch": 0.1746031746031746, "percentage": 3.49, "elapsed_time": "0:00:59", "remaining_time": "0:27:17"}
{"current_steps": 12, "total_steps": 315, "loss": 0.4321, "lr": 7.500000000000001e-06, "epoch": 0.19047619047619047, "percentage": 3.81, "elapsed_time": "0:01:03", "remaining_time": "0:26:51"}
{"current_steps": 13, "total_steps": 315, "loss": 0.4084, "lr": 8.125000000000001e-06, "epoch": 0.20634920634920634, "percentage": 4.13, "elapsed_time": "0:01:08", "remaining_time": "0:26:29"}
{"current_steps": 14, "total_steps": 315, "loss": 0.4557, "lr": 8.750000000000001e-06, "epoch": 0.2222222222222222, "percentage": 4.44, "elapsed_time": "0:01:13", "remaining_time": "0:26:19"}
{"current_steps": 15, "total_steps": 315, "loss": 0.4589, "lr": 9.375000000000001e-06, "epoch": 0.23809523809523808, "percentage": 4.76, "elapsed_time": "0:01:17", "remaining_time": "0:25:52"}
{"current_steps": 16, "total_steps": 315, "loss": 0.4847, "lr": 1e-05, "epoch": 0.25396825396825395, "percentage": 5.08, "elapsed_time": "0:01:22", "remaining_time": "0:25:33"}
{"current_steps": 17, "total_steps": 315, "loss": 0.5561, "lr": 9.999724009977419e-06, "epoch": 0.2698412698412698, "percentage": 5.4, "elapsed_time": "0:01:26", "remaining_time": "0:25:10"}
{"current_steps": 18, "total_steps": 315, "loss": 0.3696, "lr": 9.998896070377873e-06, "epoch": 0.2857142857142857, "percentage": 5.71, "elapsed_time": "0:01:30", "remaining_time": "0:25:01"}
{"current_steps": 19, "total_steps": 315, "loss": 0.4165, "lr": 9.99751627260259e-06, "epoch": 0.30158730158730157, "percentage": 6.03, "elapsed_time": "0:01:35", "remaining_time": "0:24:52"}
{"current_steps": 20, "total_steps": 315, "loss": 0.4077, "lr": 9.995584768975735e-06, "epoch": 0.31746031746031744, "percentage": 6.35, "elapsed_time": "0:01:40", "remaining_time": "0:24:44"}
{"current_steps": 21, "total_steps": 315, "loss": 0.443, "lr": 9.993101772727602e-06, "epoch": 0.3333333333333333, "percentage": 6.67, "elapsed_time": "0:01:44", "remaining_time": "0:24:28"}
{"current_steps": 22, "total_steps": 315, "loss": 0.6172, "lr": 9.990067557971068e-06, "epoch": 0.3492063492063492, "percentage": 6.98, "elapsed_time": "0:01:49", "remaining_time": "0:24:14"}
{"current_steps": 23, "total_steps": 315, "loss": 0.449, "lr": 9.986482459671332e-06, "epoch": 0.36507936507936506, "percentage": 7.3, "elapsed_time": "0:01:54", "remaining_time": "0:24:08"}
{"current_steps": 24, "total_steps": 315, "loss": 0.4212, "lr": 9.982346873608936e-06, "epoch": 0.38095238095238093, "percentage": 7.62, "elapsed_time": "0:01:58", "remaining_time": "0:23:57"}
{"current_steps": 25, "total_steps": 315, "loss": 0.4472, "lr": 9.977661256336081e-06, "epoch": 0.3968253968253968, "percentage": 7.94, "elapsed_time": "0:02:02", "remaining_time": "0:23:45"}
{"current_steps": 26, "total_steps": 315, "loss": 0.4493, "lr": 9.972426125126208e-06, "epoch": 0.4126984126984127, "percentage": 8.25, "elapsed_time": "0:02:07", "remaining_time": "0:23:34"}
{"current_steps": 27, "total_steps": 315, "loss": 0.6344, "lr": 9.966642057916915e-06, "epoch": 0.42857142857142855, "percentage": 8.57, "elapsed_time": "0:02:12", "remaining_time": "0:23:33"}
{"current_steps": 28, "total_steps": 315, "loss": 0.348, "lr": 9.960309693246135e-06, "epoch": 0.4444444444444444, "percentage": 8.89, "elapsed_time": "0:02:17", "remaining_time": "0:23:26"}
{"current_steps": 29, "total_steps": 315, "loss": 0.4737, "lr": 9.953429730181653e-06, "epoch": 0.4603174603174603, "percentage": 9.21, "elapsed_time": "0:02:21", "remaining_time": "0:23:18"}
{"current_steps": 30, "total_steps": 315, "loss": 0.4073, "lr": 9.94600292824394e-06, "epoch": 0.47619047619047616, "percentage": 9.52, "elapsed_time": "0:02:26", "remaining_time": "0:23:10"}
{"current_steps": 31, "total_steps": 315, "loss": 0.4142, "lr": 9.938030107322284e-06, "epoch": 0.49206349206349204, "percentage": 9.84, "elapsed_time": "0:02:30", "remaining_time": "0:23:02"}
{"current_steps": 32, "total_steps": 315, "loss": 0.4375, "lr": 9.929512147584297e-06, "epoch": 0.5079365079365079, "percentage": 10.16, "elapsed_time": "0:02:35", "remaining_time": "0:22:55"}
{"current_steps": 33, "total_steps": 315, "loss": 0.3821, "lr": 9.920449989378741e-06, "epoch": 0.5238095238095238, "percentage": 10.48, "elapsed_time": "0:02:40", "remaining_time": "0:22:50"}
{"current_steps": 34, "total_steps": 315, "loss": 0.4905, "lr": 9.910844633131712e-06, "epoch": 0.5396825396825397, "percentage": 10.79, "elapsed_time": "0:02:44", "remaining_time": "0:22:40"}
{"current_steps": 35, "total_steps": 315, "loss": 0.4102, "lr": 9.90069713923621e-06, "epoch": 0.5555555555555556, "percentage": 11.11, "elapsed_time": "0:02:48", "remaining_time": "0:22:31"}
{"current_steps": 36, "total_steps": 315, "loss": 0.3664, "lr": 9.890008627935057e-06, "epoch": 0.5714285714285714, "percentage": 11.43, "elapsed_time": "0:02:53", "remaining_time": "0:22:27"}
{"current_steps": 37, "total_steps": 315, "loss": 0.4242, "lr": 9.878780279197246e-06, "epoch": 0.5873015873015873, "percentage": 11.75, "elapsed_time": "0:02:58", "remaining_time": "0:22:20"}
{"current_steps": 38, "total_steps": 315, "loss": 0.3822, "lr": 9.867013332587667e-06, "epoch": 0.6031746031746031, "percentage": 12.06, "elapsed_time": "0:03:02", "remaining_time": "0:22:11"}
{"current_steps": 39, "total_steps": 315, "loss": 0.3681, "lr": 9.854709087130261e-06, "epoch": 0.6190476190476191, "percentage": 12.38, "elapsed_time": "0:03:07", "remaining_time": "0:22:05"}
{"current_steps": 40, "total_steps": 315, "loss": 0.3989, "lr": 9.841868901164621e-06, "epoch": 0.6349206349206349, "percentage": 12.7, "elapsed_time": "0:03:11", "remaining_time": "0:21:57"}
{"current_steps": 41, "total_steps": 315, "loss": 0.415, "lr": 9.828494192196037e-06, "epoch": 0.6507936507936508, "percentage": 13.02, "elapsed_time": "0:03:16", "remaining_time": "0:21:53"}
{"current_steps": 42, "total_steps": 315, "loss": 0.5562, "lr": 9.814586436738998e-06, "epoch": 0.6666666666666666, "percentage": 13.33, "elapsed_time": "0:03:21", "remaining_time": "0:21:47"}
{"current_steps": 43, "total_steps": 315, "loss": 0.4761, "lr": 9.8001471701542e-06, "epoch": 0.6825396825396826, "percentage": 13.65, "elapsed_time": "0:03:25", "remaining_time": "0:21:39"}
{"current_steps": 44, "total_steps": 315, "loss": 0.3765, "lr": 9.785177986479049e-06, "epoch": 0.6984126984126984, "percentage": 13.97, "elapsed_time": "0:03:29", "remaining_time": "0:21:32"}
{"current_steps": 45, "total_steps": 315, "loss": 0.3527, "lr": 9.76968053825168e-06, "epoch": 0.7142857142857143, "percentage": 14.29, "elapsed_time": "0:03:34", "remaining_time": "0:21:27"}
{"current_steps": 46, "total_steps": 315, "loss": 0.3922, "lr": 9.753656536328529e-06, "epoch": 0.7301587301587301, "percentage": 14.6, "elapsed_time": "0:03:39", "remaining_time": "0:21:22"}
{"current_steps": 47, "total_steps": 315, "loss": 0.4186, "lr": 9.737107749695456e-06, "epoch": 0.746031746031746, "percentage": 14.92, "elapsed_time": "0:03:44", "remaining_time": "0:21:19"}
{"current_steps": 48, "total_steps": 315, "loss": 0.3813, "lr": 9.72003600527246e-06, "epoch": 0.7619047619047619, "percentage": 15.24, "elapsed_time": "0:03:49", "remaining_time": "0:21:15"}
{"current_steps": 49, "total_steps": 315, "loss": 0.4344, "lr": 9.702443187711991e-06, "epoch": 0.7777777777777778, "percentage": 15.56, "elapsed_time": "0:03:54", "remaining_time": "0:21:10"}
{"current_steps": 50, "total_steps": 315, "loss": 0.3941, "lr": 9.6843312391909e-06, "epoch": 0.7936507936507936, "percentage": 15.87, "elapsed_time": "0:03:58", "remaining_time": "0:21:03"}
{"current_steps": 51, "total_steps": 315, "loss": 0.416, "lr": 9.665702159196014e-06, "epoch": 0.8095238095238095, "percentage": 16.19, "elapsed_time": "0:04:02", "remaining_time": "0:20:55"}
{"current_steps": 52, "total_steps": 315, "loss": 0.4598, "lr": 9.646558004303419e-06, "epoch": 0.8253968253968254, "percentage": 16.51, "elapsed_time": "0:04:07", "remaining_time": "0:20:52"}
{"current_steps": 53, "total_steps": 315, "loss": 0.3808, "lr": 9.62690088795141e-06, "epoch": 0.8412698412698413, "percentage": 16.83, "elapsed_time": "0:04:12", "remaining_time": "0:20:46"}
{"current_steps": 54, "total_steps": 315, "loss": 0.4116, "lr": 9.606732980207186e-06, "epoch": 0.8571428571428571, "percentage": 17.14, "elapsed_time": "0:04:17", "remaining_time": "0:20:44"}
{"current_steps": 55, "total_steps": 315, "loss": 0.4522, "lr": 9.586056507527266e-06, "epoch": 0.873015873015873, "percentage": 17.46, "elapsed_time": "0:04:22", "remaining_time": "0:20:38"}
{"current_steps": 56, "total_steps": 315, "loss": 0.3886, "lr": 9.564873752511719e-06, "epoch": 0.8888888888888888, "percentage": 17.78, "elapsed_time": "0:04:26", "remaining_time": "0:20:32"}
{"current_steps": 57, "total_steps": 315, "loss": 0.4676, "lr": 9.543187053652156e-06, "epoch": 0.9047619047619048, "percentage": 18.1, "elapsed_time": "0:04:31", "remaining_time": "0:20:28"}
{"current_steps": 58, "total_steps": 315, "loss": 0.3943, "lr": 9.520998805073583e-06, "epoch": 0.9206349206349206, "percentage": 18.41, "elapsed_time": "0:04:36", "remaining_time": "0:20:24"}
{"current_steps": 59, "total_steps": 315, "loss": 0.428, "lr": 9.498311456270091e-06, "epoch": 0.9365079365079365, "percentage": 18.73, "elapsed_time": "0:04:40", "remaining_time": "0:20:18"}
{"current_steps": 60, "total_steps": 315, "loss": 0.4173, "lr": 9.475127511834438e-06, "epoch": 0.9523809523809523, "percentage": 19.05, "elapsed_time": "0:04:45", "remaining_time": "0:20:14"}
{"current_steps": 61, "total_steps": 315, "loss": 0.3549, "lr": 9.451449531181571e-06, "epoch": 0.9682539682539683, "percentage": 19.37, "elapsed_time": "0:04:50", "remaining_time": "0:20:08"}
{"current_steps": 62, "total_steps": 315, "loss": 0.3883, "lr": 9.427280128266049e-06, "epoch": 0.9841269841269841, "percentage": 19.68, "elapsed_time": "0:04:55", "remaining_time": "0:20:04"}
{"current_steps": 63, "total_steps": 315, "loss": 0.2915, "lr": 9.4026219712935e-06, "epoch": 1.0, "percentage": 20.0, "elapsed_time": "0:04:59", "remaining_time": "0:19:59"}
{"current_steps": 64, "total_steps": 315, "loss": 0.3061, "lr": 9.377477782426041e-06, "epoch": 1.0158730158730158, "percentage": 20.32, "elapsed_time": "0:05:59", "remaining_time": "0:23:28"}
{"current_steps": 65, "total_steps": 315, "loss": 0.2833, "lr": 9.351850337481774e-06, "epoch": 1.0317460317460316, "percentage": 20.63, "elapsed_time": "0:06:04", "remaining_time": "0:23:21"}
{"current_steps": 66, "total_steps": 315, "loss": 0.321, "lr": 9.325742465628342e-06, "epoch": 1.0476190476190477, "percentage": 20.95, "elapsed_time": "0:06:09", "remaining_time": "0:23:13"}
{"current_steps": 67, "total_steps": 315, "loss": 0.3441, "lr": 9.299157049070604e-06, "epoch": 1.0634920634920635, "percentage": 21.27, "elapsed_time": "0:06:14", "remaining_time": "0:23:04"}
{"current_steps": 68, "total_steps": 315, "loss": 0.3403, "lr": 9.272097022732444e-06, "epoch": 1.0793650793650793, "percentage": 21.59, "elapsed_time": "0:06:18", "remaining_time": "0:22:54"}
{"current_steps": 69, "total_steps": 315, "loss": 0.2966, "lr": 9.244565373932775e-06, "epoch": 1.0952380952380953, "percentage": 21.9, "elapsed_time": "0:06:23", "remaining_time": "0:22:46"}
{"current_steps": 70, "total_steps": 315, "loss": 0.3033, "lr": 9.216565142055745e-06, "epoch": 1.1111111111111112, "percentage": 22.22, "elapsed_time": "0:06:27", "remaining_time": "0:22:36"}
{"current_steps": 71, "total_steps": 315, "loss": 0.2468, "lr": 9.188099418215208e-06, "epoch": 1.126984126984127, "percentage": 22.54, "elapsed_time": "0:06:32", "remaining_time": "0:22:29"}
{"current_steps": 72, "total_steps": 315, "loss": 0.2306, "lr": 9.159171344913469e-06, "epoch": 1.1428571428571428, "percentage": 22.86, "elapsed_time": "0:06:37", "remaining_time": "0:22:20"}
{"current_steps": 73, "total_steps": 315, "loss": 0.243, "lr": 9.129784115694368e-06, "epoch": 1.1587301587301586, "percentage": 23.17, "elapsed_time": "0:06:41", "remaining_time": "0:22:11"}
{"current_steps": 74, "total_steps": 315, "loss": 0.2564, "lr": 9.09994097479073e-06, "epoch": 1.1746031746031746, "percentage": 23.49, "elapsed_time": "0:06:46", "remaining_time": "0:22:03"}
{"current_steps": 75, "total_steps": 315, "loss": 0.257, "lr": 9.069645216766207e-06, "epoch": 1.1904761904761905, "percentage": 23.81, "elapsed_time": "0:06:50", "remaining_time": "0:21:54"}
{"current_steps": 76, "total_steps": 315, "loss": 0.266, "lr": 9.038900186151574e-06, "epoch": 1.2063492063492063, "percentage": 24.13, "elapsed_time": "0:06:55", "remaining_time": "0:21:47"}
{"current_steps": 77, "total_steps": 315, "loss": 0.3483, "lr": 9.007709277075512e-06, "epoch": 1.2222222222222223, "percentage": 24.44, "elapsed_time": "0:07:00", "remaining_time": "0:21:38"}
{"current_steps": 78, "total_steps": 315, "loss": 0.3127, "lr": 8.976075932889896e-06, "epoch": 1.2380952380952381, "percentage": 24.76, "elapsed_time": "0:07:04", "remaining_time": "0:21:31"}
{"current_steps": 79, "total_steps": 315, "loss": 0.2439, "lr": 8.944003645789678e-06, "epoch": 1.253968253968254, "percentage": 25.08, "elapsed_time": "0:07:09", "remaining_time": "0:21:23"}
{"current_steps": 80, "total_steps": 315, "loss": 0.2308, "lr": 8.911495956427358e-06, "epoch": 1.2698412698412698, "percentage": 25.4, "elapsed_time": "0:07:14", "remaining_time": "0:21:15"}
{"current_steps": 81, "total_steps": 315, "loss": 0.324, "lr": 8.8785564535221e-06, "epoch": 1.2857142857142856, "percentage": 25.71, "elapsed_time": "0:07:18", "remaining_time": "0:21:07"}
{"current_steps": 82, "total_steps": 315, "loss": 0.2778, "lr": 8.845188773463567e-06, "epoch": 1.3015873015873016, "percentage": 26.03, "elapsed_time": "0:07:23", "remaining_time": "0:21:00"}
{"current_steps": 83, "total_steps": 315, "loss": 0.2716, "lr": 8.811396599910467e-06, "epoch": 1.3174603174603174, "percentage": 26.35, "elapsed_time": "0:07:28", "remaining_time": "0:20:53"}
{"current_steps": 84, "total_steps": 315, "loss": 0.255, "lr": 8.777183663383897e-06, "epoch": 1.3333333333333333, "percentage": 26.67, "elapsed_time": "0:07:33", "remaining_time": "0:20:47"}
{"current_steps": 85, "total_steps": 315, "loss": 0.3788, "lr": 8.742553740855507e-06, "epoch": 1.3492063492063493, "percentage": 26.98, "elapsed_time": "0:07:38", "remaining_time": "0:20:40"}
{"current_steps": 86, "total_steps": 315, "loss": 0.3025, "lr": 8.707510655330536e-06, "epoch": 1.3650793650793651, "percentage": 27.3, "elapsed_time": "0:07:42", "remaining_time": "0:20:32"}
{"current_steps": 87, "total_steps": 315, "loss": 0.3145, "lr": 8.672058275425773e-06, "epoch": 1.380952380952381, "percentage": 27.62, "elapsed_time": "0:07:47", "remaining_time": "0:20:25"}
{"current_steps": 88, "total_steps": 315, "loss": 0.2297, "lr": 8.636200514942466e-06, "epoch": 1.3968253968253967, "percentage": 27.94, "elapsed_time": "0:07:52", "remaining_time": "0:20:18"}
{"current_steps": 89, "total_steps": 315, "loss": 0.3053, "lr": 8.59994133243427e-06, "epoch": 1.4126984126984126, "percentage": 28.25, "elapsed_time": "0:07:57", "remaining_time": "0:20:13"}
{"current_steps": 90, "total_steps": 315, "loss": 0.2567, "lr": 8.563284730770222e-06, "epoch": 1.4285714285714286, "percentage": 28.57, "elapsed_time": "0:08:02", "remaining_time": "0:20:06"}
{"current_steps": 91, "total_steps": 315, "loss": 0.2339, "lr": 8.52623475669285e-06, "epoch": 1.4444444444444444, "percentage": 28.89, "elapsed_time": "0:08:07", "remaining_time": "0:20:00"}
{"current_steps": 92, "total_steps": 315, "loss": 0.2888, "lr": 8.488795500371427e-06, "epoch": 1.4603174603174602, "percentage": 29.21, "elapsed_time": "0:08:12", "remaining_time": "0:19:53"}
{"current_steps": 93, "total_steps": 315, "loss": 0.2689, "lr": 8.450971094950433e-06, "epoch": 1.4761904761904763, "percentage": 29.52, "elapsed_time": "0:08:16", "remaining_time": "0:19:45"}
{"current_steps": 94, "total_steps": 315, "loss": 0.3078, "lr": 8.412765716093273e-06, "epoch": 1.492063492063492, "percentage": 29.84, "elapsed_time": "0:08:21", "remaining_time": "0:19:39"}
{"current_steps": 95, "total_steps": 315, "loss": 0.2912, "lr": 8.374183581521288e-06, "epoch": 1.507936507936508, "percentage": 30.16, "elapsed_time": "0:08:27", "remaining_time": "0:19:35"}
{"current_steps": 96, "total_steps": 315, "loss": 0.3256, "lr": 8.335228950548164e-06, "epoch": 1.5238095238095237, "percentage": 30.48, "elapsed_time": "0:08:32", "remaining_time": "0:19:28"}
{"current_steps": 97, "total_steps": 315, "loss": 0.2535, "lr": 8.29590612360969e-06, "epoch": 1.5396825396825395, "percentage": 30.79, "elapsed_time": "0:08:36", "remaining_time": "0:19:20"}
{"current_steps": 98, "total_steps": 315, "loss": 0.278, "lr": 8.256219441789023e-06, "epoch": 1.5555555555555556, "percentage": 31.11, "elapsed_time": "0:08:41", "remaining_time": "0:19:13"}
{"current_steps": 99, "total_steps": 315, "loss": 0.2403, "lr": 8.216173286337449e-06, "epoch": 1.5714285714285714, "percentage": 31.43, "elapsed_time": "0:08:45", "remaining_time": "0:19:07"}
{"current_steps": 100, "total_steps": 315, "loss": 0.2594, "lr": 8.175772078190706e-06, "epoch": 1.5873015873015874, "percentage": 31.75, "elapsed_time": "0:08:50", "remaining_time": "0:19:00"}
{"current_steps": 101, "total_steps": 315, "loss": 0.2489, "lr": 8.135020277480933e-06, "epoch": 1.6031746031746033, "percentage": 32.06, "elapsed_time": "0:08:55", "remaining_time": "0:18:55"}
{"current_steps": 102, "total_steps": 315, "loss": 0.2904, "lr": 8.093922383044293e-06, "epoch": 1.619047619047619, "percentage": 32.38, "elapsed_time": "0:09:00", "remaining_time": "0:18:49"}
{"current_steps": 103, "total_steps": 315, "loss": 0.2269, "lr": 8.052482931924307e-06, "epoch": 1.6349206349206349, "percentage": 32.7, "elapsed_time": "0:09:05", "remaining_time": "0:18:43"}
{"current_steps": 104, "total_steps": 315, "loss": 0.2961, "lr": 8.010706498870997e-06, "epoch": 1.6507936507936507, "percentage": 33.02, "elapsed_time": "0:09:10", "remaining_time": "0:18:37"}
{"current_steps": 105, "total_steps": 315, "loss": 0.2793, "lr": 7.968597695835845e-06, "epoch": 1.6666666666666665, "percentage": 33.33, "elapsed_time": "0:09:15", "remaining_time": "0:18:31"}
{"current_steps": 106, "total_steps": 315, "loss": 0.2727, "lr": 7.926161171462647e-06, "epoch": 1.6825396825396826, "percentage": 33.65, "elapsed_time": "0:09:21", "remaining_time": "0:18:26"}
{"current_steps": 107, "total_steps": 315, "loss": 0.3002, "lr": 7.883401610574338e-06, "epoch": 1.6984126984126984, "percentage": 33.97, "elapsed_time": "0:09:25", "remaining_time": "0:18:19"}
{"current_steps": 108, "total_steps": 315, "loss": 0.267, "lr": 7.84032373365578e-06, "epoch": 1.7142857142857144, "percentage": 34.29, "elapsed_time": "0:09:30", "remaining_time": "0:18:13"}
{"current_steps": 109, "total_steps": 315, "loss": 0.2372, "lr": 7.796932296332666e-06, "epoch": 1.7301587301587302, "percentage": 34.6, "elapsed_time": "0:09:35", "remaining_time": "0:18:07"}
{"current_steps": 110, "total_steps": 315, "loss": 0.209, "lr": 7.753232088846505e-06, "epoch": 1.746031746031746, "percentage": 34.92, "elapsed_time": "0:09:40", "remaining_time": "0:18:01"}
{"current_steps": 111, "total_steps": 315, "loss": 0.3326, "lr": 7.709227935525796e-06, "epoch": 1.7619047619047619, "percentage": 35.24, "elapsed_time": "0:09:44", "remaining_time": "0:17:55"}
{"current_steps": 112, "total_steps": 315, "loss": 0.2302, "lr": 7.664924694253444e-06, "epoch": 1.7777777777777777, "percentage": 35.56, "elapsed_time": "0:09:49", "remaining_time": "0:17:48"}
{"current_steps": 113, "total_steps": 315, "loss": 0.2521, "lr": 7.620327255930475e-06, "epoch": 1.7936507936507935, "percentage": 35.87, "elapsed_time": "0:09:54", "remaining_time": "0:17:42"}
{"current_steps": 114, "total_steps": 315, "loss": 0.281, "lr": 7.575440543936092e-06, "epoch": 1.8095238095238095, "percentage": 36.19, "elapsed_time": "0:09:59", "remaining_time": "0:17:36"}
{"current_steps": 115, "total_steps": 315, "loss": 0.2883, "lr": 7.530269513584158e-06, "epoch": 1.8253968253968254, "percentage": 36.51, "elapsed_time": "0:10:03", "remaining_time": "0:17:30"}
{"current_steps": 116, "total_steps": 315, "loss": 0.2206, "lr": 7.484819151576148e-06, "epoch": 1.8412698412698414, "percentage": 36.83, "elapsed_time": "0:10:09", "remaining_time": "0:17:25"}
{"current_steps": 117, "total_steps": 315, "loss": 0.2747, "lr": 7.439094475450638e-06, "epoch": 1.8571428571428572, "percentage": 37.14, "elapsed_time": "0:10:13", "remaining_time": "0:17:18"}
{"current_steps": 118, "total_steps": 315, "loss": 0.2526, "lr": 7.393100533029383e-06, "epoch": 1.873015873015873, "percentage": 37.46, "elapsed_time": "0:10:18", "remaining_time": "0:17:12"}
{"current_steps": 119, "total_steps": 315, "loss": 0.2664, "lr": 7.346842401860069e-06, "epoch": 1.8888888888888888, "percentage": 37.78, "elapsed_time": "0:10:22", "remaining_time": "0:17:05"}
{"current_steps": 120, "total_steps": 315, "loss": 0.3116, "lr": 7.300325188655762e-06, "epoch": 1.9047619047619047, "percentage": 38.1, "elapsed_time": "0:10:27", "remaining_time": "0:16:59"}
{"current_steps": 121, "total_steps": 315, "loss": 0.2469, "lr": 7.253554028731149e-06, "epoch": 1.9206349206349205, "percentage": 38.41, "elapsed_time": "0:10:31", "remaining_time": "0:16:52"}
{"current_steps": 122, "total_steps": 315, "loss": 0.3119, "lr": 7.206534085435626e-06, "epoch": 1.9365079365079365, "percentage": 38.73, "elapsed_time": "0:10:36", "remaining_time": "0:16:46"}
{"current_steps": 123, "total_steps": 315, "loss": 0.3276, "lr": 7.159270549583278e-06, "epoch": 1.9523809523809523, "percentage": 39.05, "elapsed_time": "0:10:41", "remaining_time": "0:16:40"}
{"current_steps": 124, "total_steps": 315, "loss": 0.3258, "lr": 7.111768638879834e-06, "epoch": 1.9682539682539684, "percentage": 39.37, "elapsed_time": "0:10:45", "remaining_time": "0:16:34"}
{"current_steps": 125, "total_steps": 315, "loss": 0.2642, "lr": 7.064033597346658e-06, "epoch": 1.9841269841269842, "percentage": 39.68, "elapsed_time": "0:10:50", "remaining_time": "0:16:28"}
{"current_steps": 126, "total_steps": 315, "loss": 0.2064, "lr": 7.016070694741824e-06, "epoch": 2.0, "percentage": 40.0, "elapsed_time": "0:10:54", "remaining_time": "0:16:22"}
{"current_steps": 127, "total_steps": 315, "loss": 0.1503, "lr": 6.967885225978366e-06, "epoch": 2.015873015873016, "percentage": 40.32, "elapsed_time": "0:12:01", "remaining_time": "0:17:48"}
{"current_steps": 128, "total_steps": 315, "loss": 0.1975, "lr": 6.919482510539723e-06, "epoch": 2.0317460317460316, "percentage": 40.63, "elapsed_time": "0:12:06", "remaining_time": "0:17:41"}
{"current_steps": 129, "total_steps": 315, "loss": 0.1729, "lr": 6.870867891892511e-06, "epoch": 2.0476190476190474, "percentage": 40.95, "elapsed_time": "0:12:11", "remaining_time": "0:17:34"}
{"current_steps": 130, "total_steps": 315, "loss": 0.1817, "lr": 6.822046736896607e-06, "epoch": 2.0634920634920633, "percentage": 41.27, "elapsed_time": "0:12:16", "remaining_time": "0:17:27"}
{"current_steps": 131, "total_steps": 315, "loss": 0.1369, "lr": 6.773024435212678e-06, "epoch": 2.0793650793650795, "percentage": 41.59, "elapsed_time": "0:12:21", "remaining_time": "0:17:21"}
{"current_steps": 132, "total_steps": 315, "loss": 0.1838, "lr": 6.723806398707186e-06, "epoch": 2.0952380952380953, "percentage": 41.9, "elapsed_time": "0:12:25", "remaining_time": "0:17:14"}
{"current_steps": 133, "total_steps": 315, "loss": 0.1644, "lr": 6.674398060854931e-06, "epoch": 2.111111111111111, "percentage": 42.22, "elapsed_time": "0:12:30", "remaining_time": "0:17:07"}
{"current_steps": 134, "total_steps": 315, "loss": 0.1492, "lr": 6.624804876139227e-06, "epoch": 2.126984126984127, "percentage": 42.54, "elapsed_time": "0:12:35", "remaining_time": "0:16:59"}
{"current_steps": 135, "total_steps": 315, "loss": 0.1795, "lr": 6.57503231944974e-06, "epoch": 2.142857142857143, "percentage": 42.86, "elapsed_time": "0:12:39", "remaining_time": "0:16:53"}
{"current_steps": 136, "total_steps": 315, "loss": 0.1627, "lr": 6.525085885478088e-06, "epoch": 2.1587301587301586, "percentage": 43.17, "elapsed_time": "0:12:45", "remaining_time": "0:16:47"}
{"current_steps": 137, "total_steps": 315, "loss": 0.1748, "lr": 6.4749710881112485e-06, "epoch": 2.1746031746031744, "percentage": 43.49, "elapsed_time": "0:12:50", "remaining_time": "0:16:40"}
{"current_steps": 138, "total_steps": 315, "loss": 0.1992, "lr": 6.424693459822843e-06, "epoch": 2.1904761904761907, "percentage": 43.81, "elapsed_time": "0:12:55", "remaining_time": "0:16:34"}
{"current_steps": 139, "total_steps": 315, "loss": 0.1592, "lr": 6.374258551062377e-06, "epoch": 2.2063492063492065, "percentage": 44.13, "elapsed_time": "0:12:59", "remaining_time": "0:16:26"}
{"current_steps": 140, "total_steps": 315, "loss": 0.1651, "lr": 6.3236719296424985e-06, "epoch": 2.2222222222222223, "percentage": 44.44, "elapsed_time": "0:13:03", "remaining_time": "0:16:19"}
{"current_steps": 141, "total_steps": 315, "loss": 0.1316, "lr": 6.272939180124316e-06, "epoch": 2.238095238095238, "percentage": 44.76, "elapsed_time": "0:13:08", "remaining_time": "0:16:13"}
{"current_steps": 142, "total_steps": 315, "loss": 0.1803, "lr": 6.222065903200909e-06, "epoch": 2.253968253968254, "percentage": 45.08, "elapsed_time": "0:13:13", "remaining_time": "0:16:06"}
{"current_steps": 143, "total_steps": 315, "loss": 0.1498, "lr": 6.171057715079012e-06, "epoch": 2.2698412698412698, "percentage": 45.4, "elapsed_time": "0:13:18", "remaining_time": "0:16:00"}
{"current_steps": 144, "total_steps": 315, "loss": 0.1352, "lr": 6.119920246859025e-06, "epoch": 2.2857142857142856, "percentage": 45.71, "elapsed_time": "0:13:23", "remaining_time": "0:15:53"}
{"current_steps": 145, "total_steps": 315, "loss": 0.1555, "lr": 6.068659143913349e-06, "epoch": 2.3015873015873014, "percentage": 46.03, "elapsed_time": "0:13:27", "remaining_time": "0:15:47"}
{"current_steps": 146, "total_steps": 315, "loss": 0.1515, "lr": 6.0172800652631706e-06, "epoch": 2.317460317460317, "percentage": 46.35, "elapsed_time": "0:13:32", "remaining_time": "0:15:40"}
{"current_steps": 147, "total_steps": 315, "loss": 0.1414, "lr": 5.965788682953717e-06, "epoch": 2.3333333333333335, "percentage": 46.67, "elapsed_time": "0:13:36", "remaining_time": "0:15:33"}
{"current_steps": 148, "total_steps": 315, "loss": 0.1582, "lr": 5.914190681428098e-06, "epoch": 2.3492063492063493, "percentage": 46.98, "elapsed_time": "0:13:41", "remaining_time": "0:15:26"}
{"current_steps": 149, "total_steps": 315, "loss": 0.1948, "lr": 5.862491756899753e-06, "epoch": 2.365079365079365, "percentage": 47.3, "elapsed_time": "0:13:45", "remaining_time": "0:15:20"}
{"current_steps": 150, "total_steps": 315, "loss": 0.1588, "lr": 5.8106976167236236e-06, "epoch": 2.380952380952381, "percentage": 47.62, "elapsed_time": "0:13:50", "remaining_time": "0:15:13"}
{"current_steps": 151, "total_steps": 315, "loss": 0.1354, "lr": 5.758813978766077e-06, "epoch": 2.3968253968253967, "percentage": 47.94, "elapsed_time": "0:13:55", "remaining_time": "0:15:07"}
{"current_steps": 152, "total_steps": 315, "loss": 0.1673, "lr": 5.706846570773677e-06, "epoch": 2.4126984126984126, "percentage": 48.25, "elapsed_time": "0:13:59", "remaining_time": "0:15:00"}
{"current_steps": 153, "total_steps": 315, "loss": 0.1474, "lr": 5.654801129740863e-06, "epoch": 2.4285714285714284, "percentage": 48.57, "elapsed_time": "0:14:04", "remaining_time": "0:14:54"}
{"current_steps": 154, "total_steps": 315, "loss": 0.2067, "lr": 5.6026834012766155e-06, "epoch": 2.4444444444444446, "percentage": 48.89, "elapsed_time": "0:14:08", "remaining_time": "0:14:47"}
{"current_steps": 155, "total_steps": 315, "loss": 0.1449, "lr": 5.550499138970158e-06, "epoch": 2.4603174603174605, "percentage": 49.21, "elapsed_time": "0:14:13", "remaining_time": "0:14:40"}
{"current_steps": 156, "total_steps": 315, "loss": 0.1716, "lr": 5.4982541037557825e-06, "epoch": 2.4761904761904763, "percentage": 49.52, "elapsed_time": "0:14:17", "remaining_time": "0:14:34"}
{"current_steps": 157, "total_steps": 315, "loss": 0.1932, "lr": 5.44595406327687e-06, "epoch": 2.492063492063492, "percentage": 49.84, "elapsed_time": "0:14:22", "remaining_time": "0:14:28"}
{"current_steps": 158, "total_steps": 315, "loss": 0.1787, "lr": 5.393604791249158e-06, "epoch": 2.507936507936508, "percentage": 50.16, "elapsed_time": "0:14:27", "remaining_time": "0:14:21"}
{"current_steps": 159, "total_steps": 315, "loss": 0.1448, "lr": 5.341212066823356e-06, "epoch": 2.5238095238095237, "percentage": 50.48, "elapsed_time": "0:14:32", "remaining_time": "0:14:16"}
{"current_steps": 160, "total_steps": 315, "loss": 0.1788, "lr": 5.288781673947143e-06, "epoch": 2.5396825396825395, "percentage": 50.79, "elapsed_time": "0:14:37", "remaining_time": "0:14:09"}
{"current_steps": 161, "total_steps": 315, "loss": 0.1582, "lr": 5.2363194007266435e-06, "epoch": 2.5555555555555554, "percentage": 51.11, "elapsed_time": "0:14:41", "remaining_time": "0:14:03"}
{"current_steps": 162, "total_steps": 315, "loss": 0.1242, "lr": 5.183831038787449e-06, "epoch": 2.571428571428571, "percentage": 51.43, "elapsed_time": "0:14:46", "remaining_time": "0:13:56"}
{"current_steps": 163, "total_steps": 315, "loss": 0.1534, "lr": 5.131322382635236e-06, "epoch": 2.5873015873015874, "percentage": 51.75, "elapsed_time": "0:14:51", "remaining_time": "0:13:50"}
{"current_steps": 164, "total_steps": 315, "loss": 0.1479, "lr": 5.078799229016083e-06, "epoch": 2.6031746031746033, "percentage": 52.06, "elapsed_time": "0:14:55", "remaining_time": "0:13:44"}
{"current_steps": 165, "total_steps": 315, "loss": 0.1646, "lr": 5.0262673762765316e-06, "epoch": 2.619047619047619, "percentage": 52.38, "elapsed_time": "0:14:59", "remaining_time": "0:13:38"}
{"current_steps": 166, "total_steps": 315, "loss": 0.1708, "lr": 4.973732623723471e-06, "epoch": 2.634920634920635, "percentage": 52.7, "elapsed_time": "0:15:04", "remaining_time": "0:13:31"}
{"current_steps": 167, "total_steps": 315, "loss": 0.1294, "lr": 4.921200770983919e-06, "epoch": 2.6507936507936507, "percentage": 53.02, "elapsed_time": "0:15:09", "remaining_time": "0:13:26"}
{"current_steps": 168, "total_steps": 315, "loss": 0.1558, "lr": 4.8686776173647655e-06, "epoch": 2.6666666666666665, "percentage": 53.33, "elapsed_time": "0:15:15", "remaining_time": "0:13:20"}
{"current_steps": 169, "total_steps": 315, "loss": 0.1592, "lr": 4.816168961212553e-06, "epoch": 2.682539682539683, "percentage": 53.65, "elapsed_time": "0:15:19", "remaining_time": "0:13:14"}
{"current_steps": 170, "total_steps": 315, "loss": 0.1494, "lr": 4.763680599273357e-06, "epoch": 2.6984126984126986, "percentage": 53.97, "elapsed_time": "0:15:24", "remaining_time": "0:13:08"}
{"current_steps": 171, "total_steps": 315, "loss": 0.189, "lr": 4.711218326052859e-06, "epoch": 2.7142857142857144, "percentage": 54.29, "elapsed_time": "0:15:29", "remaining_time": "0:13:02"}
{"current_steps": 172, "total_steps": 315, "loss": 0.1343, "lr": 4.6587879331766465e-06, "epoch": 2.7301587301587302, "percentage": 54.6, "elapsed_time": "0:15:34", "remaining_time": "0:12:56"}
{"current_steps": 173, "total_steps": 315, "loss": 0.1931, "lr": 4.606395208750844e-06, "epoch": 2.746031746031746, "percentage": 54.92, "elapsed_time": "0:15:39", "remaining_time": "0:12:50"}
{"current_steps": 174, "total_steps": 315, "loss": 0.1393, "lr": 4.554045936723132e-06, "epoch": 2.761904761904762, "percentage": 55.24, "elapsed_time": "0:15:43", "remaining_time": "0:12:44"}
{"current_steps": 175, "total_steps": 315, "loss": 0.1446, "lr": 4.501745896244219e-06, "epoch": 2.7777777777777777, "percentage": 55.56, "elapsed_time": "0:15:48", "remaining_time": "0:12:38"}
{"current_steps": 176, "total_steps": 315, "loss": 0.1862, "lr": 4.4495008610298435e-06, "epoch": 2.7936507936507935, "percentage": 55.87, "elapsed_time": "0:15:53", "remaining_time": "0:12:33"}
{"current_steps": 177, "total_steps": 315, "loss": 0.1534, "lr": 4.397316598723385e-06, "epoch": 2.8095238095238093, "percentage": 56.19, "elapsed_time": "0:15:58", "remaining_time": "0:12:27"}
{"current_steps": 178, "total_steps": 315, "loss": 0.1519, "lr": 4.345198870259139e-06, "epoch": 2.825396825396825, "percentage": 56.51, "elapsed_time": "0:16:03", "remaining_time": "0:12:21"}
{"current_steps": 179, "total_steps": 315, "loss": 0.1756, "lr": 4.2931534292263265e-06, "epoch": 2.8412698412698414, "percentage": 56.83, "elapsed_time": "0:16:09", "remaining_time": "0:12:16"}
{"current_steps": 180, "total_steps": 315, "loss": 0.1506, "lr": 4.241186021233925e-06, "epoch": 2.857142857142857, "percentage": 57.14, "elapsed_time": "0:16:13", "remaining_time": "0:12:10"}
{"current_steps": 181, "total_steps": 315, "loss": 0.1507, "lr": 4.189302383276378e-06, "epoch": 2.873015873015873, "percentage": 57.46, "elapsed_time": "0:16:18", "remaining_time": "0:12:04"}
{"current_steps": 182, "total_steps": 315, "loss": 0.1472, "lr": 4.137508243100249e-06, "epoch": 2.888888888888889, "percentage": 57.78, "elapsed_time": "0:16:22", "remaining_time": "0:11:58"}
{"current_steps": 183, "total_steps": 315, "loss": 0.1738, "lr": 4.085809318571905e-06, "epoch": 2.9047619047619047, "percentage": 58.1, "elapsed_time": "0:16:27", "remaining_time": "0:11:52"}
{"current_steps": 184, "total_steps": 315, "loss": 0.1747, "lr": 4.034211317046285e-06, "epoch": 2.9206349206349205, "percentage": 58.41, "elapsed_time": "0:16:32", "remaining_time": "0:11:46"}
{"current_steps": 185, "total_steps": 315, "loss": 0.1544, "lr": 3.982719934736832e-06, "epoch": 2.9365079365079367, "percentage": 58.73, "elapsed_time": "0:16:37", "remaining_time": "0:11:40"}
{"current_steps": 186, "total_steps": 315, "loss": 0.1247, "lr": 3.931340856086652e-06, "epoch": 2.9523809523809526, "percentage": 59.05, "elapsed_time": "0:16:42", "remaining_time": "0:11:35"}
{"current_steps": 187, "total_steps": 315, "loss": 0.1405, "lr": 3.880079753140978e-06, "epoch": 2.9682539682539684, "percentage": 59.37, "elapsed_time": "0:16:47", "remaining_time": "0:11:29"}
{"current_steps": 188, "total_steps": 315, "loss": 0.18, "lr": 3.82894228492099e-06, "epoch": 2.984126984126984, "percentage": 59.68, "elapsed_time": "0:16:51", "remaining_time": "0:11:23"}
{"current_steps": 189, "total_steps": 315, "loss": 0.133, "lr": 3.777934096799094e-06, "epoch": 3.0, "percentage": 60.0, "elapsed_time": "0:16:56", "remaining_time": "0:11:17"}
{"current_steps": 190, "total_steps": 315, "loss": 0.0625, "lr": 3.7270608198756852e-06, "epoch": 3.015873015873016, "percentage": 60.32, "elapsed_time": "0:18:02", "remaining_time": "0:11:52"}
{"current_steps": 191, "total_steps": 315, "loss": 0.124, "lr": 3.676328070357503e-06, "epoch": 3.0317460317460316, "percentage": 60.63, "elapsed_time": "0:18:07", "remaining_time": "0:11:46"}
{"current_steps": 192, "total_steps": 315, "loss": 0.0867, "lr": 3.6257414489376217e-06, "epoch": 3.0476190476190474, "percentage": 60.95, "elapsed_time": "0:18:12", "remaining_time": "0:11:39"}
{"current_steps": 193, "total_steps": 315, "loss": 0.079, "lr": 3.5753065401771577e-06, "epoch": 3.0634920634920633, "percentage": 61.27, "elapsed_time": "0:18:17", "remaining_time": "0:11:33"}
{"current_steps": 194, "total_steps": 315, "loss": 0.0736, "lr": 3.5250289118887515e-06, "epoch": 3.0793650793650795, "percentage": 61.59, "elapsed_time": "0:18:22", "remaining_time": "0:11:27"}
{"current_steps": 195, "total_steps": 315, "loss": 0.0768, "lr": 3.4749141145219118e-06, "epoch": 3.0952380952380953, "percentage": 61.9, "elapsed_time": "0:18:27", "remaining_time": "0:11:21"}
{"current_steps": 196, "total_steps": 315, "loss": 0.0748, "lr": 3.424967680550261e-06, "epoch": 3.111111111111111, "percentage": 62.22, "elapsed_time": "0:18:31", "remaining_time": "0:11:14"}
{"current_steps": 197, "total_steps": 315, "loss": 0.101, "lr": 3.3751951238607745e-06, "epoch": 3.126984126984127, "percentage": 62.54, "elapsed_time": "0:18:35", "remaining_time": "0:11:08"}
{"current_steps": 198, "total_steps": 315, "loss": 0.0662, "lr": 3.3256019391450696e-06, "epoch": 3.142857142857143, "percentage": 62.86, "elapsed_time": "0:18:40", "remaining_time": "0:11:02"}
{"current_steps": 199, "total_steps": 315, "loss": 0.0731, "lr": 3.2761936012928147e-06, "epoch": 3.1587301587301586, "percentage": 63.17, "elapsed_time": "0:18:45", "remaining_time": "0:10:55"}
{"current_steps": 200, "total_steps": 315, "loss": 0.0725, "lr": 3.226975564787322e-06, "epoch": 3.1746031746031744, "percentage": 63.49, "elapsed_time": "0:18:50", "remaining_time": "0:10:50"}
{"current_steps": 201, "total_steps": 315, "loss": 0.0957, "lr": 3.177953263103394e-06, "epoch": 3.1904761904761907, "percentage": 63.81, "elapsed_time": "0:18:55", "remaining_time": "0:10:44"}
{"current_steps": 202, "total_steps": 315, "loss": 0.1012, "lr": 3.1291321081074887e-06, "epoch": 3.2063492063492065, "percentage": 64.13, "elapsed_time": "0:19:01", "remaining_time": "0:10:38"}
{"current_steps": 203, "total_steps": 315, "loss": 0.0683, "lr": 3.0805174894602775e-06, "epoch": 3.2222222222222223, "percentage": 64.44, "elapsed_time": "0:19:06", "remaining_time": "0:10:32"}
{"current_steps": 204, "total_steps": 315, "loss": 0.0834, "lr": 3.032114774021636e-06, "epoch": 3.238095238095238, "percentage": 64.76, "elapsed_time": "0:19:12", "remaining_time": "0:10:27"}
{"current_steps": 205, "total_steps": 315, "loss": 0.081, "lr": 2.9839293052581767e-06, "epoch": 3.253968253968254, "percentage": 65.08, "elapsed_time": "0:19:17", "remaining_time": "0:10:21"}
{"current_steps": 206, "total_steps": 315, "loss": 0.0698, "lr": 2.9359664026533443e-06, "epoch": 3.2698412698412698, "percentage": 65.4, "elapsed_time": "0:19:22", "remaining_time": "0:10:15"}
{"current_steps": 207, "total_steps": 315, "loss": 0.0795, "lr": 2.8882313611201684e-06, "epoch": 3.2857142857142856, "percentage": 65.71, "elapsed_time": "0:19:27", "remaining_time": "0:10:09"}
{"current_steps": 208, "total_steps": 315, "loss": 0.0929, "lr": 2.8407294504167238e-06, "epoch": 3.3015873015873014, "percentage": 66.03, "elapsed_time": "0:19:32", "remaining_time": "0:10:03"}
{"current_steps": 209, "total_steps": 315, "loss": 0.0832, "lr": 2.793465914564375e-06, "epoch": 3.317460317460317, "percentage": 66.35, "elapsed_time": "0:19:37", "remaining_time": "0:09:57"}
{"current_steps": 210, "total_steps": 315, "loss": 0.0827, "lr": 2.7464459712688517e-06, "epoch": 3.3333333333333335, "percentage": 66.67, "elapsed_time": "0:19:43", "remaining_time": "0:09:51"}
{"current_steps": 211, "total_steps": 315, "loss": 0.0938, "lr": 2.6996748113442397e-06, "epoch": 3.3492063492063493, "percentage": 66.98, "elapsed_time": "0:19:48", "remaining_time": "0:09:45"}
{"current_steps": 212, "total_steps": 315, "loss": 0.0807, "lr": 2.653157598139932e-06, "epoch": 3.365079365079365, "percentage": 67.3, "elapsed_time": "0:19:52", "remaining_time": "0:09:39"}
{"current_steps": 213, "total_steps": 315, "loss": 0.0645, "lr": 2.6068994669706184e-06, "epoch": 3.380952380952381, "percentage": 67.62, "elapsed_time": "0:19:58", "remaining_time": "0:09:33"}
{"current_steps": 214, "total_steps": 315, "loss": 0.0976, "lr": 2.560905524549364e-06, "epoch": 3.3968253968253967, "percentage": 67.94, "elapsed_time": "0:20:03", "remaining_time": "0:09:27"}
{"current_steps": 215, "total_steps": 315, "loss": 0.0732, "lr": 2.515180848423853e-06, "epoch": 3.4126984126984126, "percentage": 68.25, "elapsed_time": "0:20:08", "remaining_time": "0:09:22"}
{"current_steps": 216, "total_steps": 315, "loss": 0.0651, "lr": 2.469730486415842e-06, "epoch": 3.4285714285714284, "percentage": 68.57, "elapsed_time": "0:20:13", "remaining_time": "0:09:16"}
{"current_steps": 217, "total_steps": 315, "loss": 0.0758, "lr": 2.4245594560639086e-06, "epoch": 3.4444444444444446, "percentage": 68.89, "elapsed_time": "0:20:19", "remaining_time": "0:09:10"}
{"current_steps": 218, "total_steps": 315, "loss": 0.0791, "lr": 2.379672744069527e-06, "epoch": 3.4603174603174605, "percentage": 69.21, "elapsed_time": "0:20:24", "remaining_time": "0:09:04"}
{"current_steps": 219, "total_steps": 315, "loss": 0.0766, "lr": 2.335075305746558e-06, "epoch": 3.4761904761904763, "percentage": 69.52, "elapsed_time": "0:20:29", "remaining_time": "0:08:59"}
{"current_steps": 220, "total_steps": 315, "loss": 0.0828, "lr": 2.2907720644742064e-06, "epoch": 3.492063492063492, "percentage": 69.84, "elapsed_time": "0:20:34", "remaining_time": "0:08:52"}
{"current_steps": 221, "total_steps": 315, "loss": 0.0738, "lr": 2.2467679111534963e-06, "epoch": 3.507936507936508, "percentage": 70.16, "elapsed_time": "0:20:38", "remaining_time": "0:08:46"}
{"current_steps": 222, "total_steps": 315, "loss": 0.0862, "lr": 2.2030677036673345e-06, "epoch": 3.5238095238095237, "percentage": 70.48, "elapsed_time": "0:20:43", "remaining_time": "0:08:40"}
{"current_steps": 223, "total_steps": 315, "loss": 0.0794, "lr": 2.159676266344222e-06, "epoch": 3.5396825396825395, "percentage": 70.79, "elapsed_time": "0:20:48", "remaining_time": "0:08:34"}
{"current_steps": 224, "total_steps": 315, "loss": 0.1081, "lr": 2.1165983894256647e-06, "epoch": 3.5555555555555554, "percentage": 71.11, "elapsed_time": "0:20:53", "remaining_time": "0:08:29"}
{"current_steps": 225, "total_steps": 315, "loss": 0.072, "lr": 2.0738388285373532e-06, "epoch": 3.571428571428571, "percentage": 71.43, "elapsed_time": "0:20:58", "remaining_time": "0:08:23"}
{"current_steps": 226, "total_steps": 315, "loss": 0.0848, "lr": 2.0314023041641567e-06, "epoch": 3.5873015873015874, "percentage": 71.75, "elapsed_time": "0:21:02", "remaining_time": "0:08:17"}
{"current_steps": 227, "total_steps": 315, "loss": 0.0827, "lr": 1.9892935011290037e-06, "epoch": 3.6031746031746033, "percentage": 72.06, "elapsed_time": "0:21:06", "remaining_time": "0:08:11"}
{"current_steps": 228, "total_steps": 315, "loss": 0.0544, "lr": 1.947517068075694e-06, "epoch": 3.619047619047619, "percentage": 72.38, "elapsed_time": "0:21:12", "remaining_time": "0:08:05"}
{"current_steps": 229, "total_steps": 315, "loss": 0.0954, "lr": 1.9060776169557083e-06, "epoch": 3.634920634920635, "percentage": 72.7, "elapsed_time": "0:21:16", "remaining_time": "0:07:59"}
{"current_steps": 230, "total_steps": 315, "loss": 0.0933, "lr": 1.864979722519068e-06, "epoch": 3.6507936507936507, "percentage": 73.02, "elapsed_time": "0:21:21", "remaining_time": "0:07:53"}
{"current_steps": 231, "total_steps": 315, "loss": 0.0759, "lr": 1.8242279218092968e-06, "epoch": 3.6666666666666665, "percentage": 73.33, "elapsed_time": "0:21:26", "remaining_time": "0:07:47"}
{"current_steps": 232, "total_steps": 315, "loss": 0.0821, "lr": 1.7838267136625536e-06, "epoch": 3.682539682539683, "percentage": 73.65, "elapsed_time": "0:21:31", "remaining_time": "0:07:41"}
{"current_steps": 233, "total_steps": 315, "loss": 0.0971, "lr": 1.743780558210979e-06, "epoch": 3.6984126984126986, "percentage": 73.97, "elapsed_time": "0:21:36", "remaining_time": "0:07:36"}
{"current_steps": 234, "total_steps": 315, "loss": 0.07, "lr": 1.704093876390312e-06, "epoch": 3.7142857142857144, "percentage": 74.29, "elapsed_time": "0:21:41", "remaining_time": "0:07:30"}
{"current_steps": 235, "total_steps": 315, "loss": 0.0811, "lr": 1.664771049451837e-06, "epoch": 3.7301587301587302, "percentage": 74.6, "elapsed_time": "0:21:47", "remaining_time": "0:07:24"}
{"current_steps": 236, "total_steps": 315, "loss": 0.0711, "lr": 1.6258164184787123e-06, "epoch": 3.746031746031746, "percentage": 74.92, "elapsed_time": "0:21:52", "remaining_time": "0:07:19"}
{"current_steps": 237, "total_steps": 315, "loss": 0.0671, "lr": 1.5872342839067305e-06, "epoch": 3.761904761904762, "percentage": 75.24, "elapsed_time": "0:21:57", "remaining_time": "0:07:13"}
{"current_steps": 238, "total_steps": 315, "loss": 0.0725, "lr": 1.5490289050495678e-06, "epoch": 3.7777777777777777, "percentage": 75.56, "elapsed_time": "0:22:02", "remaining_time": "0:07:07"}
{"current_steps": 239, "total_steps": 315, "loss": 0.0779, "lr": 1.511204499628574e-06, "epoch": 3.7936507936507935, "percentage": 75.87, "elapsed_time": "0:22:07", "remaining_time": "0:07:02"}
{"current_steps": 240, "total_steps": 315, "loss": 0.0591, "lr": 1.4737652433071515e-06, "epoch": 3.8095238095238093, "percentage": 76.19, "elapsed_time": "0:22:13", "remaining_time": "0:06:56"}
{"current_steps": 241, "total_steps": 315, "loss": 0.0861, "lr": 1.4367152692297799e-06, "epoch": 3.825396825396825, "percentage": 76.51, "elapsed_time": "0:22:18", "remaining_time": "0:06:50"}
{"current_steps": 242, "total_steps": 315, "loss": 0.0709, "lr": 1.4000586675657312e-06, "epoch": 3.8412698412698414, "percentage": 76.83, "elapsed_time": "0:22:23", "remaining_time": "0:06:45"}
{"current_steps": 243, "total_steps": 315, "loss": 0.0777, "lr": 1.3637994850575342e-06, "epoch": 3.857142857142857, "percentage": 77.14, "elapsed_time": "0:22:28", "remaining_time": "0:06:39"}
{"current_steps": 244, "total_steps": 315, "loss": 0.0708, "lr": 1.3279417245742288e-06, "epoch": 3.873015873015873, "percentage": 77.46, "elapsed_time": "0:22:33", "remaining_time": "0:06:33"}
{"current_steps": 245, "total_steps": 315, "loss": 0.0739, "lr": 1.2924893446694648e-06, "epoch": 3.888888888888889, "percentage": 77.78, "elapsed_time": "0:22:39", "remaining_time": "0:06:28"}
{"current_steps": 246, "total_steps": 315, "loss": 0.0818, "lr": 1.257446259144494e-06, "epoch": 3.9047619047619047, "percentage": 78.1, "elapsed_time": "0:22:44", "remaining_time": "0:06:22"}
{"current_steps": 247, "total_steps": 315, "loss": 0.0818, "lr": 1.222816336616104e-06, "epoch": 3.9206349206349205, "percentage": 78.41, "elapsed_time": "0:22:49", "remaining_time": "0:06:16"}
{"current_steps": 248, "total_steps": 315, "loss": 0.0786, "lr": 1.1886034000895341e-06, "epoch": 3.9365079365079367, "percentage": 78.73, "elapsed_time": "0:22:54", "remaining_time": "0:06:11"}
{"current_steps": 249, "total_steps": 315, "loss": 0.062, "lr": 1.1548112265364336e-06, "epoch": 3.9523809523809526, "percentage": 79.05, "elapsed_time": "0:22:59", "remaining_time": "0:06:05"}
{"current_steps": 250, "total_steps": 315, "loss": 0.0684, "lr": 1.1214435464779006e-06, "epoch": 3.9682539682539684, "percentage": 79.37, "elapsed_time": "0:23:04", "remaining_time": "0:05:59"}
{"current_steps": 251, "total_steps": 315, "loss": 0.074, "lr": 1.088504043572643e-06, "epoch": 3.984126984126984, "percentage": 79.68, "elapsed_time": "0:23:08", "remaining_time": "0:05:54"}
{"current_steps": 252, "total_steps": 315, "loss": 0.0591, "lr": 1.055996354210323e-06, "epoch": 4.0, "percentage": 80.0, "elapsed_time": "0:23:13", "remaining_time": "0:05:48"}
{"current_steps": 253, "total_steps": 315, "loss": 0.0465, "lr": 1.0239240671101065e-06, "epoch": 4.015873015873016, "percentage": 80.32, "elapsed_time": "0:24:18", "remaining_time": "0:05:57"}
{"current_steps": 254, "total_steps": 315, "loss": 0.0477, "lr": 9.922907229244905e-07, "epoch": 4.031746031746032, "percentage": 80.63, "elapsed_time": "0:24:23", "remaining_time": "0:05:51"}
{"current_steps": 255, "total_steps": 315, "loss": 0.042, "lr": 9.610998138484262e-07, "epoch": 4.0476190476190474, "percentage": 80.95, "elapsed_time": "0:24:28", "remaining_time": "0:05:45"}
{"current_steps": 256, "total_steps": 315, "loss": 0.0528, "lr": 9.303547832337934e-07, "epoch": 4.063492063492063, "percentage": 81.27, "elapsed_time": "0:24:33", "remaining_time": "0:05:39"}
{"current_steps": 257, "total_steps": 315, "loss": 0.0467, "lr": 9.000590252092701e-07, "epoch": 4.079365079365079, "percentage": 81.59, "elapsed_time": "0:24:38", "remaining_time": "0:05:33"}
{"current_steps": 258, "total_steps": 315, "loss": 0.0348, "lr": 8.702158843056319e-07, "epoch": 4.095238095238095, "percentage": 81.9, "elapsed_time": "0:24:43", "remaining_time": "0:05:27"}
{"current_steps": 259, "total_steps": 315, "loss": 0.0266, "lr": 8.408286550865319e-07, "epoch": 4.111111111111111, "percentage": 82.22, "elapsed_time": "0:24:47", "remaining_time": "0:05:21"}
{"current_steps": 260, "total_steps": 315, "loss": 0.0307, "lr": 8.119005817847924e-07, "epoch": 4.1269841269841265, "percentage": 82.54, "elapsed_time": "0:24:52", "remaining_time": "0:05:15"}
{"current_steps": 261, "total_steps": 315, "loss": 0.0361, "lr": 7.834348579442552e-07, "epoch": 4.142857142857143, "percentage": 82.86, "elapsed_time": "0:24:57", "remaining_time": "0:05:09"}
{"current_steps": 262, "total_steps": 315, "loss": 0.0403, "lr": 7.554346260672263e-07, "epoch": 4.158730158730159, "percentage": 83.17, "elapsed_time": "0:25:03", "remaining_time": "0:05:04"}
{"current_steps": 263, "total_steps": 315, "loss": 0.0485, "lr": 7.279029772675572e-07, "epoch": 4.174603174603175, "percentage": 83.49, "elapsed_time": "0:25:08", "remaining_time": "0:04:58"}
{"current_steps": 264, "total_steps": 315, "loss": 0.0241, "lr": 7.008429509293979e-07, "epoch": 4.190476190476191, "percentage": 83.81, "elapsed_time": "0:25:13", "remaining_time": "0:04:52"}
{"current_steps": 265, "total_steps": 315, "loss": 0.046, "lr": 6.742575343716584e-07, "epoch": 4.2063492063492065, "percentage": 84.13, "elapsed_time": "0:25:18", "remaining_time": "0:04:46"}
{"current_steps": 266, "total_steps": 315, "loss": 0.0458, "lr": 6.481496625182271e-07, "epoch": 4.222222222222222, "percentage": 84.44, "elapsed_time": "0:25:23", "remaining_time": "0:04:40"}
{"current_steps": 267, "total_steps": 315, "loss": 0.057, "lr": 6.225222175739598e-07, "epoch": 4.238095238095238, "percentage": 84.76, "elapsed_time": "0:25:28", "remaining_time": "0:04:34"}
{"current_steps": 268, "total_steps": 315, "loss": 0.0493, "lr": 5.973780287065007e-07, "epoch": 4.253968253968254, "percentage": 85.08, "elapsed_time": "0:25:33", "remaining_time": "0:04:28"}
{"current_steps": 269, "total_steps": 315, "loss": 0.0501, "lr": 5.727198717339511e-07, "epoch": 4.26984126984127, "percentage": 85.4, "elapsed_time": "0:25:38", "remaining_time": "0:04:23"}
{"current_steps": 270, "total_steps": 315, "loss": 0.0365, "lr": 5.485504688184307e-07, "epoch": 4.285714285714286, "percentage": 85.71, "elapsed_time": "0:25:43", "remaining_time": "0:04:17"}
{"current_steps": 271, "total_steps": 315, "loss": 0.0277, "lr": 5.24872488165562e-07, "epoch": 4.301587301587301, "percentage": 86.03, "elapsed_time": "0:25:49", "remaining_time": "0:04:11"}
{"current_steps": 272, "total_steps": 315, "loss": 0.0319, "lr": 5.016885437299113e-07, "epoch": 4.317460317460317, "percentage": 86.35, "elapsed_time": "0:25:54", "remaining_time": "0:04:05"}
{"current_steps": 273, "total_steps": 315, "loss": 0.0404, "lr": 4.790011949264173e-07, "epoch": 4.333333333333333, "percentage": 86.67, "elapsed_time": "0:25:59", "remaining_time": "0:03:59"}
{"current_steps": 274, "total_steps": 315, "loss": 0.0533, "lr": 4.5681294634784437e-07, "epoch": 4.349206349206349, "percentage": 86.98, "elapsed_time": "0:26:04", "remaining_time": "0:03:54"}
{"current_steps": 275, "total_steps": 315, "loss": 0.0395, "lr": 4.3512624748828225e-07, "epoch": 4.365079365079365, "percentage": 87.3, "elapsed_time": "0:26:09", "remaining_time": "0:03:48"}
{"current_steps": 276, "total_steps": 315, "loss": 0.0424, "lr": 4.139434924727359e-07, "epoch": 4.380952380952381, "percentage": 87.62, "elapsed_time": "0:26:14", "remaining_time": "0:03:42"}
{"current_steps": 277, "total_steps": 315, "loss": 0.0551, "lr": 3.9326701979281623e-07, "epoch": 4.396825396825397, "percentage": 87.94, "elapsed_time": "0:26:18", "remaining_time": "0:03:36"}
{"current_steps": 278, "total_steps": 315, "loss": 0.0281, "lr": 3.7309911204858997e-07, "epoch": 4.412698412698413, "percentage": 88.25, "elapsed_time": "0:26:22", "remaining_time": "0:03:30"}
{"current_steps": 279, "total_steps": 315, "loss": 0.0404, "lr": 3.534419956965823e-07, "epoch": 4.428571428571429, "percentage": 88.57, "elapsed_time": "0:26:27", "remaining_time": "0:03:24"}
{"current_steps": 280, "total_steps": 315, "loss": 0.0379, "lr": 3.3429784080398765e-07, "epoch": 4.444444444444445, "percentage": 88.89, "elapsed_time": "0:26:32", "remaining_time": "0:03:19"}
{"current_steps": 281, "total_steps": 315, "loss": 0.0542, "lr": 3.1566876080910193e-07, "epoch": 4.4603174603174605, "percentage": 89.21, "elapsed_time": "0:26:37", "remaining_time": "0:03:13"}
{"current_steps": 282, "total_steps": 315, "loss": 0.0273, "lr": 2.9755681228800904e-07, "epoch": 4.476190476190476, "percentage": 89.52, "elapsed_time": "0:26:41", "remaining_time": "0:03:07"}
{"current_steps": 283, "total_steps": 315, "loss": 0.0308, "lr": 2.799639947275412e-07, "epoch": 4.492063492063492, "percentage": 89.84, "elapsed_time": "0:26:46", "remaining_time": "0:03:01"}
{"current_steps": 284, "total_steps": 315, "loss": 0.0328, "lr": 2.6289225030454556e-07, "epoch": 4.507936507936508, "percentage": 90.16, "elapsed_time": "0:26:51", "remaining_time": "0:02:55"}
{"current_steps": 285, "total_steps": 315, "loss": 0.0505, "lr": 2.4634346367147233e-07, "epoch": 4.523809523809524, "percentage": 90.48, "elapsed_time": "0:26:56", "remaining_time": "0:02:50"}
{"current_steps": 286, "total_steps": 315, "loss": 0.0309, "lr": 2.303194617483212e-07, "epoch": 4.5396825396825395, "percentage": 90.79, "elapsed_time": "0:27:01", "remaining_time": "0:02:44"}
{"current_steps": 287, "total_steps": 315, "loss": 0.0425, "lr": 2.1482201352095277e-07, "epoch": 4.555555555555555, "percentage": 91.11, "elapsed_time": "0:27:06", "remaining_time": "0:02:38"}
{"current_steps": 288, "total_steps": 315, "loss": 0.041, "lr": 1.998528298458019e-07, "epoch": 4.571428571428571, "percentage": 91.43, "elapsed_time": "0:27:11", "remaining_time": "0:02:32"}
{"current_steps": 289, "total_steps": 315, "loss": 0.0363, "lr": 1.8541356326100436e-07, "epoch": 4.587301587301587, "percentage": 91.75, "elapsed_time": "0:27:15", "remaining_time": "0:02:27"}
{"current_steps": 290, "total_steps": 315, "loss": 0.0589, "lr": 1.7150580780396385e-07, "epoch": 4.603174603174603, "percentage": 92.06, "elapsed_time": "0:27:20", "remaining_time": "0:02:21"}
{"current_steps": 291, "total_steps": 315, "loss": 0.0441, "lr": 1.5813109883537792e-07, "epoch": 4.619047619047619, "percentage": 92.38, "elapsed_time": "0:27:25", "remaining_time": "0:02:15"}
{"current_steps": 292, "total_steps": 315, "loss": 0.0407, "lr": 1.4529091286973994e-07, "epoch": 4.634920634920634, "percentage": 92.7, "elapsed_time": "0:27:30", "remaining_time": "0:02:10"}
{"current_steps": 293, "total_steps": 315, "loss": 0.0314, "lr": 1.3298666741233424e-07, "epoch": 4.650793650793651, "percentage": 93.02, "elapsed_time": "0:27:35", "remaining_time": "0:02:04"}
{"current_steps": 294, "total_steps": 315, "loss": 0.0287, "lr": 1.2121972080275378e-07, "epoch": 4.666666666666667, "percentage": 93.33, "elapsed_time": "0:27:40", "remaining_time": "0:01:58"}
{"current_steps": 295, "total_steps": 315, "loss": 0.0492, "lr": 1.0999137206494315e-07, "epoch": 4.682539682539683, "percentage": 93.65, "elapsed_time": "0:27:45", "remaining_time": "0:01:52"}
{"current_steps": 296, "total_steps": 315, "loss": 0.0461, "lr": 9.93028607637908e-08, "epoch": 4.698412698412699, "percentage": 93.97, "elapsed_time": "0:27:50", "remaining_time": "0:01:47"}
{"current_steps": 297, "total_steps": 315, "loss": 0.0402, "lr": 8.915536686828764e-08, "epoch": 4.714285714285714, "percentage": 94.29, "elapsed_time": "0:27:55", "remaining_time": "0:01:41"}
{"current_steps": 298, "total_steps": 315, "loss": 0.0346, "lr": 7.955001062125989e-08, "epoch": 4.73015873015873, "percentage": 94.6, "elapsed_time": "0:28:00", "remaining_time": "0:01:35"}
{"current_steps": 299, "total_steps": 315, "loss": 0.0385, "lr": 7.048785241570321e-08, "epoch": 4.746031746031746, "percentage": 94.92, "elapsed_time": "0:28:05", "remaining_time": "0:01:30"}
{"current_steps": 300, "total_steps": 315, "loss": 0.0473, "lr": 6.19698926777168e-08, "epoch": 4.761904761904762, "percentage": 95.24, "elapsed_time": "0:28:09", "remaining_time": "0:01:24"}
{"current_steps": 301, "total_steps": 315, "loss": 0.0448, "lr": 5.399707175606117e-08, "epoch": 4.777777777777778, "percentage": 95.56, "elapsed_time": "0:28:14", "remaining_time": "0:01:18"}
{"current_steps": 302, "total_steps": 315, "loss": 0.0382, "lr": 4.657026981834623e-08, "epoch": 4.7936507936507935, "percentage": 95.87, "elapsed_time": "0:28:19", "remaining_time": "0:01:13"}
{"current_steps": 303, "total_steps": 315, "loss": 0.0346, "lr": 3.9690306753866204e-08, "epoch": 4.809523809523809, "percentage": 96.19, "elapsed_time": "0:28:24", "remaining_time": "0:01:07"}
{"current_steps": 304, "total_steps": 315, "loss": 0.0419, "lr": 3.3357942083085404e-08, "epoch": 4.825396825396825, "percentage": 96.51, "elapsed_time": "0:28:29", "remaining_time": "0:01:01"}
{"current_steps": 305, "total_steps": 315, "loss": 0.0385, "lr": 2.7573874873791372e-08, "epoch": 4.841269841269841, "percentage": 96.83, "elapsed_time": "0:28:33", "remaining_time": "0:00:56"}
{"current_steps": 306, "total_steps": 315, "loss": 0.0415, "lr": 2.233874366391997e-08, "epoch": 4.857142857142857, "percentage": 97.14, "elapsed_time": "0:28:38", "remaining_time": "0:00:50"}
{"current_steps": 307, "total_steps": 315, "loss": 0.0445, "lr": 1.7653126391063425e-08, "epoch": 4.8730158730158735, "percentage": 97.46, "elapsed_time": "0:28:43", "remaining_time": "0:00:44"}
{"current_steps": 308, "total_steps": 315, "loss": 0.0414, "lr": 1.3517540328669143e-08, "epoch": 4.888888888888889, "percentage": 97.78, "elapsed_time": "0:28:48", "remaining_time": "0:00:39"}
{"current_steps": 309, "total_steps": 315, "loss": 0.0274, "lr": 9.93244202893262e-09, "epoch": 4.904761904761905, "percentage": 98.1, "elapsed_time": "0:28:53", "remaining_time": "0:00:33"}
{"current_steps": 310, "total_steps": 315, "loss": 0.0375, "lr": 6.898227272398306e-09, "epoch": 4.920634920634921, "percentage": 98.41, "elapsed_time": "0:28:58", "remaining_time": "0:00:28"}
{"current_steps": 311, "total_steps": 315, "loss": 0.0282, "lr": 4.415231024265665e-09, "epoch": 4.936507936507937, "percentage": 98.73, "elapsed_time": "0:29:03", "remaining_time": "0:00:22"}
{"current_steps": 312, "total_steps": 315, "loss": 0.0271, "lr": 2.4837273974115393e-09, "epoch": 4.9523809523809526, "percentage": 99.05, "elapsed_time": "0:29:07", "remaining_time": "0:00:16"}
{"current_steps": 313, "total_steps": 315, "loss": 0.0419, "lr": 1.1039296221276863e-09, "epoch": 4.968253968253968, "percentage": 99.37, "elapsed_time": "0:29:13", "remaining_time": "0:00:11"}
{"current_steps": 314, "total_steps": 315, "loss": 0.0467, "lr": 2.7599002258127395e-10, "epoch": 4.984126984126984, "percentage": 99.68, "elapsed_time": "0:29:17", "remaining_time": "0:00:05"}
{"current_steps": 315, "total_steps": 315, "loss": 0.0281, "lr": 0.0, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:29:22", "remaining_time": "0:00:00"}
{"current_steps": 315, "total_steps": 315, "epoch": 5.0, "percentage": 100.0, "elapsed_time": "0:31:17", "remaining_time": "0:00:00"}