codeaidbackUp's picture
Upload folder using huggingface_hub
af9e925 verified
{"current_steps": 1010, "total_steps": 1728, "loss": 0.3071, "lr": 4.4104321365719216e-05, "epoch": 1.7534722222222223, "percentage": 58.45, "elapsed_time": "0:01:48", "remaining_time": "0:01:16"}
{"current_steps": 1020, "total_steps": 1728, "loss": 0.302, "lr": 4.310248137228176e-05, "epoch": 1.7708333333333335, "percentage": 59.03, "elapsed_time": "0:03:37", "remaining_time": "0:02:31"}
{"current_steps": 1030, "total_steps": 1728, "loss": 0.2602, "lr": 4.210345662950161e-05, "epoch": 1.7881944444444444, "percentage": 59.61, "elapsed_time": "0:05:31", "remaining_time": "0:03:44"}
{"current_steps": 1040, "total_steps": 1728, "loss": 0.3086, "lr": 4.11076548934452e-05, "epoch": 1.8055555555555556, "percentage": 60.19, "elapsed_time": "0:07:23", "remaining_time": "0:04:53"}
{"current_steps": 1050, "total_steps": 1728, "loss": 0.2801, "lr": 4.011548260469552e-05, "epoch": 1.8229166666666665, "percentage": 60.76, "elapsed_time": "0:09:13", "remaining_time": "0:05:57"}
{"current_steps": 1060, "total_steps": 1728, "loss": 0.3004, "lr": 3.9127344722461615e-05, "epoch": 1.8402777777777777, "percentage": 61.34, "elapsed_time": "0:11:04", "remaining_time": "0:06:59"}
{"current_steps": 1070, "total_steps": 1728, "loss": 0.2837, "lr": 3.8143644559292927e-05, "epoch": 1.8576388888888888, "percentage": 61.92, "elapsed_time": "0:12:56", "remaining_time": "0:07:57"}
{"current_steps": 1080, "total_steps": 1728, "loss": 0.2604, "lr": 3.716478361646555e-05, "epoch": 1.875, "percentage": 62.5, "elapsed_time": "0:14:45", "remaining_time": "0:08:51"}
{"current_steps": 1090, "total_steps": 1728, "loss": 0.304, "lr": 3.6191161420107864e-05, "epoch": 1.8923611111111112, "percentage": 63.08, "elapsed_time": "0:16:31", "remaining_time": "0:09:40"}
{"current_steps": 1100, "total_steps": 1728, "loss": 0.2866, "lr": 3.5223175358132256e-05, "epoch": 1.9097222222222223, "percentage": 63.66, "elapsed_time": "0:18:20", "remaining_time": "0:10:28"}
{"current_steps": 1100, "total_steps": 1728, "eval_loss": 0.48055773973464966, "epoch": 1.9097222222222223, "percentage": 63.66, "elapsed_time": "0:26:31", "remaining_time": "0:15:08"}
{"current_steps": 1110, "total_steps": 1728, "loss": 0.2847, "lr": 3.426122051803969e-05, "epoch": 1.9270833333333335, "percentage": 64.24, "elapsed_time": "0:28:18", "remaining_time": "0:15:45"}
{"current_steps": 1120, "total_steps": 1728, "loss": 0.278, "lr": 3.330568952566302e-05, "epoch": 1.9444444444444444, "percentage": 64.81, "elapsed_time": "0:30:09", "remaining_time": "0:16:22"}
{"current_steps": 1130, "total_steps": 1728, "loss": 0.2883, "lr": 3.235697238491516e-05, "epoch": 1.9618055555555556, "percentage": 65.39, "elapsed_time": "0:31:58", "remaining_time": "0:16:55"}
{"current_steps": 1140, "total_steps": 1728, "loss": 0.2924, "lr": 3.141545631860746e-05, "epoch": 1.9791666666666665, "percentage": 65.97, "elapsed_time": "0:33:46", "remaining_time": "0:17:25"}
{"current_steps": 1150, "total_steps": 1728, "loss": 0.3073, "lr": 3.0481525610402978e-05, "epoch": 1.9965277777777777, "percentage": 66.55, "elapsed_time": "0:35:38", "remaining_time": "0:17:55"}
{"current_steps": 1160, "total_steps": 1728, "loss": 0.304, "lr": 2.9555561447969683e-05, "epoch": 2.013888888888889, "percentage": 67.13, "elapsed_time": "0:37:28", "remaining_time": "0:18:21"}
{"current_steps": 1170, "total_steps": 1728, "loss": 0.2801, "lr": 2.8637941767396954e-05, "epoch": 2.03125, "percentage": 67.71, "elapsed_time": "0:39:21", "remaining_time": "0:18:46"}
{"current_steps": 1180, "total_steps": 1728, "loss": 0.287, "lr": 2.7729041098939585e-05, "epoch": 2.048611111111111, "percentage": 68.29, "elapsed_time": "0:41:12", "remaining_time": "0:19:08"}
{"current_steps": 1190, "total_steps": 1728, "loss": 0.3276, "lr": 2.682923041415163e-05, "epoch": 2.0659722222222223, "percentage": 68.87, "elapsed_time": "0:43:03", "remaining_time": "0:19:27"}
{"current_steps": 1200, "total_steps": 1728, "loss": 0.2718, "lr": 2.5938876974472802e-05, "epoch": 2.0833333333333335, "percentage": 69.44, "elapsed_time": "0:44:58", "remaining_time": "0:19:47"}
{"current_steps": 1200, "total_steps": 1728, "eval_loss": 0.47958508133888245, "epoch": 2.0833333333333335, "percentage": 69.44, "elapsed_time": "0:53:09", "remaining_time": "0:23:23"}
{"current_steps": 1210, "total_steps": 1728, "loss": 0.2929, "lr": 2.5058344181329273e-05, "epoch": 2.1006944444444446, "percentage": 70.02, "elapsed_time": "0:55:06", "remaining_time": "0:23:35"}
{"current_steps": 1220, "total_steps": 1728, "loss": 0.3054, "lr": 2.418799142780982e-05, "epoch": 2.1180555555555554, "percentage": 70.6, "elapsed_time": "0:56:57", "remaining_time": "0:23:43"}
{"current_steps": 1230, "total_steps": 1728, "loss": 0.3087, "lr": 2.332817395197813e-05, "epoch": 2.1354166666666665, "percentage": 71.18, "elapsed_time": "0:58:49", "remaining_time": "0:23:48"}
{"current_steps": 1240, "total_steps": 1728, "loss": 0.286, "lr": 2.2479242691880887e-05, "epoch": 2.1527777777777777, "percentage": 71.76, "elapsed_time": "1:00:37", "remaining_time": "0:23:51"}
{"current_steps": 1250, "total_steps": 1728, "loss": 0.2902, "lr": 2.164154414231091e-05, "epoch": 2.170138888888889, "percentage": 72.34, "elapsed_time": "1:02:24", "remaining_time": "0:23:51"}
{"current_steps": 1260, "total_steps": 1728, "loss": 0.2631, "lr": 2.0815420213383936e-05, "epoch": 2.1875, "percentage": 72.92, "elapsed_time": "1:04:15", "remaining_time": "0:23:52"}
{"current_steps": 1270, "total_steps": 1728, "loss": 0.3163, "lr": 2.0001208090986557e-05, "epoch": 2.204861111111111, "percentage": 73.5, "elapsed_time": "1:06:07", "remaining_time": "0:23:50"}
{"current_steps": 1280, "total_steps": 1728, "loss": 0.3257, "lr": 1.9199240099152498e-05, "epoch": 2.2222222222222223, "percentage": 74.07, "elapsed_time": "1:08:02", "remaining_time": "0:23:48"}
{"current_steps": 1290, "total_steps": 1728, "loss": 0.2952, "lr": 1.8409843564423056e-05, "epoch": 2.2395833333333335, "percentage": 74.65, "elapsed_time": "1:09:52", "remaining_time": "0:23:43"}
{"current_steps": 1300, "total_steps": 1728, "loss": 0.3169, "lr": 1.7633340682247558e-05, "epoch": 2.2569444444444446, "percentage": 75.23, "elapsed_time": "1:11:37", "remaining_time": "0:23:34"}
{"current_steps": 1300, "total_steps": 1728, "eval_loss": 0.468641072511673, "epoch": 2.2569444444444446, "percentage": 75.23, "elapsed_time": "1:19:43", "remaining_time": "0:26:14"}
{"current_steps": 1310, "total_steps": 1728, "loss": 0.3121, "lr": 1.6870048385477848e-05, "epoch": 2.2743055555555554, "percentage": 75.81, "elapsed_time": "1:21:34", "remaining_time": "0:26:01"}
{"current_steps": 1320, "total_steps": 1728, "loss": 0.2928, "lr": 1.6120278215010886e-05, "epoch": 2.2916666666666665, "percentage": 76.39, "elapsed_time": "1:23:24", "remaining_time": "0:25:46"}
{"current_steps": 1330, "total_steps": 1728, "loss": 0.2578, "lr": 1.5384336192632104e-05, "epoch": 2.3090277777777777, "percentage": 76.97, "elapsed_time": "1:25:13", "remaining_time": "0:25:30"}
{"current_steps": 1340, "total_steps": 1728, "loss": 0.2856, "lr": 1.4662522696111225e-05, "epoch": 2.326388888888889, "percentage": 77.55, "elapsed_time": "1:27:04", "remaining_time": "0:25:12"}
{"current_steps": 1350, "total_steps": 1728, "loss": 0.2829, "lr": 1.395513233660199e-05, "epoch": 2.34375, "percentage": 78.12, "elapsed_time": "1:28:56", "remaining_time": "0:24:54"}
{"current_steps": 1360, "total_steps": 1728, "loss": 0.3188, "lr": 1.3262453838395205e-05, "epoch": 2.361111111111111, "percentage": 78.7, "elapsed_time": "1:30:44", "remaining_time": "0:24:33"}
{"current_steps": 1370, "total_steps": 1728, "loss": 0.295, "lr": 1.2584769921074962e-05, "epoch": 2.3784722222222223, "percentage": 79.28, "elapsed_time": "1:32:32", "remaining_time": "0:24:10"}
{"current_steps": 1380, "total_steps": 1728, "loss": 0.3112, "lr": 1.1922357184125327e-05, "epoch": 2.3958333333333335, "percentage": 79.86, "elapsed_time": "1:34:22", "remaining_time": "0:23:47"}
{"current_steps": 1390, "total_steps": 1728, "loss": 0.2837, "lr": 1.1275485994035107e-05, "epoch": 2.4131944444444446, "percentage": 80.44, "elapsed_time": "1:36:07", "remaining_time": "0:23:22"}
{"current_steps": 1400, "total_steps": 1728, "loss": 0.276, "lr": 1.064442037394679e-05, "epoch": 2.4305555555555554, "percentage": 81.02, "elapsed_time": "1:37:56", "remaining_time": "0:22:56"}
{"current_steps": 1400, "total_steps": 1728, "eval_loss": 0.46923181414604187, "epoch": 2.4305555555555554, "percentage": 81.02, "elapsed_time": "1:46:08", "remaining_time": "0:24:51"}
{"current_steps": 1410, "total_steps": 1728, "loss": 0.305, "lr": 1.0029417895894211e-05, "epoch": 2.4479166666666665, "percentage": 81.6, "elapsed_time": "1:48:04", "remaining_time": "0:24:22"}
{"current_steps": 1420, "total_steps": 1728, "loss": 0.263, "lr": 9.430729575673658e-06, "epoch": 2.4652777777777777, "percentage": 82.18, "elapsed_time": "1:49:59", "remaining_time": "0:23:51"}
{"current_steps": 1430, "total_steps": 1728, "loss": 0.2709, "lr": 8.848599770390653e-06, "epoch": 2.482638888888889, "percentage": 82.75, "elapsed_time": "1:51:47", "remaining_time": "0:23:17"}
{"current_steps": 1440, "total_steps": 1728, "loss": 0.2834, "lr": 8.283266078724571e-06, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "1:53:35", "remaining_time": "0:22:43"}
{"current_steps": 1450, "total_steps": 1728, "loss": 0.2785, "lr": 7.734959243951783e-06, "epoch": 2.517361111111111, "percentage": 83.91, "elapsed_time": "1:55:28", "remaining_time": "0:22:08"}
{"current_steps": 1460, "total_steps": 1728, "loss": 0.2671, "lr": 7.203903059766848e-06, "epoch": 2.5347222222222223, "percentage": 84.49, "elapsed_time": "1:57:17", "remaining_time": "0:21:31"}
{"current_steps": 1470, "total_steps": 1728, "loss": 0.2646, "lr": 6.690314278940207e-06, "epoch": 2.5520833333333335, "percentage": 85.07, "elapsed_time": "1:59:05", "remaining_time": "0:20:54"}
{"current_steps": 1480, "total_steps": 1728, "loss": 0.2905, "lr": 6.194402524849585e-06, "epoch": 2.5694444444444446, "percentage": 85.65, "elapsed_time": "2:00:56", "remaining_time": "0:20:15"}
{"current_steps": 1490, "total_steps": 1728, "loss": 0.2948, "lr": 5.716370205921434e-06, "epoch": 2.5868055555555554, "percentage": 86.23, "elapsed_time": "2:02:48", "remaining_time": "0:19:36"}
{"current_steps": 1500, "total_steps": 1728, "loss": 0.2616, "lr": 5.256412433017005e-06, "epoch": 2.6041666666666665, "percentage": 86.81, "elapsed_time": "2:04:41", "remaining_time": "0:18:57"}
{"current_steps": 1500, "total_steps": 1728, "eval_loss": 0.4693165123462677, "epoch": 2.6041666666666665, "percentage": 86.81, "elapsed_time": "2:12:50", "remaining_time": "0:20:11"}
{"current_steps": 1510, "total_steps": 1728, "loss": 0.2411, "lr": 4.814716939797109e-06, "epoch": 2.6215277777777777, "percentage": 87.38, "elapsed_time": "2:14:33", "remaining_time": "0:19:25"}
{"current_steps": 1520, "total_steps": 1728, "loss": 0.2909, "lr": 4.391464006097845e-06, "epoch": 2.638888888888889, "percentage": 87.96, "elapsed_time": "2:16:27", "remaining_time": "0:18:40"}
{"current_steps": 1530, "total_steps": 1728, "loss": 0.2828, "lr": 3.986826384348608e-06, "epoch": 2.65625, "percentage": 88.54, "elapsed_time": "2:18:16", "remaining_time": "0:17:53"}
{"current_steps": 1540, "total_steps": 1728, "loss": 0.3004, "lr": 3.600969229062523e-06, "epoch": 2.673611111111111, "percentage": 89.12, "elapsed_time": "2:20:07", "remaining_time": "0:17:06"}
{"current_steps": 1550, "total_steps": 1728, "loss": 0.3031, "lr": 3.2340500294278876e-06, "epoch": 2.6909722222222223, "percentage": 89.7, "elapsed_time": "2:21:55", "remaining_time": "0:16:17"}
{"current_steps": 1560, "total_steps": 1728, "loss": 0.2654, "lr": 2.8862185450283572e-06, "epoch": 2.7083333333333335, "percentage": 90.28, "elapsed_time": "2:23:46", "remaining_time": "0:15:28"}
{"current_steps": 1570, "total_steps": 1728, "loss": 0.2812, "lr": 2.55761674471795e-06, "epoch": 2.7256944444444446, "percentage": 90.86, "elapsed_time": "2:25:37", "remaining_time": "0:14:39"}
{"current_steps": 1580, "total_steps": 1728, "loss": 0.2854, "lr": 2.24837874867585e-06, "epoch": 2.7430555555555554, "percentage": 91.44, "elapsed_time": "2:27:30", "remaining_time": "0:13:49"}
{"current_steps": 1590, "total_steps": 1728, "loss": 0.2975, "lr": 1.9586307736647323e-06, "epoch": 2.7604166666666665, "percentage": 92.01, "elapsed_time": "2:29:19", "remaining_time": "0:12:57"}
{"current_steps": 1600, "total_steps": 1728, "loss": 0.2545, "lr": 1.6884910815148425e-06, "epoch": 2.7777777777777777, "percentage": 92.59, "elapsed_time": "2:31:06", "remaining_time": "0:12:05"}
{"current_steps": 1600, "total_steps": 1728, "eval_loss": 0.4670693278312683, "epoch": 2.7777777777777777, "percentage": 92.59, "elapsed_time": "2:39:16", "remaining_time": "0:12:44"}
{"current_steps": 1610, "total_steps": 1728, "loss": 0.2886, "lr": 1.4380699308549572e-06, "epoch": 2.795138888888889, "percentage": 93.17, "elapsed_time": "2:41:14", "remaining_time": "0:11:49"}
{"current_steps": 1620, "total_steps": 1728, "loss": 0.2791, "lr": 1.2074695321098895e-06, "epoch": 2.8125, "percentage": 93.75, "elapsed_time": "2:43:10", "remaining_time": "0:10:52"}
{"current_steps": 1630, "total_steps": 1728, "loss": 0.2814, "lr": 9.96784005782836e-07, "epoch": 2.829861111111111, "percentage": 94.33, "elapsed_time": "2:45:01", "remaining_time": "0:09:55"}
{"current_steps": 1640, "total_steps": 1728, "loss": 0.2814, "lr": 8.060993440397624e-07, "epoch": 2.8472222222222223, "percentage": 94.91, "elapsed_time": "2:46:54", "remaining_time": "0:08:57"}
{"current_steps": 1650, "total_steps": 1728, "loss": 0.2736, "lr": 6.354933756112902e-07, "epoch": 2.8645833333333335, "percentage": 95.49, "elapsed_time": "2:48:46", "remaining_time": "0:07:58"}
{"current_steps": 1660, "total_steps": 1728, "loss": 0.286, "lr": 4.850357340266231e-07, "epoch": 2.8819444444444446, "percentage": 96.06, "elapsed_time": "2:50:35", "remaining_time": "0:06:59"}
{"current_steps": 1670, "total_steps": 1728, "loss": 0.2604, "lr": 3.5478782919230457e-07, "epoch": 2.8993055555555554, "percentage": 96.64, "elapsed_time": "2:52:28", "remaining_time": "0:05:59"}
{"current_steps": 1680, "total_steps": 1728, "loss": 0.288, "lr": 2.4480282232754445e-07, "epoch": 2.9166666666666665, "percentage": 97.22, "elapsed_time": "2:54:17", "remaining_time": "0:04:58"}
{"current_steps": 1690, "total_steps": 1728, "loss": 0.2588, "lr": 1.5512560426621526e-07, "epoch": 2.9340277777777777, "percentage": 97.8, "elapsed_time": "2:56:08", "remaining_time": "0:03:57"}
{"current_steps": 1700, "total_steps": 1728, "loss": 0.2673, "lr": 8.579277713448574e-08, "epoch": 2.951388888888889, "percentage": 98.38, "elapsed_time": "2:58:00", "remaining_time": "0:02:55"}
{"current_steps": 1700, "total_steps": 1728, "eval_loss": 0.46653616428375244, "epoch": 2.951388888888889, "percentage": 98.38, "elapsed_time": "3:06:14", "remaining_time": "0:03:04"}
{"current_steps": 1710, "total_steps": 1728, "loss": 0.2919, "lr": 3.6832639411521485e-08, "epoch": 2.96875, "percentage": 98.96, "elapsed_time": "3:07:57", "remaining_time": "0:01:58"}
{"current_steps": 1720, "total_steps": 1728, "loss": 0.2505, "lr": 8.26517437933494e-09, "epoch": 2.986111111111111, "percentage": 99.54, "elapsed_time": "3:09:43", "remaining_time": "0:00:52"}
{"current_steps": 1728, "total_steps": 1728, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "3:11:18", "remaining_time": "0:00:00"}