mm-interp-RLAIF-V_L0-q0_25 / trainer_log.jsonl
htlou's picture
Upload folder using huggingface_hub
d57768f verified
{"current_steps": 5, "total_steps": 216, "loss": 1.6525, "learning_rate": 5e-07, "epoch": 0.06944444444444445, "percentage": 2.31, "elapsed_time": "0:01:07", "remaining_time": "0:47:30"}
{"current_steps": 10, "total_steps": 216, "loss": 1.5085, "learning_rate": 1e-06, "epoch": 0.1388888888888889, "percentage": 4.63, "elapsed_time": "0:02:10", "remaining_time": "0:44:41"}
{"current_steps": 15, "total_steps": 216, "loss": 1.2944, "learning_rate": 9.985471028179154e-07, "epoch": 0.20833333333333334, "percentage": 6.94, "elapsed_time": "0:03:12", "remaining_time": "0:42:58"}
{"current_steps": 20, "total_steps": 216, "loss": 1.2274, "learning_rate": 9.94196854912548e-07, "epoch": 0.2777777777777778, "percentage": 9.26, "elapsed_time": "0:04:14", "remaining_time": "0:41:35"}
{"current_steps": 25, "total_steps": 216, "loss": 1.1796, "learning_rate": 9.869745381355905e-07, "epoch": 0.3472222222222222, "percentage": 11.57, "elapsed_time": "0:05:16", "remaining_time": "0:40:18"}
{"current_steps": 30, "total_steps": 216, "loss": 1.162, "learning_rate": 9.769221256218162e-07, "epoch": 0.4166666666666667, "percentage": 13.89, "elapsed_time": "0:06:18", "remaining_time": "0:39:09"}
{"current_steps": 35, "total_steps": 216, "loss": 1.1511, "learning_rate": 9.64098037858483e-07, "epoch": 0.4861111111111111, "percentage": 16.2, "elapsed_time": "0:07:21", "remaining_time": "0:38:01"}
{"current_steps": 40, "total_steps": 216, "loss": 1.1321, "learning_rate": 9.485768031694871e-07, "epoch": 0.5555555555555556, "percentage": 18.52, "elapsed_time": "0:08:23", "remaining_time": "0:36:57"}
{"current_steps": 45, "total_steps": 216, "loss": 1.141, "learning_rate": 9.304486245873971e-07, "epoch": 0.625, "percentage": 20.83, "elapsed_time": "0:09:26", "remaining_time": "0:35:51"}
{"current_steps": 50, "total_steps": 216, "loss": 1.1353, "learning_rate": 9.098188556305262e-07, "epoch": 0.6944444444444444, "percentage": 23.15, "elapsed_time": "0:10:28", "remaining_time": "0:34:45"}
{"current_steps": 50, "total_steps": 216, "eval_loss": 1.1089767217636108, "epoch": 0.6944444444444444, "percentage": 23.15, "elapsed_time": "0:11:05", "remaining_time": "0:36:47"}
{"current_steps": 55, "total_steps": 216, "loss": 1.1085, "learning_rate": 8.868073880316123e-07, "epoch": 0.7638888888888888, "percentage": 25.46, "elapsed_time": "0:12:06", "remaining_time": "0:35:27"}
{"current_steps": 60, "total_steps": 216, "loss": 1.1058, "learning_rate": 8.615479549763755e-07, "epoch": 0.8333333333333334, "percentage": 27.78, "elapsed_time": "0:13:09", "remaining_time": "0:34:12"}
{"current_steps": 65, "total_steps": 216, "loss": 1.1054, "learning_rate": 8.341873539012443e-07, "epoch": 0.9027777777777778, "percentage": 30.09, "elapsed_time": "0:14:12", "remaining_time": "0:32:59"}
{"current_steps": 70, "total_steps": 216, "loss": 1.1129, "learning_rate": 8.048845933670271e-07, "epoch": 0.9722222222222222, "percentage": 32.41, "elapsed_time": "0:15:14", "remaining_time": "0:31:47"}
{"current_steps": 75, "total_steps": 216, "loss": 1.0225, "learning_rate": 7.738099689665539e-07, "epoch": 1.0416666666666667, "percentage": 34.72, "elapsed_time": "0:16:17", "remaining_time": "0:30:37"}
{"current_steps": 80, "total_steps": 216, "loss": 0.9791, "learning_rate": 7.41144073636728e-07, "epoch": 1.1111111111111112, "percentage": 37.04, "elapsed_time": "0:17:20", "remaining_time": "0:29:29"}
{"current_steps": 85, "total_steps": 216, "loss": 0.9602, "learning_rate": 7.070767481266492e-07, "epoch": 1.1805555555555556, "percentage": 39.35, "elapsed_time": "0:18:22", "remaining_time": "0:28:19"}
{"current_steps": 90, "total_steps": 216, "loss": 0.9586, "learning_rate": 6.718059777212565e-07, "epoch": 1.25, "percentage": 41.67, "elapsed_time": "0:19:24", "remaining_time": "0:27:10"}
{"current_steps": 95, "total_steps": 216, "loss": 0.9528, "learning_rate": 6.355367416322778e-07, "epoch": 1.3194444444444444, "percentage": 43.98, "elapsed_time": "0:20:26", "remaining_time": "0:26:02"}
{"current_steps": 100, "total_steps": 216, "loss": 0.9543, "learning_rate": 5.984798217433531e-07, "epoch": 1.3888888888888888, "percentage": 46.3, "elapsed_time": "0:21:28", "remaining_time": "0:24:55"}
{"current_steps": 100, "total_steps": 216, "eval_loss": 1.0777673721313477, "epoch": 1.3888888888888888, "percentage": 46.3, "elapsed_time": "0:22:05", "remaining_time": "0:25:37"}
{"current_steps": 105, "total_steps": 216, "loss": 0.9546, "learning_rate": 5.608505776324157e-07, "epoch": 1.4583333333333333, "percentage": 48.61, "elapsed_time": "0:23:39", "remaining_time": "0:25:00"}
{"current_steps": 110, "total_steps": 216, "loss": 0.9602, "learning_rate": 5.228676949903973e-07, "epoch": 1.5277777777777777, "percentage": 50.93, "elapsed_time": "0:24:41", "remaining_time": "0:23:47"}
{"current_steps": 115, "total_steps": 216, "loss": 0.9547, "learning_rate": 4.847519147099294e-07, "epoch": 1.5972222222222223, "percentage": 53.24, "elapsed_time": "0:25:43", "remaining_time": "0:22:35"}
{"current_steps": 120, "total_steps": 216, "loss": 0.9369, "learning_rate": 4.46724750030062e-07, "epoch": 1.6666666666666665, "percentage": 55.56, "elapsed_time": "0:26:46", "remaining_time": "0:21:24"}
{"current_steps": 125, "total_steps": 216, "loss": 0.9455, "learning_rate": 4.0900719919241935e-07, "epoch": 1.7361111111111112, "percentage": 57.87, "elapsed_time": "0:27:48", "remaining_time": "0:20:14"}
{"current_steps": 130, "total_steps": 216, "loss": 0.9392, "learning_rate": 3.7181846109031e-07, "epoch": 1.8055555555555556, "percentage": 60.19, "elapsed_time": "0:28:50", "remaining_time": "0:19:04"}
{"current_steps": 135, "total_steps": 216, "loss": 0.9439, "learning_rate": 3.353746613749093e-07, "epoch": 1.875, "percentage": 62.5, "elapsed_time": "0:29:53", "remaining_time": "0:17:55"}
{"current_steps": 140, "total_steps": 216, "loss": 0.9396, "learning_rate": 2.9988759642186093e-07, "epoch": 1.9444444444444444, "percentage": 64.81, "elapsed_time": "0:30:55", "remaining_time": "0:16:47"}
{"current_steps": 145, "total_steps": 216, "loss": 0.9073, "learning_rate": 2.655635024578483e-07, "epoch": 2.013888888888889, "percentage": 67.13, "elapsed_time": "0:31:57", "remaining_time": "0:15:38"}
{"current_steps": 150, "total_steps": 216, "loss": 0.8627, "learning_rate": 2.3260185700046292e-07, "epoch": 2.0833333333333335, "percentage": 69.44, "elapsed_time": "0:32:59", "remaining_time": "0:14:30"}
{"current_steps": 150, "total_steps": 216, "eval_loss": 1.0668742656707764, "epoch": 2.0833333333333335, "percentage": 69.44, "elapsed_time": "0:33:35", "remaining_time": "0:14:46"}
{"current_steps": 155, "total_steps": 216, "loss": 0.8666, "learning_rate": 2.0119421957691218e-07, "epoch": 2.1527777777777777, "percentage": 71.76, "elapsed_time": "0:34:37", "remaining_time": "0:13:37"}
{"current_steps": 160, "total_steps": 216, "loss": 0.8574, "learning_rate": 1.7152311845883094e-07, "epoch": 2.2222222222222223, "percentage": 74.07, "elapsed_time": "0:35:40", "remaining_time": "0:12:29"}
{"current_steps": 165, "total_steps": 216, "loss": 0.8581, "learning_rate": 1.4376098988303404e-07, "epoch": 2.2916666666666665, "percentage": 76.39, "elapsed_time": "0:36:42", "remaining_time": "0:11:20"}
{"current_steps": 170, "total_steps": 216, "loss": 0.8505, "learning_rate": 1.1806917592302761e-07, "epoch": 2.361111111111111, "percentage": 78.7, "elapsed_time": "0:37:44", "remaining_time": "0:10:12"}
{"current_steps": 175, "total_steps": 216, "loss": 0.847, "learning_rate": 9.459698683523204e-08, "epoch": 2.4305555555555554, "percentage": 81.02, "elapsed_time": "0:38:46", "remaining_time": "0:09:05"}
{"current_steps": 180, "total_steps": 216, "loss": 0.8505, "learning_rate": 7.348083332917926e-08, "epoch": 2.5, "percentage": 83.33, "elapsed_time": "0:39:48", "remaining_time": "0:07:57"}
{"current_steps": 185, "total_steps": 216, "loss": 0.844, "learning_rate": 5.484343380457124e-08, "epoch": 2.5694444444444446, "percentage": 85.65, "elapsed_time": "0:40:51", "remaining_time": "0:06:50"}
{"current_steps": 190, "total_steps": 216, "loss": 0.8417, "learning_rate": 3.879310116241041e-08, "epoch": 2.638888888888889, "percentage": 87.96, "elapsed_time": "0:41:53", "remaining_time": "0:05:43"}
{"current_steps": 195, "total_steps": 216, "loss": 0.8382, "learning_rate": 2.5423113334966218e-08, "epoch": 2.7083333333333335, "percentage": 90.28, "elapsed_time": "0:42:56", "remaining_time": "0:04:37"}
{"current_steps": 200, "total_steps": 216, "loss": 0.8551, "learning_rate": 1.4811171192794624e-08, "epoch": 2.7777777777777777, "percentage": 92.59, "elapsed_time": "0:43:58", "remaining_time": "0:03:31"}
{"current_steps": 200, "total_steps": 216, "eval_loss": 1.0724252462387085, "epoch": 2.7777777777777777, "percentage": 92.59, "elapsed_time": "0:44:35", "remaining_time": "0:03:34"}
{"current_steps": 205, "total_steps": 216, "loss": 0.8432, "learning_rate": 7.018946979234997e-09, "epoch": 2.8472222222222223, "percentage": 94.91, "elapsed_time": "0:46:08", "remaining_time": "0:02:28"}
{"current_steps": 210, "total_steps": 216, "loss": 0.8478, "learning_rate": 2.0917258966953734e-09, "epoch": 2.9166666666666665, "percentage": 97.22, "elapsed_time": "0:47:11", "remaining_time": "0:01:20"}
{"current_steps": 215, "total_steps": 216, "loss": 0.8291, "learning_rate": 5.814292768108187e-11, "epoch": 2.986111111111111, "percentage": 99.54, "elapsed_time": "0:48:13", "remaining_time": "0:00:13"}
{"current_steps": 216, "total_steps": 216, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "0:48:56", "remaining_time": "0:00:00"}