{ "best_metric": 0.6666666666666666, "best_model_checkpoint": "videomae-base-finetuned-ucf101-subset/checkpoint-47", "epoch": 3.233695652173913, "eval_steps": 500, "global_step": 184, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.05, "learning_rate": 2.6315789473684212e-05, "loss": 1.3248, "step": 10 }, { "epoch": 0.11, "learning_rate": 4.9696969696969694e-05, "loss": 1.1778, "step": 20 }, { "epoch": 0.16, "learning_rate": 4.666666666666667e-05, "loss": 1.1431, "step": 30 }, { "epoch": 0.22, "learning_rate": 4.3636363636363636e-05, "loss": 1.1087, "step": 40 }, { "epoch": 0.26, "eval_accuracy": 0.6666666666666666, "eval_loss": 1.0796324014663696, "eval_runtime": 7.9196, "eval_samples_per_second": 7.576, "eval_steps_per_second": 1.263, "step": 47 }, { "epoch": 1.02, "learning_rate": 4.0606060606060606e-05, "loss": 1.1976, "step": 50 }, { "epoch": 1.07, "learning_rate": 3.757575757575758e-05, "loss": 1.1466, "step": 60 }, { "epoch": 1.12, "learning_rate": 3.454545454545455e-05, "loss": 1.1019, "step": 70 }, { "epoch": 1.18, "learning_rate": 3.151515151515151e-05, "loss": 0.9105, "step": 80 }, { "epoch": 1.23, "learning_rate": 2.8484848484848486e-05, "loss": 1.1741, "step": 90 }, { "epoch": 1.26, "eval_accuracy": 0.6666666666666666, "eval_loss": 1.0369313955307007, "eval_runtime": 7.179, "eval_samples_per_second": 8.358, "eval_steps_per_second": 1.393, "step": 94 }, { "epoch": 2.03, "learning_rate": 2.5454545454545454e-05, "loss": 1.0037, "step": 100 }, { "epoch": 2.09, "learning_rate": 2.2424242424242424e-05, "loss": 1.1246, "step": 110 }, { "epoch": 2.14, "learning_rate": 1.9393939393939395e-05, "loss": 0.9617, "step": 120 }, { "epoch": 2.2, "learning_rate": 1.6363636363636366e-05, "loss": 1.2222, "step": 130 }, { "epoch": 2.25, "learning_rate": 1.3333333333333333e-05, "loss": 1.1019, "step": 140 }, { "epoch": 2.26, "eval_accuracy": 0.6666666666666666, "eval_loss": 1.0367798805236816, "eval_runtime": 7.1432, "eval_samples_per_second": 8.4, "eval_steps_per_second": 1.4, "step": 141 }, { "epoch": 3.05, "learning_rate": 1.0303030303030304e-05, "loss": 1.0377, "step": 150 }, { "epoch": 3.1, "learning_rate": 7.272727272727272e-06, "loss": 0.9239, "step": 160 }, { "epoch": 3.16, "learning_rate": 4.242424242424243e-06, "loss": 0.962, "step": 170 }, { "epoch": 3.21, "learning_rate": 1.2121212121212122e-06, "loss": 1.2164, "step": 180 }, { "epoch": 3.23, "eval_accuracy": 0.6666666666666666, "eval_loss": 1.0368505716323853, "eval_runtime": 6.9878, "eval_samples_per_second": 8.586, "eval_steps_per_second": 1.431, "step": 184 }, { "epoch": 3.23, "step": 184, "total_flos": 1.371953817857065e+18, "train_loss": 1.1023413642593052, "train_runtime": 253.982, "train_samples_per_second": 4.347, "train_steps_per_second": 0.724 }, { "epoch": 3.23, "eval_accuracy": 0.6507936507936508, "eval_loss": 1.1350980997085571, "eval_runtime": 8.469, "eval_samples_per_second": 7.439, "eval_steps_per_second": 1.299, "step": 184 }, { "epoch": 3.23, "eval_accuracy": 0.6507936507936508, "eval_loss": 1.1350986957550049, "eval_runtime": 7.4306, "eval_samples_per_second": 8.478, "eval_steps_per_second": 1.48, "step": 184 } ], "logging_steps": 10, "max_steps": 184, "num_input_tokens_seen": 0, "num_train_epochs": 9223372036854775807, "save_steps": 500, "total_flos": 1.371953817857065e+18, "train_batch_size": 6, "trial_name": null, "trial_params": null }