|
{ |
|
"best_metric": 0.8218390804597702, |
|
"best_model_checkpoint": "swin-tiny-patch4-window7-224-finetuned-vit/checkpoint-438", |
|
"epoch": 2.9846678023850086, |
|
"eval_steps": 500, |
|
"global_step": 438, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.07, |
|
"learning_rate": 1.1363636363636365e-05, |
|
"loss": 2.5718, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.14, |
|
"learning_rate": 2.272727272727273e-05, |
|
"loss": 2.4304, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"learning_rate": 3.409090909090909e-05, |
|
"loss": 2.2567, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"learning_rate": 4.545454545454546e-05, |
|
"loss": 1.9423, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 0.34, |
|
"learning_rate": 4.9238578680203045e-05, |
|
"loss": 1.5811, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.41, |
|
"learning_rate": 4.7969543147208126e-05, |
|
"loss": 1.2969, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"learning_rate": 4.67005076142132e-05, |
|
"loss": 1.3403, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"learning_rate": 4.543147208121827e-05, |
|
"loss": 0.9912, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"learning_rate": 4.416243654822335e-05, |
|
"loss": 1.3058, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"learning_rate": 4.289340101522843e-05, |
|
"loss": 1.0968, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.75, |
|
"learning_rate": 4.162436548223351e-05, |
|
"loss": 1.2238, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 0.82, |
|
"learning_rate": 4.035532994923858e-05, |
|
"loss": 1.0739, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 0.89, |
|
"learning_rate": 3.9086294416243655e-05, |
|
"loss": 1.0948, |
|
"step": 130 |
|
}, |
|
{ |
|
"epoch": 0.95, |
|
"learning_rate": 3.7817258883248735e-05, |
|
"loss": 0.967, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 0.99, |
|
"eval_accuracy": 0.735632183908046, |
|
"eval_loss": 0.752730667591095, |
|
"eval_runtime": 221.3941, |
|
"eval_samples_per_second": 2.358, |
|
"eval_steps_per_second": 0.298, |
|
"step": 146 |
|
}, |
|
{ |
|
"epoch": 1.02, |
|
"learning_rate": 3.654822335025381e-05, |
|
"loss": 0.9675, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 1.09, |
|
"learning_rate": 3.527918781725888e-05, |
|
"loss": 0.9117, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 1.16, |
|
"learning_rate": 3.401015228426396e-05, |
|
"loss": 0.8393, |
|
"step": 170 |
|
}, |
|
{ |
|
"epoch": 1.23, |
|
"learning_rate": 3.2741116751269036e-05, |
|
"loss": 0.7949, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 1.29, |
|
"learning_rate": 3.147208121827411e-05, |
|
"loss": 0.8543, |
|
"step": 190 |
|
}, |
|
{ |
|
"epoch": 1.36, |
|
"learning_rate": 3.020304568527919e-05, |
|
"loss": 0.8966, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 1.43, |
|
"learning_rate": 2.8934010152284264e-05, |
|
"loss": 0.8289, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"learning_rate": 2.766497461928934e-05, |
|
"loss": 0.8569, |
|
"step": 220 |
|
}, |
|
{ |
|
"epoch": 1.57, |
|
"learning_rate": 2.6395939086294418e-05, |
|
"loss": 0.8244, |
|
"step": 230 |
|
}, |
|
{ |
|
"epoch": 1.64, |
|
"learning_rate": 2.5126903553299492e-05, |
|
"loss": 0.8009, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 1.7, |
|
"learning_rate": 2.385786802030457e-05, |
|
"loss": 0.765, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 1.77, |
|
"learning_rate": 2.2588832487309646e-05, |
|
"loss": 0.7593, |
|
"step": 260 |
|
}, |
|
{ |
|
"epoch": 1.84, |
|
"learning_rate": 2.1319796954314723e-05, |
|
"loss": 0.7606, |
|
"step": 270 |
|
}, |
|
{ |
|
"epoch": 1.91, |
|
"learning_rate": 2.0050761421319797e-05, |
|
"loss": 0.8093, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"learning_rate": 1.8781725888324874e-05, |
|
"loss": 0.7448, |
|
"step": 290 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.7988505747126436, |
|
"eval_loss": 0.5910783410072327, |
|
"eval_runtime": 144.8329, |
|
"eval_samples_per_second": 3.604, |
|
"eval_steps_per_second": 0.456, |
|
"step": 293 |
|
}, |
|
{ |
|
"epoch": 2.04, |
|
"learning_rate": 1.751269035532995e-05, |
|
"loss": 0.7165, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 2.11, |
|
"learning_rate": 1.6243654822335024e-05, |
|
"loss": 0.7588, |
|
"step": 310 |
|
}, |
|
{ |
|
"epoch": 2.18, |
|
"learning_rate": 1.4974619289340103e-05, |
|
"loss": 0.7021, |
|
"step": 320 |
|
}, |
|
{ |
|
"epoch": 2.25, |
|
"learning_rate": 1.3705583756345178e-05, |
|
"loss": 0.6398, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 2.32, |
|
"learning_rate": 1.2436548223350254e-05, |
|
"loss": 0.645, |
|
"step": 340 |
|
}, |
|
{ |
|
"epoch": 2.39, |
|
"learning_rate": 1.116751269035533e-05, |
|
"loss": 0.7154, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 2.45, |
|
"learning_rate": 9.898477157360408e-06, |
|
"loss": 0.5742, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 2.52, |
|
"learning_rate": 8.629441624365483e-06, |
|
"loss": 0.6697, |
|
"step": 370 |
|
}, |
|
{ |
|
"epoch": 2.59, |
|
"learning_rate": 7.360406091370558e-06, |
|
"loss": 0.5898, |
|
"step": 380 |
|
}, |
|
{ |
|
"epoch": 2.66, |
|
"learning_rate": 6.091370558375635e-06, |
|
"loss": 0.716, |
|
"step": 390 |
|
}, |
|
{ |
|
"epoch": 2.73, |
|
"learning_rate": 4.822335025380711e-06, |
|
"loss": 0.7302, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 2.79, |
|
"learning_rate": 3.5532994923857873e-06, |
|
"loss": 0.5301, |
|
"step": 410 |
|
}, |
|
{ |
|
"epoch": 2.86, |
|
"learning_rate": 2.284263959390863e-06, |
|
"loss": 0.637, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 2.93, |
|
"learning_rate": 1.015228426395939e-06, |
|
"loss": 0.5974, |
|
"step": 430 |
|
}, |
|
{ |
|
"epoch": 2.98, |
|
"eval_accuracy": 0.8218390804597702, |
|
"eval_loss": 0.5200982093811035, |
|
"eval_runtime": 140.4463, |
|
"eval_samples_per_second": 3.717, |
|
"eval_steps_per_second": 0.47, |
|
"step": 438 |
|
}, |
|
{ |
|
"epoch": 2.98, |
|
"step": 438, |
|
"total_flos": 3.483891679221596e+17, |
|
"train_loss": 0.9891002352379229, |
|
"train_runtime": 12153.7671, |
|
"train_samples_per_second": 1.159, |
|
"train_steps_per_second": 0.036 |
|
} |
|
], |
|
"logging_steps": 10, |
|
"max_steps": 438, |
|
"num_train_epochs": 3, |
|
"save_steps": 500, |
|
"total_flos": 3.483891679221596e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|