dima806's picture
Upload folder using huggingface_hub
3fd445a
raw
history blame
15.9 kB
{
"best_metric": 1.6099027395248413,
"best_model_checkpoint": "gemstones_image_detection/checkpoint-4779",
"epoch": 59.0,
"eval_steps": 500,
"global_step": 4779,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.06521739130434782,
"eval_loss": 4.402697563171387,
"eval_runtime": 7.0526,
"eval_samples_per_second": 91.314,
"eval_steps_per_second": 11.485,
"step": 81
},
{
"epoch": 2.0,
"eval_accuracy": 0.2329192546583851,
"eval_loss": 4.283246994018555,
"eval_runtime": 6.9117,
"eval_samples_per_second": 93.176,
"eval_steps_per_second": 11.719,
"step": 162
},
{
"epoch": 3.0,
"eval_accuracy": 0.38354037267080743,
"eval_loss": 4.158541202545166,
"eval_runtime": 7.0269,
"eval_samples_per_second": 91.648,
"eval_steps_per_second": 11.527,
"step": 243
},
{
"epoch": 4.0,
"eval_accuracy": 0.5139751552795031,
"eval_loss": 4.027233123779297,
"eval_runtime": 6.9926,
"eval_samples_per_second": 92.098,
"eval_steps_per_second": 11.584,
"step": 324
},
{
"epoch": 5.0,
"eval_accuracy": 0.6024844720496895,
"eval_loss": 3.892688035964966,
"eval_runtime": 7.1602,
"eval_samples_per_second": 89.942,
"eval_steps_per_second": 11.313,
"step": 405
},
{
"epoch": 6.0,
"eval_accuracy": 0.65527950310559,
"eval_loss": 3.7535414695739746,
"eval_runtime": 7.0085,
"eval_samples_per_second": 91.888,
"eval_steps_per_second": 11.557,
"step": 486
},
{
"epoch": 6.17,
"learning_rate": 9.064449064449066e-06,
"loss": 4.0521,
"step": 500
},
{
"epoch": 7.0,
"eval_accuracy": 0.6816770186335404,
"eval_loss": 3.6245224475860596,
"eval_runtime": 6.9342,
"eval_samples_per_second": 92.873,
"eval_steps_per_second": 11.681,
"step": 567
},
{
"epoch": 8.0,
"eval_accuracy": 0.7065217391304348,
"eval_loss": 3.5059802532196045,
"eval_runtime": 6.9825,
"eval_samples_per_second": 92.231,
"eval_steps_per_second": 11.6,
"step": 648
},
{
"epoch": 9.0,
"eval_accuracy": 0.7251552795031055,
"eval_loss": 3.3893799781799316,
"eval_runtime": 7.0313,
"eval_samples_per_second": 91.59,
"eval_steps_per_second": 11.52,
"step": 729
},
{
"epoch": 10.0,
"eval_accuracy": 0.7468944099378882,
"eval_loss": 3.2792539596557617,
"eval_runtime": 6.9072,
"eval_samples_per_second": 93.236,
"eval_steps_per_second": 11.727,
"step": 810
},
{
"epoch": 11.0,
"eval_accuracy": 0.7593167701863354,
"eval_loss": 3.185778856277466,
"eval_runtime": 7.1843,
"eval_samples_per_second": 89.64,
"eval_steps_per_second": 11.275,
"step": 891
},
{
"epoch": 12.0,
"eval_accuracy": 0.765527950310559,
"eval_loss": 3.093205690383911,
"eval_runtime": 7.203,
"eval_samples_per_second": 89.407,
"eval_steps_per_second": 11.245,
"step": 972
},
{
"epoch": 12.35,
"learning_rate": 8.024948024948025e-06,
"loss": 3.1602,
"step": 1000
},
{
"epoch": 13.0,
"eval_accuracy": 0.7639751552795031,
"eval_loss": 3.006822347640991,
"eval_runtime": 6.9935,
"eval_samples_per_second": 92.086,
"eval_steps_per_second": 11.582,
"step": 1053
},
{
"epoch": 14.0,
"eval_accuracy": 0.7701863354037267,
"eval_loss": 2.9287173748016357,
"eval_runtime": 6.8243,
"eval_samples_per_second": 94.369,
"eval_steps_per_second": 11.869,
"step": 1134
},
{
"epoch": 15.0,
"eval_accuracy": 0.7763975155279503,
"eval_loss": 2.8492088317871094,
"eval_runtime": 6.9345,
"eval_samples_per_second": 92.869,
"eval_steps_per_second": 11.681,
"step": 1215
},
{
"epoch": 16.0,
"eval_accuracy": 0.7763975155279503,
"eval_loss": 2.779766082763672,
"eval_runtime": 7.4706,
"eval_samples_per_second": 86.204,
"eval_steps_per_second": 10.842,
"step": 1296
},
{
"epoch": 17.0,
"eval_accuracy": 0.782608695652174,
"eval_loss": 2.71138858795166,
"eval_runtime": 7.6693,
"eval_samples_per_second": 83.971,
"eval_steps_per_second": 10.562,
"step": 1377
},
{
"epoch": 18.0,
"eval_accuracy": 0.7857142857142857,
"eval_loss": 2.64682674407959,
"eval_runtime": 7.4341,
"eval_samples_per_second": 86.628,
"eval_steps_per_second": 10.896,
"step": 1458
},
{
"epoch": 18.52,
"learning_rate": 6.985446985446987e-06,
"loss": 2.537,
"step": 1500
},
{
"epoch": 19.0,
"eval_accuracy": 0.7841614906832298,
"eval_loss": 2.586892604827881,
"eval_runtime": 7.0064,
"eval_samples_per_second": 91.916,
"eval_steps_per_second": 11.561,
"step": 1539
},
{
"epoch": 20.0,
"eval_accuracy": 0.7888198757763976,
"eval_loss": 2.533936023712158,
"eval_runtime": 6.9165,
"eval_samples_per_second": 93.111,
"eval_steps_per_second": 11.711,
"step": 1620
},
{
"epoch": 21.0,
"eval_accuracy": 0.7950310559006211,
"eval_loss": 2.4751620292663574,
"eval_runtime": 6.8444,
"eval_samples_per_second": 94.092,
"eval_steps_per_second": 11.835,
"step": 1701
},
{
"epoch": 22.0,
"eval_accuracy": 0.8059006211180124,
"eval_loss": 2.4239892959594727,
"eval_runtime": 6.7886,
"eval_samples_per_second": 94.864,
"eval_steps_per_second": 11.932,
"step": 1782
},
{
"epoch": 23.0,
"eval_accuracy": 0.8027950310559007,
"eval_loss": 2.3724544048309326,
"eval_runtime": 6.8741,
"eval_samples_per_second": 93.685,
"eval_steps_per_second": 11.783,
"step": 1863
},
{
"epoch": 24.0,
"eval_accuracy": 0.8043478260869565,
"eval_loss": 2.327075719833374,
"eval_runtime": 7.4527,
"eval_samples_per_second": 86.412,
"eval_steps_per_second": 10.869,
"step": 1944
},
{
"epoch": 24.69,
"learning_rate": 5.945945945945947e-06,
"loss": 2.0899,
"step": 2000
},
{
"epoch": 25.0,
"eval_accuracy": 0.8074534161490683,
"eval_loss": 2.2822916507720947,
"eval_runtime": 6.923,
"eval_samples_per_second": 93.024,
"eval_steps_per_second": 11.7,
"step": 2025
},
{
"epoch": 26.0,
"eval_accuracy": 0.812111801242236,
"eval_loss": 2.2414402961730957,
"eval_runtime": 6.7582,
"eval_samples_per_second": 95.292,
"eval_steps_per_second": 11.985,
"step": 2106
},
{
"epoch": 27.0,
"eval_accuracy": 0.8152173913043478,
"eval_loss": 2.198101043701172,
"eval_runtime": 6.9757,
"eval_samples_per_second": 92.32,
"eval_steps_per_second": 11.612,
"step": 2187
},
{
"epoch": 28.0,
"eval_accuracy": 0.812111801242236,
"eval_loss": 2.158327579498291,
"eval_runtime": 6.8707,
"eval_samples_per_second": 93.732,
"eval_steps_per_second": 11.789,
"step": 2268
},
{
"epoch": 29.0,
"eval_accuracy": 0.8152173913043478,
"eval_loss": 2.1208977699279785,
"eval_runtime": 7.0622,
"eval_samples_per_second": 91.19,
"eval_steps_per_second": 11.47,
"step": 2349
},
{
"epoch": 30.0,
"eval_accuracy": 0.8198757763975155,
"eval_loss": 2.086048126220703,
"eval_runtime": 7.4205,
"eval_samples_per_second": 86.787,
"eval_steps_per_second": 10.916,
"step": 2430
},
{
"epoch": 30.86,
"learning_rate": 4.906444906444907e-06,
"loss": 1.7517,
"step": 2500
},
{
"epoch": 31.0,
"eval_accuracy": 0.8152173913043478,
"eval_loss": 2.054029941558838,
"eval_runtime": 7.2868,
"eval_samples_per_second": 88.38,
"eval_steps_per_second": 11.116,
"step": 2511
},
{
"epoch": 32.0,
"eval_accuracy": 0.8214285714285714,
"eval_loss": 2.0214383602142334,
"eval_runtime": 6.9044,
"eval_samples_per_second": 93.273,
"eval_steps_per_second": 11.732,
"step": 2592
},
{
"epoch": 33.0,
"eval_accuracy": 0.8245341614906833,
"eval_loss": 1.9886717796325684,
"eval_runtime": 7.0403,
"eval_samples_per_second": 91.474,
"eval_steps_per_second": 11.505,
"step": 2673
},
{
"epoch": 34.0,
"eval_accuracy": 0.8167701863354038,
"eval_loss": 1.9592698812484741,
"eval_runtime": 7.0078,
"eval_samples_per_second": 91.898,
"eval_steps_per_second": 11.559,
"step": 2754
},
{
"epoch": 35.0,
"eval_accuracy": 0.8136645962732919,
"eval_loss": 1.9315446615219116,
"eval_runtime": 6.9305,
"eval_samples_per_second": 92.922,
"eval_steps_per_second": 11.687,
"step": 2835
},
{
"epoch": 36.0,
"eval_accuracy": 0.8136645962732919,
"eval_loss": 1.903202772140503,
"eval_runtime": 7.1188,
"eval_samples_per_second": 90.464,
"eval_steps_per_second": 11.378,
"step": 2916
},
{
"epoch": 37.0,
"eval_accuracy": 0.8214285714285714,
"eval_loss": 1.8818532228469849,
"eval_runtime": 7.3502,
"eval_samples_per_second": 87.617,
"eval_steps_per_second": 11.02,
"step": 2997
},
{
"epoch": 37.04,
"learning_rate": 3.866943866943867e-06,
"loss": 1.4983,
"step": 3000
},
{
"epoch": 38.0,
"eval_accuracy": 0.8198757763975155,
"eval_loss": 1.85394287109375,
"eval_runtime": 7.066,
"eval_samples_per_second": 91.141,
"eval_steps_per_second": 11.463,
"step": 3078
},
{
"epoch": 39.0,
"eval_accuracy": 0.8152173913043478,
"eval_loss": 1.8299955129623413,
"eval_runtime": 6.9274,
"eval_samples_per_second": 92.965,
"eval_steps_per_second": 11.693,
"step": 3159
},
{
"epoch": 40.0,
"eval_accuracy": 0.8198757763975155,
"eval_loss": 1.811854362487793,
"eval_runtime": 6.9595,
"eval_samples_per_second": 92.536,
"eval_steps_per_second": 11.639,
"step": 3240
},
{
"epoch": 41.0,
"eval_accuracy": 0.8136645962732919,
"eval_loss": 1.7893236875534058,
"eval_runtime": 6.921,
"eval_samples_per_second": 93.05,
"eval_steps_per_second": 11.704,
"step": 3321
},
{
"epoch": 42.0,
"eval_accuracy": 0.8214285714285714,
"eval_loss": 1.7720342874526978,
"eval_runtime": 6.8638,
"eval_samples_per_second": 93.826,
"eval_steps_per_second": 11.801,
"step": 3402
},
{
"epoch": 43.0,
"eval_accuracy": 0.8167701863354038,
"eval_loss": 1.7533122301101685,
"eval_runtime": 7.194,
"eval_samples_per_second": 89.519,
"eval_steps_per_second": 11.259,
"step": 3483
},
{
"epoch": 43.21,
"learning_rate": 2.827442827442828e-06,
"loss": 1.3099,
"step": 3500
},
{
"epoch": 44.0,
"eval_accuracy": 0.8214285714285714,
"eval_loss": 1.7392221689224243,
"eval_runtime": 6.9012,
"eval_samples_per_second": 93.317,
"eval_steps_per_second": 11.737,
"step": 3564
},
{
"epoch": 45.0,
"eval_accuracy": 0.8167701863354038,
"eval_loss": 1.71939218044281,
"eval_runtime": 7.3602,
"eval_samples_per_second": 87.497,
"eval_steps_per_second": 11.005,
"step": 3645
},
{
"epoch": 46.0,
"eval_accuracy": 0.8183229813664596,
"eval_loss": 1.7061350345611572,
"eval_runtime": 7.1127,
"eval_samples_per_second": 90.542,
"eval_steps_per_second": 11.388,
"step": 3726
},
{
"epoch": 47.0,
"eval_accuracy": 0.8198757763975155,
"eval_loss": 1.6922202110290527,
"eval_runtime": 7.1567,
"eval_samples_per_second": 89.986,
"eval_steps_per_second": 11.318,
"step": 3807
},
{
"epoch": 48.0,
"eval_accuracy": 0.8136645962732919,
"eval_loss": 1.6803785562515259,
"eval_runtime": 6.8048,
"eval_samples_per_second": 94.64,
"eval_steps_per_second": 11.903,
"step": 3888
},
{
"epoch": 49.0,
"eval_accuracy": 0.8152173913043478,
"eval_loss": 1.6694267988204956,
"eval_runtime": 7.2998,
"eval_samples_per_second": 88.221,
"eval_steps_per_second": 11.096,
"step": 3969
},
{
"epoch": 49.38,
"learning_rate": 1.7879417879417881e-06,
"loss": 1.1777,
"step": 4000
},
{
"epoch": 50.0,
"eval_accuracy": 0.8167701863354038,
"eval_loss": 1.6600834131240845,
"eval_runtime": 6.8099,
"eval_samples_per_second": 94.568,
"eval_steps_per_second": 11.894,
"step": 4050
},
{
"epoch": 51.0,
"eval_accuracy": 0.8214285714285714,
"eval_loss": 1.6486986875534058,
"eval_runtime": 6.809,
"eval_samples_per_second": 94.581,
"eval_steps_per_second": 11.896,
"step": 4131
},
{
"epoch": 52.0,
"eval_accuracy": 0.8152173913043478,
"eval_loss": 1.641870379447937,
"eval_runtime": 6.9774,
"eval_samples_per_second": 92.297,
"eval_steps_per_second": 11.609,
"step": 4212
},
{
"epoch": 53.0,
"eval_accuracy": 0.8167701863354038,
"eval_loss": 1.6351778507232666,
"eval_runtime": 7.0388,
"eval_samples_per_second": 91.493,
"eval_steps_per_second": 11.508,
"step": 4293
},
{
"epoch": 54.0,
"eval_accuracy": 0.812111801242236,
"eval_loss": 1.6281042098999023,
"eval_runtime": 7.0002,
"eval_samples_per_second": 91.997,
"eval_steps_per_second": 11.571,
"step": 4374
},
{
"epoch": 55.0,
"eval_accuracy": 0.8167701863354038,
"eval_loss": 1.6229327917099,
"eval_runtime": 7.1102,
"eval_samples_per_second": 90.574,
"eval_steps_per_second": 11.392,
"step": 4455
},
{
"epoch": 55.56,
"learning_rate": 7.484407484407485e-07,
"loss": 1.0992,
"step": 4500
},
{
"epoch": 56.0,
"eval_accuracy": 0.8136645962732919,
"eval_loss": 1.6176931858062744,
"eval_runtime": 6.9832,
"eval_samples_per_second": 92.221,
"eval_steps_per_second": 11.599,
"step": 4536
},
{
"epoch": 57.0,
"eval_accuracy": 0.8183229813664596,
"eval_loss": 1.6147724390029907,
"eval_runtime": 6.8902,
"eval_samples_per_second": 93.465,
"eval_steps_per_second": 11.756,
"step": 4617
},
{
"epoch": 58.0,
"eval_accuracy": 0.8167701863354038,
"eval_loss": 1.6121727228164673,
"eval_runtime": 6.9785,
"eval_samples_per_second": 92.283,
"eval_steps_per_second": 11.607,
"step": 4698
},
{
"epoch": 59.0,
"eval_accuracy": 0.8167701863354038,
"eval_loss": 1.6099027395248413,
"eval_runtime": 7.0345,
"eval_samples_per_second": 91.548,
"eval_steps_per_second": 11.515,
"step": 4779
}
],
"logging_steps": 500,
"max_steps": 4860,
"num_train_epochs": 60,
"save_steps": 500,
"total_flos": 1.1781939502129306e+19,
"trial_name": null,
"trial_params": null
}