|
{ |
|
"best_metric": 0.26001426577568054, |
|
"best_model_checkpoint": "./vit-base-beans/checkpoint-120", |
|
"epoch": 3.1578947368421053, |
|
"global_step": 120, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.26, |
|
"learning_rate": 0.00018684210526315792, |
|
"loss": 0.8842, |
|
"step": 10 |
|
}, |
|
{ |
|
"epoch": 0.53, |
|
"learning_rate": 0.0001736842105263158, |
|
"loss": 0.4388, |
|
"step": 20 |
|
}, |
|
{ |
|
"epoch": 0.79, |
|
"learning_rate": 0.0001605263157894737, |
|
"loss": 0.3165, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 1.05, |
|
"learning_rate": 0.00014736842105263158, |
|
"loss": 0.1621, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 1.05, |
|
"eval_accuracy": 0.8820224719101124, |
|
"eval_loss": 0.3338429927825928, |
|
"eval_runtime": 3.9187, |
|
"eval_samples_per_second": 45.423, |
|
"eval_steps_per_second": 5.869, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 1.32, |
|
"learning_rate": 0.00013421052631578948, |
|
"loss": 0.0843, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"learning_rate": 0.00012105263157894738, |
|
"loss": 0.1241, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 1.84, |
|
"learning_rate": 0.00010789473684210527, |
|
"loss": 0.0418, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 2.11, |
|
"learning_rate": 9.473684210526316e-05, |
|
"loss": 0.0497, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 2.11, |
|
"eval_accuracy": 0.8876404494382022, |
|
"eval_loss": 0.31701481342315674, |
|
"eval_runtime": 5.1269, |
|
"eval_samples_per_second": 34.719, |
|
"eval_steps_per_second": 4.486, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 2.37, |
|
"learning_rate": 8.157894736842105e-05, |
|
"loss": 0.057, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 2.63, |
|
"learning_rate": 6.842105263157895e-05, |
|
"loss": 0.0389, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 2.89, |
|
"learning_rate": 5.526315789473685e-05, |
|
"loss": 0.0211, |
|
"step": 110 |
|
}, |
|
{ |
|
"epoch": 3.16, |
|
"learning_rate": 4.210526315789474e-05, |
|
"loss": 0.0357, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 3.16, |
|
"eval_accuracy": 0.9157303370786517, |
|
"eval_loss": 0.26001426577568054, |
|
"eval_runtime": 4.1994, |
|
"eval_samples_per_second": 42.387, |
|
"eval_steps_per_second": 5.477, |
|
"step": 120 |
|
} |
|
], |
|
"max_steps": 152, |
|
"num_train_epochs": 4, |
|
"total_flos": 1.4692612914988646e+17, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|