ce-len3-bs256-lr1e-3 / all_results.json
yangwang825's picture
End of training
8cd52d7 verified
raw
history blame contribute delete
393 Bytes
{
"epoch": 10.0,
"eval_accuracy": 0.9410023545240498,
"eval_loss": 0.29460111260414124,
"eval_runtime": 49.9476,
"eval_samples_per_second": 297.612,
"eval_steps_per_second": 297.612,
"total_flos": 1.96318398191328e+18,
"train_loss": 2.1099621225725396,
"train_runtime": 19361.582,
"train_samples_per_second": 69.094,
"train_steps_per_second": 0.27
}