Qwen2.5-0.5B-Open-R1-Distill / all_results.json
Qucy's picture
End of training
b65c750 verified
{
"epoch": 0.9994447529150472,
"eval_loss": 0.9036357998847961,
"eval_runtime": 7.071,
"eval_samples": 100,
"eval_samples_per_second": 18.102,
"eval_steps_per_second": 2.263,
"total_flos": 1.6624354892709888e+17,
"train_loss": 0.9221899901496039,
"train_runtime": 5284.4545,
"train_samples": 16610,
"train_samples_per_second": 4.089,
"train_steps_per_second": 0.128
}