qwen-2.5-3b-r1-countdown-offline_query_gen_solvable_only__train_query_gen-ckpt_175
/
train_results.json
{ | |
"total_flos": 0.0, | |
"train_loss": 6.581872487505476e-05, | |
"train_runtime": 36634.2295, | |
"train_samples": 38140, | |
"train_samples_per_second": 0.688, | |
"train_steps_per_second": 0.012 | |
} |