{ "epoch": 1.0, "eval_loss": 2.043407678604126, "eval_runtime": 65.3589, "eval_samples_per_second": 13.678, "eval_steps_per_second": 1.714, "perplexity": 7.716861026791248, "total_flos": 8.01984399409152e+16, "train_loss": 2.1353629073560736, "train_runtime": 1379.8897, "train_samples_per_second": 6.396, "train_steps_per_second": 3.198 }