{ "epoch": 2.0, "total_flos": 5008217800704.0, "train_loss": 0.08166181639473209, "train_runtime": 864.3861, "train_samples_per_second": 10.396, "train_steps_per_second": 1.3 }