{ "epoch": 3.0, "total_flos": 2.3635472472132813e+17, "train_loss": 1.1949122909343604, "train_runtime": 1081.5376, "train_samples_per_second": 2.854, "train_steps_per_second": 0.092 }