{
"epoch": 29.864864864864863,
"eval_accuracy": 0.40400586223742063,
"eval_loss": 3.0258984565734863,
"eval_runtime": 0.1238,
"eval_samples": 1,
"eval_samples_per_second": 8.08,
"eval_steps_per_second": 8.08,
"perplexity": 20.612515844582727,
"total_flos": 8754328240128000.0,
"train_loss": 3.8146740595499673,
"train_runtime": 2143.757,
"train_samples": 291,
"train_samples_per_second": 4.072,
"train_steps_per_second": 0.056
}