{
"epoch": 19.99134539732494,
"eval_accuracy": 0.4782639238952008,
"eval_loss": 2.6884331703186035,
"eval_runtime": 71.243,
"eval_samples": 60680,
"eval_samples_per_second": 851.733,
"eval_steps_per_second": 13.321,
"perplexity": 14.708611966715758,
"total_flos": 1.487139158163456e+18,
"train_loss": 2.8006602801864955,
"train_runtime": 30100.0214,
"train_samples": 569394,
"train_samples_per_second": 378.335,
"train_steps_per_second": 1.478
}