{ | |
"epoch": 28.0, | |
"eval_accuracy": 0.42334742212654364, | |
"eval_loss": 2.9599573612213135, | |
"eval_runtime": 111.655, | |
"eval_samples": 52190, | |
"eval_samples_per_second": 467.422, | |
"eval_steps_per_second": 7.308, | |
"perplexity": 19.297148931098217, | |
"total_flos": 1.808986925039616e+18, | |
"train_loss": 2.9159927132606205, | |
"train_runtime": 57317.9169, | |
"train_samples": 494517, | |
"train_samples_per_second": 345.105, | |
"train_steps_per_second": 1.348 | |
} |