{ | |
"epoch": 6.36, | |
"eval_accuracy": 0.47857468822060445, | |
"eval_loss": 2.895219087600708, | |
"eval_runtime": 728.1926, | |
"eval_samples": 308356, | |
"eval_samples_per_second": 423.454, | |
"eval_steps_per_second": 3.851, | |
"perplexity": 18.08746374623101, | |
"train_loss": 3.953961916252199, | |
"train_runtime": 197999.1228, | |
"train_samples": 5858758, | |
"train_samples_per_second": 2958.982, | |
"train_steps_per_second": 26.9 | |
} |