{ "epoch": 6.36, "eval_accuracy": 0.47857468822060445, "eval_loss": 2.895219087600708, "eval_runtime": 728.1926, "eval_samples": 308356, "eval_samples_per_second": 423.454, "eval_steps_per_second": 3.851, "perplexity": 18.08746374623101, "train_loss": 3.953961916252199, "train_runtime": 197999.1228, "train_samples": 5858758, "train_samples_per_second": 2958.982, "train_steps_per_second": 26.9 }