{ "epoch": 2.2, "eval_accuracy": 0.4755208001727227, "eval_loss": 3.0254220962524414, "eval_runtime": 1714.2937, "eval_samples": 308356, "eval_samples_per_second": 179.873, "eval_steps_per_second": 3.748, "perplexity": 20.602699198233495, "train_loss": 4.86919160338339, "train_runtime": 197999.0138, "train_samples": 5858758, "train_samples_per_second": 2958.983, "train_steps_per_second": 61.646 }