{ "epoch": 3.0, "eval_accuracy": 0.8077953820649405, "eval_loss": 0.9435999393463135, "eval_runtime": 2301.809, "eval_samples": 445055, "eval_samples_per_second": 193.35, "eval_steps_per_second": 6.042, "perplexity": 2.5692138042068984, "train_loss": 2.538804254183028, "train_runtime": 274559.0377, "train_samples": 8200540, "train_samples_per_second": 89.604, "train_steps_per_second": 2.8 }