{ "epoch": 0.9976905311778291, "eval_accuracy": 0.35085519571037665, "eval_loss": 4.024998664855957, "eval_runtime": 59.2419, "eval_samples": 1001, "eval_samples_per_second": 16.897, "eval_steps_per_second": 8.457, "perplexity": 55.98023403991824, "total_flos": 4.406810464349061e+17, "train_loss": 4.514452385179924, "train_runtime": 3834.9386, "train_samples": 19050, "train_samples_per_second": 4.967, "train_steps_per_second": 0.077 }