{ "epoch": 1.0, "eval_loss": 1.867760181427002, "eval_runtime": 104.988, "eval_samples_per_second": 145.788, "eval_steps_per_second": 9.115, "perplexity": 6.4737800555614, "total_flos": 1.421397042852266e+18, "train_loss": 2.0159098046724915, "train_runtime": 3573.2428, "train_samples_per_second": 43.7, "train_steps_per_second": 2.731 }