{ "epoch": 1.0, "eval_loss": 2.0081028938293457, "eval_runtime": 26.9935, "eval_samples_per_second": 40.38, "eval_steps_per_second": 5.075, "perplexity": 7.449172063720864, "total_flos": 9.814106308608e+16, "train_loss": 2.1073089152154165, "train_runtime": 871.165, "train_samples_per_second": 12.37, "train_steps_per_second": 6.185 }