{ "epoch": 1.0, "eval_loss": 1.8510078191757202, "eval_runtime": 415.3939, "eval_samples_per_second": 146.203, "eval_steps_per_second": 9.138, "perplexity": 6.366232301588858, "total_flos": 2.7919996141761987e+18, "train_loss": 2.1007044342432573, "train_runtime": 7350.2103, "train_samples_per_second": 41.566, "train_steps_per_second": 2.598 }