{ "epoch": 1.0, "eval_loss": 1.9825303554534912, "eval_runtime": 25.595, "eval_samples_per_second": 40.359, "eval_steps_per_second": 5.079, "perplexity": 7.2610929054914894, "total_flos": 9.9498061824e+16, "train_loss": 2.0932261693746033, "train_runtime": 883.1108, "train_samples_per_second": 12.371, "train_steps_per_second": 6.186 }