{ "epoch": 1.0, "eval_loss": 1.991428017616272, "eval_runtime": 53.9435, "eval_samples_per_second": 22.208, "eval_steps_per_second": 2.781, "perplexity": 7.325987935990124, "total_flos": 9.859643179008e+16, "train_loss": 2.0996591644456246, "train_runtime": 1436.8604, "train_samples_per_second": 7.534, "train_steps_per_second": 3.767 }