{ "epoch": 3.0, "eval_loss": 1.3244786262512207, "eval_runtime": 34.7071, "eval_samples": 14114, "eval_samples_per_second": 406.661, "eval_steps_per_second": 50.854, "total_flos": 2.645641233904435e+16, "train_loss": 0.5831284902567558, "train_runtime": 2740.1657, "train_samples": 130319, "train_samples_per_second": 142.676, "train_steps_per_second": 8.917 }