{ "epoch": 12.0, "eval_loss": 0.28984853625297546, "eval_runtime": 39.3361, "eval_samples": 36, "eval_samples_per_second": 0.915, "eval_steps_per_second": 0.915, "total_flos": 1.6007026740874445e+17, "train_loss": 0.43703304879440397, "train_runtime": 5927.738, "train_samples": 136, "train_samples_per_second": 1.147, "train_steps_per_second": 0.067 }