{ "epoch": 12.0, "total_flos": 1.4460005262082867e+18, "train_loss": 0.013737765663116536, "train_runtime": 2175.34, "train_samples_per_second": 8.578, "train_steps_per_second": 0.541 }