{ "epoch": 3.0, "total_flos": 6.651462652615066e+16, "train_loss": 0.6625232639766875, "train_runtime": 75.1281, "train_samples_per_second": 35.619, "train_steps_per_second": 0.28 }