{ "epoch": 3.0, "total_flos": 3.045462487125811e+16, "train_loss": 0.1802522621902765, "train_runtime": 46.5838, "train_samples_per_second": 8.436, "train_steps_per_second": 1.095 }