{ "epoch": 0.9993522716757657, "eval_loss": 2.16412353515625, "eval_runtime": 221.1512, "eval_samples": 6447, "eval_samples_per_second": 5.399, "eval_steps_per_second": 2.7, "total_flos": 5.373491620442276e+17, "train_loss": 2.19371005181913, "train_runtime": 17533.5186, "train_samples": 116722, "train_samples_per_second": 1.233, "train_steps_per_second": 0.077 }