{
  "epoch": 0.03797345732829604,
  "eval_accuracy": 0.10393614847954215,
  "eval_loss": 7.48828125,
  "eval_runtime": 235.3204,
  "eval_samples": 33767,
  "eval_samples_per_second": 143.494,
  "eval_steps_per_second": 2.244,
  "perplexity": 1786.9780822945145,
  "total_flos": 2185295466332160.0,
  "train_loss": 8.552704480229592,
  "train_runtime": 93913.2173,
  "train_samples": 660643,
  "train_samples_per_second": 703.461,
  "train_steps_per_second": 10.992
}