{
  "epoch": 3.0,
  "eval_accuracy": 0.7942649671391869,
  "eval_loss": 0.8783124089241028,
  "eval_runtime": 3627.2369,
  "eval_samples": 674583,
  "eval_samples_per_second": 185.977,
  "eval_steps_per_second": 2.906,
  "perplexity": 2.4068345247347325,
  "total_flos": 1.2695212826516791e+19,
  "train_loss": 1.0139643951673536,
  "train_runtime": 533830.6605,
  "train_samples": 16063608,
  "train_samples_per_second": 90.274,
  "train_steps_per_second": 1.411
}