{ | |
"epoch": 30.0, | |
"eval_accuracy": 0.1400072934534502, | |
"eval_loss": 6.242714881896973, | |
"eval_runtime": 11.5498, | |
"eval_samples": 3852, | |
"eval_samples_per_second": 333.512, | |
"eval_steps_per_second": 83.378, | |
"perplexity": 514.2527529747575, | |
"total_flos": 781486986700800.0, | |
"train_loss": 6.528281962779993, | |
"train_runtime": 3948.1737, | |
"train_samples": 76378, | |
"train_samples_per_second": 580.354, | |
"train_steps_per_second": 18.137 | |
} |