{
  "epoch": 1.0,
  "eval_loss": 1.9683517217636108,
  "eval_runtime": 30.1976,
  "eval_samples_per_second": 22.088,
  "eval_steps_per_second": 2.782,
  "perplexity": 7.158866953723834,
  "total_flos": 7.54868493877248e+16,
  "train_loss": 2.153304632613963,
  "train_runtime": 1112.8562,
  "train_samples_per_second": 7.456,
  "train_steps_per_second": 3.728
}