{
"epoch": 25.0,
"eval_accuracy": 0.1417211592798902,
"eval_loss": 6.239955902099609,
"eval_runtime": 5.4847,
"eval_samples": 963,
"eval_samples_per_second": 175.578,
"eval_steps_per_second": 11.122,
"perplexity": 512.8358954579503,
"total_flos": 1.89218085967872e+16,
"train_loss": 1.2342067862914834,
"train_runtime": 1036.8459,
"train_samples": 19092,
"train_samples_per_second": 460.338,
"train_steps_per_second": 14.395
}