{
  "epoch": 0.9976905311778291,
  "eval_accuracy": 0.35085519571037665,
  "eval_loss": 4.024998664855957,
  "eval_runtime": 59.2419,
  "eval_samples": 1001,
  "eval_samples_per_second": 16.897,
  "eval_steps_per_second": 8.457,
  "perplexity": 55.98023403991824,
  "total_flos": 4.406810464349061e+17,
  "train_loss": 4.514452385179924,
  "train_runtime": 3834.9386,
  "train_samples": 19050,
  "train_samples_per_second": 4.967,
  "train_steps_per_second": 0.077
}