{ "epoch": 1.0, "eval_loss": 1.9216065406799316, "eval_runtime": 115.3487, "eval_samples_per_second": 10.438, "eval_steps_per_second": 1.309, "perplexity": 6.831925423618136, "total_flos": 1.176672731136e+17, "train_loss": 2.077694829698687, "train_runtime": 1810.567, "train_samples_per_second": 7.136, "train_steps_per_second": 3.568 }