{"train/loss": 0.0099, "train/grad_norm": 0.054070062935352325, "train/learning_rate": 0.0, "train/epoch": 2.4, "train/global_step": 30, "_timestamp": 1709903258.2842968, "_runtime": 337.49764585494995, "_step": 3, "train/train_runtime": 344.3671, "train/train_samples_per_second": 1.394, "train/train_steps_per_second": 0.087, "train/total_flos": 2466763961794560.0, "train/train_loss": 0.8807701396445433, "_wandb": {"runtime": 524}}