{ "epoch": 2.96, "eval_loss": 1.6922149658203125, "eval_runtime": 5.2559, "eval_samples_per_second": 19.026, "eval_steps_per_second": 19.026, "total_flos": 2.182399960301568e+16, "train_loss": 1.7539968490600586, "train_runtime": 301.6989, "train_samples_per_second": 8.949, "train_steps_per_second": 0.557 }