{ "epoch": 2.96, "total_flos": 2.182399960301568e+16, "train_loss": 1.7539968490600586, "train_runtime": 301.6989, "train_samples_per_second": 8.949, "train_steps_per_second": 0.557 }