{ "epoch": 40.0, "total_flos": 5.5714266203904e+16, "train_loss": 0.024559360085297206, "train_runtime": 8074.1532, "train_samples": 21175, "train_samples_per_second": 104.903, "train_steps_per_second": 1.64 }