{ "epoch": 2.0, "total_flos": 1.5362943036162048e+16, "train_loss": 0.16884834933280946, "train_runtime": 1424.4252, "train_samples_per_second": 0.702, "train_steps_per_second": 0.176 }