{ "epoch": 1.0, "total_flos": 2.045152830947328e+16, "train_loss": 220573833625.6, "train_runtime": 1766.7401, "train_samples_per_second": 0.724, "train_steps_per_second": 0.006 }