{ "epoch": 4.0, "total_flos": 2.1353892586861363e+18, "train_loss": 1.3106378566387087, "train_runtime": 1021.3737, "train_samples_per_second": 26.944, "train_steps_per_second": 1.684 }