{"train/loss": 0.6241, "train/learning_rate": 0.0, "train/epoch": 1.76, "train/global_step": 60, "_timestamp": 1703472060.2063508, "_runtime": 339.4569706916809, "_step": 6, "train/train_runtime": 375.6288, "train/train_samples_per_second": 0.639, "train/train_steps_per_second": 0.16, "train/total_flos": 388804397884416.0, "train/train_loss": 0.9521554390589396} |