{"train/loss": 3.4742, "train/grad_norm": 10.155596733093262, "train/learning_rate": 2.0678246484698098e-07, "train/epoch": 0.0, "train/global_step": 40, "_timestamp": 1712600661.4672816, "_runtime": 97.60346961021423, "_step": 1, "_wandb": {"runtime": 135}}