{ "epoch": 0.08279516476237787, "eval_accuracy": 0.629556877924779, "eval_loss": 1.8264291286468506, "eval_runtime": 6.3204, "eval_samples": 408, "eval_samples_per_second": 64.553, "eval_steps_per_second": 2.057, "perplexity": 6.211665948497031, "total_flos": 2.198926000128e+16, "train_loss": 2.0824306030273436, "train_runtime": 944.4845, "train_samples": 193233, "train_samples_per_second": 613.773, "train_steps_per_second": 38.364 }