{
"epoch": 0.08279516476237787,
"eval_accuracy": 0.629556877924779,
"eval_loss": 1.8264291286468506,
"eval_runtime": 6.3204,
"eval_samples": 408,
"eval_samples_per_second": 64.553,
"eval_steps_per_second": 2.057,
"perplexity": 6.211665948497031,
"total_flos": 2.198926000128e+16,
"train_loss": 2.0824306030273436,
"train_runtime": 944.4845,
"train_samples": 193233,
"train_samples_per_second": 613.773,
"train_steps_per_second": 38.364
}