{
  "epoch": 10.11,
  "eval_loss": 2.560811996459961,
  "eval_runtime": 225.5262,
  "eval_samples": 200000,
  "eval_samples_per_second": 886.815,
  "eval_steps_per_second": 55.426,
  "perplexity": 12.94632541910408,
  "train_loss": 2.9681437548828127,
  "train_runtime": 221059.9809,
  "train_samples": 3799999,
  "train_samples_per_second": 173.709,
  "train_steps_per_second": 10.857
}