{
  "epoch": 1.0,
  "eval_loss": 3.5582468509674072,
  "eval_runtime": 6274.8366,
  "eval_samples": 551057,
  "eval_samples_per_second": 87.82,
  "eval_steps_per_second": 21.955,
  "perplexity": 35.10160482608155,
  "train_loss": 3.89913355111991,
  "train_runtime": 393554.9634,
  "train_samples": 10794765,
  "train_samples_per_second": 27.429,
  "train_steps_per_second": 0.107
}