{ | |
"epoch": 0.9999558635300348, | |
"eval_accuracy": 0.4989978574884235, | |
"eval_loss": 2.5016486644744873, | |
"eval_runtime": 73.2986, | |
"eval_samples": 318, | |
"eval_samples_per_second": 4.338, | |
"eval_steps_per_second": 0.041, | |
"perplexity": 12.20259537139486, | |
"total_flos": 2.234940544568441e+20, | |
"train_loss": 2.6672301666211276, | |
"train_runtime": 28535.6383, | |
"train_samples": 2900094, | |
"train_samples_per_second": 101.631, | |
"train_steps_per_second": 0.397 | |
} |