djbp's picture
End of training
24a52ca verified
raw
history blame
400 Bytes
{
"epoch": 8.88888888888889,
"eval_accuracy": 0.3924731182795699,
"eval_loss": 2.05673885345459,
"eval_runtime": 21.7695,
"eval_samples_per_second": 8.544,
"eval_steps_per_second": 0.138,
"total_flos": 3.7044103653339955e+17,
"train_loss": 2.3554419835408527,
"train_runtime": 1715.7637,
"train_samples_per_second": 9.733,
"train_steps_per_second": 0.035
}