zephyr-2b-gemma-sft / all_results.json
ale-bay's picture
End of training
b76846d verified
raw
history blame contribute delete
411 Bytes
{
"epoch": 2.994991652754591,
"eval_loss": 1.0529426336288452,
"eval_runtime": 8.1882,
"eval_samples": 500,
"eval_samples_per_second": 233.629,
"eval_steps_per_second": 7.328,
"total_flos": 106879455854592.0,
"train_loss": 0.9405513189841008,
"train_runtime": 1810.6389,
"train_samples": 9500,
"train_samples_per_second": 63.501,
"train_steps_per_second": 0.495
}