mistral_gsm8k_gold_answer_lora / all_results.json
CharlesLi's picture
End of training
a78d5ec verified
raw
history blame contribute delete
399 Bytes
{
"epoch": 3.076923076923077,
"eval_loss": 1.5896568298339844,
"eval_runtime": 1.3625,
"eval_samples": 20,
"eval_samples_per_second": 14.678,
"eval_steps_per_second": 2.202,
"total_flos": 507088404480.0,
"train_loss": 1.75083886384964,
"train_runtime": 83.5061,
"train_samples": 100,
"train_samples_per_second": 3.832,
"train_steps_per_second": 0.24
}