zephyr-7b-dpo-full / all_results.json
yimingzhang's picture
Model save
428274d verified
raw
history blame contribute delete
748 Bytes
{
"epoch": 3.0,
"eval_logits/chosen": -2.3639509677886963,
"eval_logits/rejected": -2.4372596740722656,
"eval_logps/chosen": -316.3568115234375,
"eval_logps/rejected": -327.0231628417969,
"eval_loss": 0.7655794024467468,
"eval_rewards/accuracies": 0.7404580116271973,
"eval_rewards/chosen": -3.8106329441070557,
"eval_rewards/margins": 3.0781688690185547,
"eval_rewards/rejected": -6.8888020515441895,
"eval_runtime": 297.1799,
"eval_samples": 2086,
"eval_samples_per_second": 7.019,
"eval_steps_per_second": 0.441,
"train_loss": 0.22745071912974513,
"train_runtime": 76961.4992,
"train_samples": 62901,
"train_samples_per_second": 2.452,
"train_steps_per_second": 0.077
}