Gemma-2B-It-ORPO / all_results.json
chchen's picture
End of training
5fd6e30 verified
{
"epoch": 2.997999555456768,
"eval_logits/chosen": -20.655466079711914,
"eval_logits/rejected": -20.744272232055664,
"eval_logps/chosen": -1.3319367170333862,
"eval_logps/rejected": -1.5009632110595703,
"eval_loss": 1.3996269702911377,
"eval_odds_ratio_loss": 0.67690110206604,
"eval_rewards/accuracies": 0.5460000038146973,
"eval_rewards/chosen": -0.133193701505661,
"eval_rewards/margins": 0.016902634873986244,
"eval_rewards/rejected": -0.1500963419675827,
"eval_runtime": 79.967,
"eval_samples_per_second": 12.505,
"eval_sft_loss": 1.3319367170333862,
"eval_steps_per_second": 6.253,
"total_flos": 5.313908590588723e+17,
"train_loss": 1.477055920117832,
"train_runtime": 8055.1491,
"train_samples_per_second": 3.351,
"train_steps_per_second": 0.209
}