|
{ |
|
"epoch": 1.0, |
|
"eval_logits/chosen": -2.2312498092651367, |
|
"eval_logits/rejected": -2.2264044284820557, |
|
"eval_logps/chosen": -34.088890075683594, |
|
"eval_logps/rejected": -37.596412658691406, |
|
"eval_loss": 1.625149130821228, |
|
"eval_rewards/accuracies": 0.5078904032707214, |
|
"eval_rewards/chosen": -0.02173524722456932, |
|
"eval_rewards/margins": 0.010181299410760403, |
|
"eval_rewards/rejected": -0.0319165475666523, |
|
"eval_runtime": 145.6511, |
|
"eval_samples": 343, |
|
"eval_samples_per_second": 2.355, |
|
"eval_steps_per_second": 0.295 |
|
} |