{ "epoch": 0.992, "eval_abs_diff": 0.421875, "eval_all_logps_1": -819.568115234375, "eval_all_logps_1_values": -819.568115234375, "eval_all_logps_2": 444.0224914550781, "eval_all_logps_2_values": 444.0224914550781, "eval_logits/chosen": -1.4453125, "eval_logits/rejected": -1.484375, "eval_logps/chosen": -2.265625, "eval_logps/rejected": -2.34375, "eval_loss": 1.7294530868530273, "eval_original_losses": 1.7265625, "eval_rewards/accuracies": 0.4650000035762787, "eval_rewards/chosen": -5.65625, "eval_rewards/margins": 0.2001953125, "eval_rewards/rejected": -5.84375, "eval_runtime": 15.6751, "eval_samples": 200, "eval_samples_per_second": 12.759, "eval_steps_per_second": 3.19, "eval_weight": 1.0, "total_flos": 0.0, "train_loss": 1.8891444052419355, "train_runtime": 316.7887, "train_samples": 1000, "train_samples_per_second": 3.157, "train_steps_per_second": 0.098 }