{
  "epoch": 2.955223880597015,
  "eval_logits/chosen": -2.3310205936431885,
  "eval_logits/rejected": -2.3245856761932373,
  "eval_logps/chosen": -280.4070129394531,
  "eval_logps/rejected": -236.11550903320312,
  "eval_loss": 0.5229008197784424,
  "eval_rewards/accuracies": 0.8166666626930237,
  "eval_rewards/chosen": 2.1573832035064697,
  "eval_rewards/margins": 2.773956775665283,
  "eval_rewards/rejected": -0.616573691368103,
  "eval_runtime": 61.6988,
  "eval_samples_per_second": 15.397,
  "eval_steps_per_second": 0.243
}