|
{ |
|
"epoch": 1.0, |
|
"eval_logits/chosen": -3.164646625518799, |
|
"eval_logits/rejected": -3.153470039367676, |
|
"eval_logps/chosen": -543.001708984375, |
|
"eval_logps/rejected": -567.34228515625, |
|
"eval_loss": 0.7142251133918762, |
|
"eval_rewards/accuracies": 0.546875, |
|
"eval_rewards/chosen": -1.4159148931503296, |
|
"eval_rewards/margins": 0.08076205104589462, |
|
"eval_rewards/rejected": -1.496677041053772, |
|
"eval_runtime": 125.7685, |
|
"eval_samples": 1000, |
|
"eval_samples_per_second": 7.951, |
|
"eval_steps_per_second": 0.254 |
|
} |