Qwen2-0.5B-DRDPO-imdb-bm-tp / eval_results.json
Last commit not found
raw
history blame contribute delete
683 Bytes
{
"epoch": 1.0,
"eval_error": 0.23849666118621826,
"eval_logits/chosen": -2.8272712230682373,
"eval_logits/rejected": -2.8083930015563965,
"eval_logps/chosen": -477.6735534667969,
"eval_logps/rejected": -481.281494140625,
"eval_loss": 0.8262702226638794,
"eval_preference/chosen": 0.5308043956756592,
"eval_preference/rejected": 0.46919554471969604,
"eval_rewards/accuracies": 0.5099999904632568,
"eval_rewards/chosen": 2.068169116973877,
"eval_rewards/margins": 0.0749686062335968,
"eval_rewards/rejected": 1.993200421333313,
"eval_runtime": 41.6193,
"eval_samples_per_second": 24.027,
"eval_steps_per_second": 3.003
}