Llama-3.2-3B-DPO / eval_results.json
sciarrilli's picture
Model save
edcf956 verified
raw
history blame contribute delete
546 Bytes
{
"epoch": 0.9957081545064378,
"eval_logits/chosen": 0.6785366535186768,
"eval_logits/rejected": 0.5101125240325928,
"eval_logps/chosen": -353.8060607910156,
"eval_logps/rejected": -244.0733184814453,
"eval_loss": 0.6846491098403931,
"eval_rewards/accuracies": 0.625,
"eval_rewards/chosen": -0.03933782875537872,
"eval_rewards/margins": 0.03162214532494545,
"eval_rewards/rejected": -0.07095997035503387,
"eval_runtime": 9.0831,
"eval_samples_per_second": 1.101,
"eval_steps_per_second": 0.22
}