zephyr-7b / eval_results.json
jikaixuan's picture
End of training
c11af18 verified
raw
history blame
628 Bytes
{
"epoch": 1.0,
"eval_logits/chosen": 4.460368633270264,
"eval_logits/rejected": 4.594798564910889,
"eval_logps/chosen": -380.465087890625,
"eval_logps/rejected": -579.1896362304688,
"eval_loss": 0.4399436116218567,
"eval_pred_label": 2212.28125,
"eval_rewards/accuracies": 0.33984375,
"eval_rewards/chosen": -3.1655280590057373,
"eval_rewards/margins": 1.8544387817382812,
"eval_rewards/rejected": -5.019967079162598,
"eval_runtime": 125.2743,
"eval_samples": 2000,
"eval_samples_per_second": 15.965,
"eval_steps_per_second": 0.255,
"eval_use_label": 6575.71875
}