|
{ |
|
"epoch": 0.9997172745264349, |
|
"eval_logits/chosen": -1.0220762491226196, |
|
"eval_logits/rejected": -1.0401626825332642, |
|
"eval_logps/chosen": -4.1724467277526855, |
|
"eval_logps/rejected": -4.85194206237793, |
|
"eval_loss": 2.5764122009277344, |
|
"eval_rewards/accuracies": 0.7931150197982788, |
|
"eval_rewards/chosen": -41.724464416503906, |
|
"eval_rewards/margins": 6.794952392578125, |
|
"eval_rewards/rejected": -48.51942443847656, |
|
"eval_runtime": 50.6713, |
|
"eval_samples_per_second": 58.791, |
|
"eval_steps_per_second": 3.69 |
|
} |