|
{ |
|
"epoch": 1.0, |
|
"eval_logits/chosen": 0.9743706583976746, |
|
"eval_logits/rejected": 0.6065909266471863, |
|
"eval_logps/chosen": -139.52996826171875, |
|
"eval_logps/rejected": -142.2351837158203, |
|
"eval_loss": 0.01678086631000042, |
|
"eval_rewards/accuracies": 0.9956116080284119, |
|
"eval_rewards/chosen": -1.5749770402908325, |
|
"eval_rewards/margins": 9.825251579284668, |
|
"eval_rewards/rejected": -11.400227546691895, |
|
"eval_runtime": 379.7007, |
|
"eval_samples_per_second": 9.6, |
|
"eval_steps_per_second": 4.801, |
|
"train_loss": 0.025599888430248966, |
|
"train_runtime": 6987.638, |
|
"train_samples_per_second": 4.693, |
|
"train_steps_per_second": 0.587 |
|
} |