Sean13's picture
End of training
63dc068 verified
{
"epoch": 0.998660594695955,
"eta/annotator_0": 0.9730426073074341,
"eval_agreement_weights/mean": 0.9695923328399658,
"eval_agreement_weights/std": 0.018151868134737015,
"eval_loss": 0.7976000905036926,
"eval_rewards/accuracies": 0.5507165789604187,
"eval_rewards/chosen": -1.2290558815002441,
"eval_rewards/margins": 0.09547457098960876,
"eval_rewards/rejected": -1.3243849277496338,
"eval_runtime": 101.569,
"eval_samples": 2994,
"eval_samples_per_second": 29.478,
"eval_steps_per_second": 0.925
}