NicholasCorrado's picture
End of training
7fe06c6 verified
{
"epoch": 0.9983492901947838,
"eval_logits/chosen": -2.375783920288086,
"eval_logits/rejected": -2.3758819103240967,
"eval_logps/chosen": -218.0917205810547,
"eval_logps/rejected": -221.27059936523438,
"eval_loss": 0.6741424202919006,
"eval_rewards/accuracies": 0.564338207244873,
"eval_rewards/chosen": -0.5671599507331848,
"eval_rewards/margins": 0.056060947477817535,
"eval_rewards/rejected": -0.6232209205627441,
"eval_runtime": 162.069,
"eval_samples": 8652,
"eval_samples_per_second": 53.385,
"eval_steps_per_second": 0.839,
"total_flos": 0.0,
"train_loss": 0.6782766637347993,
"train_runtime": 9304.817,
"train_samples": 193800,
"train_samples_per_second": 20.828,
"train_steps_per_second": 0.041
}