{
"epoch": 0.9974025974025974,
"eval_logits/chosen": -69679219.2,
"eval_logits/rejected": -34451756.137931034,
"eval_logps/chosen": -343.90514322916664,
"eval_logps/rejected": -233.7683694773707,
"eval_loss": 0.30314239859580994,
"eval_rewards/chosen": 1.5421129862467449,
"eval_rewards/margins": 8.846664735640603,
"eval_rewards/rejected": -7.304551749393858,
"eval_runtime": 374.42,
"eval_samples_per_second": 1.247,
"eval_steps_per_second": 0.158,
"kl": 1080.3172607421875
}