| { | |
| "epoch": 0.9974025974025974, | |
| "eval_logits/chosen": -69679219.2, | |
| "eval_logits/rejected": -34451756.137931034, | |
| "eval_logps/chosen": -343.90514322916664, | |
| "eval_logps/rejected": -233.7683694773707, | |
| "eval_loss": 0.30314239859580994, | |
| "eval_rewards/chosen": 1.5421129862467449, | |
| "eval_rewards/margins": 8.846664735640603, | |
| "eval_rewards/rejected": -7.304551749393858, | |
| "eval_runtime": 374.42, | |
| "eval_samples_per_second": 1.247, | |
| "eval_steps_per_second": 0.158, | |
| "kl": 1080.3172607421875, | |
| "total_flos": 8.196772297546138e+16, | |
| "train_loss": 0.31702631492581634, | |
| "train_runtime": 54644.2785, | |
| "train_samples_per_second": 0.845, | |
| "train_steps_per_second": 0.007 | |
| } |