{ "epoch": 3.0, "eval_/kl_divergence": 49.863685607910156, "eval_/mean_score": 0.9476001262664795, "eval_loss": 0.0, "eval_runtime": 12.1673, "eval_samples_per_second": 8.219, "eval_steps_per_second": 0.329 }