DeepSeek-R1-Distill-Qwen-1.5B-FactGRPO-2reward-SubLenCheck-SingleBox-0.15E-40_30_150-kl-rebuild
/
generation_config.json
{
  "_from_model_config": true,
  "bos_token_id": 151646,
  "do_sample": true,
  "eos_token_id": 151643,
  "temperature": 0.6,
  "top_p": 0.95,
  "transformers_version": "4.50.0.dev0"
}