mirror of
https://www.modelscope.cn/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B.git
synced 2025-12-08 20:44:24 +08:00
10 lines
181 B
JSON
10 lines
181 B
JSON
{
  "_from_model_config": true,
  "bos_token_id": 151646,
  "eos_token_id": 151643,
  "do_sample": true,
  "temperature": 0.6,
  "top_p": 0.95,
  "transformers_version": "4.39.3"
}