mirror of
https://www.modelscope.cn/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B.git
synced 2025-12-08 20:44:24 +08:00
Add generation_config.json
This commit is contained in:
parent
6166147947
commit
aa6e681058
8
.gitattributes
vendored
8
.gitattributes
vendored
@ -33,11 +33,3 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|||||||
*.zip filter=lfs diff=lfs merge=lfs -text
|
*.zip filter=lfs diff=lfs merge=lfs -text
|
||||||
*.zst filter=lfs diff=lfs merge=lfs -text
|
*.zst filter=lfs diff=lfs merge=lfs -text
|
||||||
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
||||||
model-00001-of-000008.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
||||||
model-00002-of-000008.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
||||||
model-00003-of-000008.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
||||||
model-00004-of-000008.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
||||||
model-00005-of-000008.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
||||||
model-00006-of-000008.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
||||||
model-00007-of-000008.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
||||||
model-00008-of-000008.safetensors filter=lfs diff=lfs merge=lfs -text
|
|
||||||
|
|||||||
@ -1,3 +1,6 @@
|
|||||||
|
---
|
||||||
|
library_name: transformers
|
||||||
|
---
|
||||||
# DeepSeek-R1
|
# DeepSeek-R1
|
||||||
<!-- markdownlint-disable first-line-h1 -->
|
<!-- markdownlint-disable first-line-h1 -->
|
||||||
<!-- markdownlint-disable html -->
|
<!-- markdownlint-disable html -->
|
||||||
|
|||||||
9
generation_config.json
Normal file
9
generation_config.json
Normal file
@ -0,0 +1,9 @@
|
|||||||
|
{
|
||||||
|
"_from_model_config": true,
|
||||||
|
"bos_token_id": 151646,
|
||||||
|
"eos_token_id": 151643,
|
||||||
|
"do_sample": true,
|
||||||
|
"temperature": 0.6,
|
||||||
|
"top_p": 0.95,
|
||||||
|
"transformers_version": "4.39.3"
|
||||||
|
}
|
||||||
Loading…
x
Reference in New Issue
Block a user