From dcf2a4eb9494f263578ee9b4545991b05a4f645d Mon Sep 17 00:00:00 2001 From: ai-modelscope Date: Tue, 21 Jan 2025 20:27:27 +0800 Subject: [PATCH] Add generation_config.json --- .gitattributes | 2 -- README.md | 5 ++++- generation_config.json | 9 +++++++++ 3 files changed, 13 insertions(+), 3 deletions(-) create mode 100644 generation_config.json diff --git a/.gitattributes b/.gitattributes index 2d6110e..a6344aa 100644 --- a/.gitattributes +++ b/.gitattributes @@ -33,5 +33,3 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text -model-00001-of-000002.safetensors filter=lfs diff=lfs merge=lfs -text -model-00002-of-000002.safetensors filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md index e5bcaca..1187f86 100644 --- a/README.md +++ b/README.md @@ -1,3 +1,6 @@ +--- +library_name: transformers +--- # DeepSeek-R1 @@ -206,4 +209,4 @@ DeepSeek-R1 series support commercial use, allow for any modifications and deriv ``` ## 9. Contact -If you have any questions, please raise an issue or contact us at [service@deepseek.com](service@deepseek.com). +If you have any questions, please raise an issue or contact us at [service@deepseek.com](service@deepseek.com). \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..052ab54 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,9 @@ +{ + "_from_model_config": true, + "bos_token_id": 151646, + "eos_token_id": 151643, + "do_sample": true, + "temperature": 0.6, + "top_p": 0.95, + "transformers_version": "4.39.3" +}