[model] add DeepSeek-R1 & show thinking process (#6767)
Former-commit-id: 4dccb724af51208a001c96fefbdbf226be09e50c
This commit is contained in:
@@ -493,6 +493,38 @@ register_model_group(
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-V3",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-V3",
|
||||
},
|
||||
"DeepSeek-R1-1.5B-Distill": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B",
|
||||
},
|
||||
"DeepSeek-R1-7B-Distill": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-Distill-Qwen-7B",
|
||||
},
|
||||
"DeepSeek-R1-8B-Distill": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-Distill-Llama-8B",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-Distill-Llama-8B",
|
||||
},
|
||||
"DeepSeek-R1-14B-Distill": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-Distill-Qwen-14B",
|
||||
},
|
||||
"DeepSeek-R1-32B-Distill": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B",
|
||||
},
|
||||
"DeepSeek-R1-70B-Distill": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
|
||||
},
|
||||
"DeepSeek-R1-671B-Zero": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1-Zero",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1-Zero",
|
||||
},
|
||||
"DeepSeek-R1-671B": {
|
||||
DownloadSource.DEFAULT: "deepseek-ai/DeepSeek-R1",
|
||||
DownloadSource.MODELSCOPE: "deepseek-ai/DeepSeek-R1",
|
||||
},
|
||||
},
|
||||
template="deepseek3",
|
||||
)
|
||||
|
||||
Reference in New Issue
Block a user