Browse Source

feat(model_providers): Support deepseek-r1 for Nvidia Catalog (#13269)

Signed-off-by: -LAN- <laipz8200@outlook.com>
-LAN- cách đây 2 tháng
mục cha
commit
6d66d6da15

+ 1 - 0
api/core/model_runtime/model_providers/nvidia/llm/_position.yaml

@@ -1,3 +1,4 @@
+- deepseek-ai/deepseek-r1
 - google/gemma-7b
 - google/codegemma-7b
 - google/recurrentgemma-2b

+ 35 - 0
api/core/model_runtime/model_providers/nvidia/llm/deepseek-r1.yaml

@@ -0,0 +1,35 @@
+model: deepseek-ai/deepseek-r1
+label:
+  en_US: deepseek-ai/deepseek-r1
+model_type: llm
+features:
+  - agent-thought
+model_properties:
+  mode: chat
+  context_size: 128000
+parameter_rules:
+  - name: temperature
+    use_template: temperature
+    min: 0
+    max: 1
+    default: 0.5
+  - name: top_p
+    use_template: top_p
+    min: 0
+    max: 1
+    default: 1
+  - name: max_tokens
+    use_template: max_tokens
+    min: 1
+    max: 1024
+    default: 1024
+  - name: frequency_penalty
+    use_template: frequency_penalty
+    min: -2
+    max: 2
+    default: 0
+  - name: presence_penalty
+    use_template: presence_penalty
+    min: -2
+    max: 2
+    default: 0

+ 1 - 1
api/core/model_runtime/model_providers/nvidia/llm/llm.py

@@ -83,7 +83,7 @@ class NVIDIALargeLanguageModel(OAIAPICompatLargeLanguageModel):
     def _add_custom_parameters(self, credentials: dict, model: str) -> None:
         credentials["mode"] = "chat"
 
-        if self.MODEL_SUFFIX_MAP[model]:
+        if self.MODEL_SUFFIX_MAP.get(model):
             credentials["server_url"] = f"https://ai.api.nvidia.com/v1/{self.MODEL_SUFFIX_MAP[model]}"
             credentials.pop("endpoint_url")
         else: