Jelajahi Sumber

feat: support llama3.1 series models for openrouter provider (#6595)

sino 9 bulan lalu
induk
komit
d5c2680fde

+ 3 - 0
api/core/model_runtime/model_providers/openrouter/llm/_position.yaml

@@ -12,6 +12,9 @@
 - google/gemini-pro
 - cohere/command-r-plus
 - cohere/command-r
+- meta-llama/llama-3.1-405b-instruct
+- meta-llama/llama-3.1-70b-instruct
+- meta-llama/llama-3.1-8b-instruct
 - meta-llama/llama-3-70b-instruct
 - meta-llama/llama-3-8b-instruct
 - mistralai/mixtral-8x22b-instruct

+ 23 - 0
api/core/model_runtime/model_providers/openrouter/llm/llama-3.1-405b-instruct.yaml

@@ -0,0 +1,23 @@
+model: meta-llama/llama-3.1-405b-instruct  # 405B Llama 3.1 definition; same id string as the entry added to _position.yaml
+label:
+  en_US: llama-3.1-405b-instruct  # model id without the "meta-llama/" prefix
+model_type: llm
+model_properties:
+  mode: chat
+  context_size: 128000
+parameter_rules:
+  - name: temperature
+    use_template: temperature  # no explicit bounds here; presumably supplied by the named template (verify)
+  - name: top_p
+    use_template: top_p
+  - name: max_tokens
+    use_template: max_tokens  # the four keys below are set explicitly in addition to the template
+    required: true
+    default: 512
+    min: 1
+    max: 128000  # NOTE(review): identical to context_size; confirm the real output-token cap
+pricing:
+  input: "3"  # quoted, so loaded as a string rather than a YAML number
+  output: "3"
+  unit: "0.000001"  # presumably a multiplier making the prices per 1M tokens; TODO confirm
+  currency: USD

+ 23 - 0
api/core/model_runtime/model_providers/openrouter/llm/llama-3.1-70b-instruct.yaml

@@ -0,0 +1,23 @@
+model: meta-llama/llama-3.1-70b-instruct  # 70B Llama 3.1 definition; same id string as the entry added to _position.yaml
+label:
+  en_US: llama-3.1-70b-instruct  # model id without the "meta-llama/" prefix
+model_type: llm
+model_properties:
+  mode: chat
+  context_size: 128000
+parameter_rules:
+  - name: temperature
+    use_template: temperature  # no explicit bounds here; presumably supplied by the named template (verify)
+  - name: top_p
+    use_template: top_p
+  - name: max_tokens
+    use_template: max_tokens  # the four keys below are set explicitly in addition to the template
+    required: true
+    default: 512
+    min: 1
+    max: 128000  # NOTE(review): identical to context_size; confirm the real output-token cap
+pricing:
+  input: "0.9"  # quoted, so loaded as a string rather than a YAML float
+  output: "0.9"
+  unit: "0.000001"  # presumably a multiplier making the prices per 1M tokens; TODO confirm
+  currency: USD

+ 23 - 0
api/core/model_runtime/model_providers/openrouter/llm/llama-3.1-8b-instruct.yaml

@@ -0,0 +1,23 @@
+model: meta-llama/llama-3.1-8b-instruct  # 8B Llama 3.1 definition; same id string as the entry added to _position.yaml
+label:
+  en_US: llama-3.1-8b-instruct  # model id without the "meta-llama/" prefix
+model_type: llm
+model_properties:
+  mode: chat
+  context_size: 128000
+parameter_rules:
+  - name: temperature
+    use_template: temperature  # no explicit bounds here; presumably supplied by the named template (verify)
+  - name: top_p
+    use_template: top_p
+  - name: max_tokens
+    use_template: max_tokens  # the four keys below are set explicitly in addition to the template
+    required: true
+    default: 512
+    min: 1
+    max: 128000  # NOTE(review): identical to context_size; confirm the real output-token cap
+pricing:
+  input: "0.2"  # quoted, so loaded as a string rather than a YAML float
+  output: "0.2"
+  unit: "0.000001"  # presumably a multiplier making the prices per 1M tokens; TODO confirm
+  currency: USD