11 달 전 · 2fdd64c1b5
--- a/api/core/model_runtime/model_providers/cohere/cohere.yaml
+++ b/api/core/model_runtime/model_providers/cohere/cohere.yaml
@@ -32,6 +32,15 @@ provider_credential_schema:
 
				         zh_Hans: 在此输入您的 API Key
			
 
				         en_US: Enter your API Key
			
 
				       show_on: [ ]
			
 
				+    - variable: base_url
			
 
				+      label:
			
 
				+        zh_Hans: API Base
			
 
				+        en_US: API Base
			
 
				+      type: text-input
			
 
				+      required: false
			
 
				+      placeholder:
			
 
				+        zh_Hans: 在此输入您的 API Base，如 https://api.cohere.ai/v1
			
 
				+        en_US: Enter your API Base, e.g. https://api.cohere.ai/v1
			
 
				 model_credential_schema:
			
 
				   model:
			
 
				     label:
			
@@ -70,3 +79,12 @@ model_credential_schema:
 
				       placeholder:
			
 
				         zh_Hans: 在此输入您的 API Key
			
 
				         en_US: Enter your API Key
			
 
				+    - variable: base_url
			
 
				+      label:
			
 
				+        zh_Hans: API Base
			
 
				+        en_US: API Base
			
 
				+      type: text-input
			
 
				+      required: false
			
 
				+      placeholder:
			
 
				+        zh_Hans: 在此输入您的 API Base，如 https://api.cohere.ai/v1
			
 
				+        en_US: Enter your API Base, e.g. https://api.cohere.ai/v1
			
--- a/api/core/model_runtime/model_providers/cohere/llm/llm.py
+++ b/api/core/model_runtime/model_providers/cohere/llm/llm.py
@@ -173,7 +173,7 @@ class CohereLargeLanguageModel(LargeLanguageModel):
 
				         :return: full response or stream response chunk generator result
			
 
				         """
			
 
				         # initialize client
			
 
				-        client = cohere.Client(credentials.get('api_key'))
			
 
				+        client = cohere.Client(credentials.get('api_key'), base_url=credentials.get('base_url'))
			
 
				 
			
 
				         if stop:
			
 
				             model_parameters['end_sequences'] = stop
			
@@ -233,7 +233,8 @@ class CohereLargeLanguageModel(LargeLanguageModel):
 
				 
			
 
				         return response
			
 
				 
			
 
				-    def _handle_generate_stream_response(self, model: str, credentials: dict, response: Iterator[GenerateStreamedResponse],
			
 
				+    def _handle_generate_stream_response(self, model: str, credentials: dict,
			
 
				+                                         response: Iterator[GenerateStreamedResponse],
			
 
				                                          prompt_messages: list[PromptMessage]) -> Generator:
			
 
				         """
			
 
				         Handle llm stream response
			
@@ -317,7 +318,7 @@ class CohereLargeLanguageModel(LargeLanguageModel):
 
				         :return: full response or stream response chunk generator result
			
 
				         """
			
 
				         # initialize client
			
 
				-        client = cohere.Client(credentials.get('api_key'))
			
 
				+        client = cohere.Client(credentials.get('api_key'), base_url=credentials.get('base_url'))
			
 
				 
			
 
				         if stop:
			
 
				             model_parameters['stop_sequences'] = stop
			
@@ -636,7 +637,7 @@ class CohereLargeLanguageModel(LargeLanguageModel):
 
				         :return: number of tokens
			
 
				         """
			
 
				         # initialize client
			
 
				-        client = cohere.Client(credentials.get('api_key'))
			
 
				+        client = cohere.Client(credentials.get('api_key'), base_url=credentials.get('base_url'))
			
 
				 
			
 
				         response = client.tokenize(
			
 
				             text=text,
			
--- a/api/core/model_runtime/model_providers/cohere/rerank/rerank.py
+++ b/api/core/model_runtime/model_providers/cohere/rerank/rerank.py
@@ -44,7 +44,7 @@ class CohereRerankModel(RerankModel):
 
				             )
			
 
				 
			
 
				         # initialize client
			
 
				-        client = cohere.Client(credentials.get('api_key'))
			
 
				+        client = cohere.Client(credentials.get('api_key'), base_url=credentials.get('base_url'))
			
 
				         response = client.rerank(
			
 
				             query=query,
			
 
				             documents=docs,
			
--- a/api/core/model_runtime/model_providers/cohere/text_embedding/text_embedding.py
+++ b/api/core/model_runtime/model_providers/cohere/text_embedding/text_embedding.py
@@ -141,7 +141,7 @@ class CohereTextEmbeddingModel(TextEmbeddingModel):
 
				             return []
			
 
				 
			
 
				         # initialize client
			
 
				-        client = cohere.Client(credentials.get('api_key'))
			
 
				+        client = cohere.Client(credentials.get('api_key'), base_url=credentials.get('base_url'))
			
 
				 
			
 
				         response = client.tokenize(
			
 
				             text=text,
			
@@ -180,7 +180,7 @@ class CohereTextEmbeddingModel(TextEmbeddingModel):
 
				         :return: embeddings and used tokens
			
 
				         """
			
 
				         # initialize client
			
 
				-        client = cohere.Client(credentials.get('api_key'))
			
 
				+        client = cohere.Client(credentials.get('api_key'), base_url=credentials.get('base_url'))
			
 
				 
			
 
				         # call embedding model
			
 
				         response = client.embed(