|
@@ -85,7 +85,8 @@ class XinferenceAILargeLanguageModel(LargeLanguageModel):
|
|
|
tools=tools, stop=stop, stream=stream, user=user,
|
|
|
extra_model_kwargs=XinferenceHelper.get_xinference_extra_parameter(
|
|
|
server_url=credentials['server_url'],
|
|
|
- model_uid=credentials['model_uid']
|
|
|
+ model_uid=credentials['model_uid'],
|
|
|
+ api_key=credentials.get('api_key'),
|
|
|
)
|
|
|
)
|
|
|
|
|
@@ -106,7 +107,8 @@ class XinferenceAILargeLanguageModel(LargeLanguageModel):
|
|
|
|
|
|
extra_param = XinferenceHelper.get_xinference_extra_parameter(
|
|
|
server_url=credentials['server_url'],
|
|
|
- model_uid=credentials['model_uid']
|
|
|
+ model_uid=credentials['model_uid'],
|
|
|
+ api_key=credentials.get('api_key')
|
|
|
)
|
|
|
if 'completion_type' not in credentials:
|
|
|
if 'chat' in extra_param.model_ability:
|
|
@@ -396,7 +398,8 @@ class XinferenceAILargeLanguageModel(LargeLanguageModel):
|
|
|
else:
|
|
|
extra_args = XinferenceHelper.get_xinference_extra_parameter(
|
|
|
server_url=credentials['server_url'],
|
|
|
- model_uid=credentials['model_uid']
|
|
|
+ model_uid=credentials['model_uid'],
|
|
|
+ api_key=credentials.get('api_key')
|
|
|
)
|
|
|
|
|
|
if 'chat' in extra_args.model_ability:
|
|
@@ -464,6 +467,7 @@ class XinferenceAILargeLanguageModel(LargeLanguageModel):
|
|
|
|
|
|
xinference_client = Client(
|
|
|
base_url=credentials['server_url'],
|
|
|
+ api_key=credentials.get('api_key'),
|
|
|
)
|
|
|
|
|
|
xinference_model = xinference_client.get_model(credentials['model_uid'])
|