|
@@ -792,13 +792,19 @@ class DocumentService:
|
|
|
dataset.indexing_technique = knowledge_config.indexing_technique
|
|
|
if knowledge_config.indexing_technique == "high_quality":
|
|
|
model_manager = ModelManager()
|
|
|
- embedding_model = model_manager.get_default_model_instance(
|
|
|
- tenant_id=current_user.current_tenant_id, model_type=ModelType.TEXT_EMBEDDING
|
|
|
- )
|
|
|
- dataset.embedding_model = embedding_model.model
|
|
|
- dataset.embedding_model_provider = embedding_model.provider
|
|
|
+ if knowledge_config.embedding_model and knowledge_config.embedding_model_provider:
|
|
|
+ dataset_embedding_model = knowledge_config.embedding_model
|
|
|
+ dataset_embedding_model_provider = knowledge_config.embedding_model_provider
|
|
|
+ else:
|
|
|
+ embedding_model = model_manager.get_default_model_instance(
|
|
|
+ tenant_id=current_user.current_tenant_id, model_type=ModelType.TEXT_EMBEDDING
|
|
|
+ )
|
|
|
+ dataset_embedding_model = embedding_model.model
|
|
|
+ dataset_embedding_model_provider = embedding_model.provider
|
|
|
+ dataset.embedding_model = dataset_embedding_model
|
|
|
+ dataset.embedding_model_provider = dataset_embedding_model_provider
|
|
|
dataset_collection_binding = DatasetCollectionBindingService.get_dataset_collection_binding(
|
|
|
- embedding_model.provider, embedding_model.model
|
|
|
+ dataset_embedding_model_provider, dataset_embedding_model
|
|
|
)
|
|
|
dataset.collection_binding_id = dataset_collection_binding.id
|
|
|
if not dataset.retrieval_model:
|
|
@@ -810,7 +816,11 @@ class DocumentService:
|
|
|
"score_threshold_enabled": False,
|
|
|
}
|
|
|
|
|
|
- dataset.retrieval_model = knowledge_config.retrieval_model.model_dump() or default_retrieval_model # type: ignore
|
|
|
+ dataset.retrieval_model = (
|
|
|
+ knowledge_config.retrieval_model.model_dump()
|
|
|
+ if knowledge_config.retrieval_model
|
|
|
+ else default_retrieval_model
|
|
|
+ ) # type: ignore
|
|
|
|
|
|
documents = []
|
|
|
if knowledge_config.original_document_id:
|