12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849 |
- import os
- import pytest
- from core.model_runtime.entities.text_embedding_entities import TextEmbeddingResult
- from core.model_runtime.errors.validate import CredentialsValidateFailedError
- from core.model_runtime.model_providers.gpustack.text_embedding.text_embedding import (
- GPUStackTextEmbeddingModel,
- )
def test_validate_credentials():
    """Check credential validation for the GPUStack text-embedding model.

    First asserts that placeholder credentials raise
    ``CredentialsValidateFailedError``; then validates with the endpoint
    and API key read from the ``GPUSTACK_SERVER_URL`` and
    ``GPUSTACK_API_KEY`` environment variables, which must not raise.
    """
    embedding_model = GPUStackTextEmbeddingModel()

    # Negative case: placeholder endpoint/key must be rejected.
    bad_credentials = {
        "endpoint_url": "invalid_url",
        "api_key": "invalid_api_key",
    }
    with pytest.raises(CredentialsValidateFailedError):
        embedding_model.validate_credentials(model="bge-m3", credentials=bad_credentials)

    # Positive case: must sit outside the ``raises`` block, otherwise it
    # would never run once the expected exception has been raised.
    env_credentials = {
        "endpoint_url": os.environ.get("GPUSTACK_SERVER_URL"),
        "api_key": os.environ.get("GPUSTACK_API_KEY"),
    }
    embedding_model.validate_credentials(model="bge-m3", credentials=env_credentials)
def test_invoke_model():
    """Invoke the GPUStack text-embedding model on two short texts.

    Credentials come from the ``GPUSTACK_SERVER_URL`` and
    ``GPUSTACK_API_KEY`` environment variables. The result must be a
    ``TextEmbeddingResult`` holding two embeddings and reporting a total
    usage of 7 tokens.
    """
    embedding_model = GPUStackTextEmbeddingModel()

    env_credentials = {
        "endpoint_url": os.environ.get("GPUSTACK_SERVER_URL"),
        "api_key": os.environ.get("GPUSTACK_API_KEY"),
        "context_size": 8192,
    }
    sample_texts = ["hello", "world"]

    embedding_result = embedding_model.invoke(
        model="bge-m3",
        credentials=env_credentials,
        texts=sample_texts,
        user="abc-123",
    )

    assert isinstance(embedding_result, TextEmbeddingResult)
    assert len(embedding_result.embeddings) == 2
    assert embedding_result.usage.total_tokens == 7
|