| import os | |
| import pytest | |
| from core.model_runtime.entities.text_embedding_entities import TextEmbeddingResult | |
| from core.model_runtime.errors.validate import CredentialsValidateFailedError | |
| from core.model_runtime.model_providers.gpustack.text_embedding.text_embedding import ( | |
| GPUStackTextEmbeddingModel, | |
| ) | |
| def test_validate_credentials(): | |
| model = GPUStackTextEmbeddingModel() | |
| with pytest.raises(CredentialsValidateFailedError): | |
| model.validate_credentials( | |
| model="bge-m3", | |
| credentials={ | |
| "endpoint_url": "invalid_url", | |
| "api_key": "invalid_api_key", | |
| }, | |
| ) | |
| model.validate_credentials( | |
| model="bge-m3", | |
| credentials={ | |
| "endpoint_url": os.environ.get("GPUSTACK_SERVER_URL"), | |
| "api_key": os.environ.get("GPUSTACK_API_KEY"), | |
| }, | |
| ) | |
| def test_invoke_model(): | |
| model = GPUStackTextEmbeddingModel() | |
| result = model.invoke( | |
| model="bge-m3", | |
| credentials={ | |
| "endpoint_url": os.environ.get("GPUSTACK_SERVER_URL"), | |
| "api_key": os.environ.get("GPUSTACK_API_KEY"), | |
| "context_size": 8192, | |
| }, | |
| texts=["hello", "world"], | |
| user="abc-123", | |
| ) | |
| assert isinstance(result, TextEmbeddingResult) | |
| assert len(result.embeddings) == 2 | |
| assert result.usage.total_tokens == 7 | |