|
import os |
|
|
|
import pytest |
|
|
|
from core.model_runtime.entities.text_embedding_entities import TextEmbeddingResult |
|
from core.model_runtime.errors.validate import CredentialsValidateFailedError |
|
from core.model_runtime.model_providers.xinference.text_embedding.text_embedding import XinferenceTextEmbeddingModel |
|
from tests.integration_tests.model_runtime.__mock.xinference import MOCK, setup_xinference_mock |
|
|
|
|
|
@pytest.mark.parametrize("setup_xinference_mock", [["none"]], indirect=True) |
|
def test_validate_credentials(setup_xinference_mock): |
|
model = XinferenceTextEmbeddingModel() |
|
|
|
with pytest.raises(CredentialsValidateFailedError): |
|
model.validate_credentials( |
|
model="bge-base-en", |
|
credentials={ |
|
"server_url": os.environ.get("XINFERENCE_SERVER_URL"), |
|
"model_uid": "www " + os.environ.get("XINFERENCE_EMBEDDINGS_MODEL_UID"), |
|
}, |
|
) |
|
|
|
model.validate_credentials( |
|
model="bge-base-en", |
|
credentials={ |
|
"server_url": os.environ.get("XINFERENCE_SERVER_URL"), |
|
"model_uid": os.environ.get("XINFERENCE_EMBEDDINGS_MODEL_UID"), |
|
}, |
|
) |
|
|
|
|
|
@pytest.mark.parametrize("setup_xinference_mock", [["none"]], indirect=True) |
|
def test_invoke_model(setup_xinference_mock): |
|
model = XinferenceTextEmbeddingModel() |
|
|
|
result = model.invoke( |
|
model="bge-base-en", |
|
credentials={ |
|
"server_url": os.environ.get("XINFERENCE_SERVER_URL"), |
|
"model_uid": os.environ.get("XINFERENCE_EMBEDDINGS_MODEL_UID"), |
|
}, |
|
texts=["hello", "world"], |
|
user="abc-123", |
|
) |
|
|
|
assert isinstance(result, TextEmbeddingResult) |
|
assert len(result.embeddings) == 2 |
|
assert result.usage.total_tokens > 0 |
|
|
|
|
|
def test_get_num_tokens(): |
|
model = XinferenceTextEmbeddingModel() |
|
|
|
num_tokens = model.get_num_tokens( |
|
model="bge-base-en", |
|
credentials={ |
|
"server_url": os.environ.get("XINFERENCE_SERVER_URL"), |
|
"model_uid": os.environ.get("XINFERENCE_EMBEDDINGS_MODEL_UID"), |
|
}, |
|
texts=["hello", "world"], |
|
) |
|
|
|
assert num_tokens == 2 |
|
|