Compare commits

...

3 Commits

Author SHA1 Message Date
Devin AI
ffdc9a1aa3 Enhance Azure OpenAI embedding validation with comprehensive parameter checks
Co-Authored-By: Joe Moura <joao@crewai.com>
2025-03-10 23:56:06 +00:00
Devin AI
e5ca5fb1dd Fix import ordering in azure_memory_test.py
Co-Authored-By: Joe Moura <joao@crewai.com>
2025-03-10 23:47:51 +00:00
Devin AI
26a5900aa7 Fix Azure OpenAI embeddings by validating deployment_id parameter (#2320)
Co-Authored-By: Joe Moura <joao@crewai.com>
2025-03-10 23:46:13 +00:00
2 changed files with 168 additions and 2 deletions

View File

@@ -74,11 +74,49 @@ class EmbeddingConfigurator:
)
@staticmethod
def _configure_azure(config, model_name):
def _configure_azure(config: Dict[str, Any], model_name: str) -> EmbeddingFunction:
"""
Configure an Azure OpenAI embedding function.
Args:
config: A dictionary containing Azure OpenAI configuration parameters.
Required parameters:
- api_key: Azure OpenAI API key
- api_base: Azure OpenAI API base URL
- api_version: Azure OpenAI API version
- deployment_id: Azure OpenAI deployment ID for the embedding model
model_name: The name of the embedding model
Returns:
An OpenAIEmbeddingFunction configured for Azure OpenAI
Raises:
ValueError: If required parameters are missing or invalid
"""
from chromadb.utils.embedding_functions.openai_embedding_function import (
OpenAIEmbeddingFunction,
)
# Check required parameters for Azure OpenAI
required_params = {
"api_key": "API key",
"api_base": "API base URL",
"api_version": "API version",
"deployment_id": "deployment ID"
}
missing_params = []
for param, description in required_params.items():
if not config.get(param):
missing_params.append(f"{description} ({param})")
if missing_params:
params_str = ", ".join(missing_params)
raise ValueError(
f"Missing required parameters for Azure OpenAI embeddings: {params_str}. "
f"Ensure these parameters match your Azure OpenAI embedding model configuration."
)
return OpenAIEmbeddingFunction(
api_key=config.get("api_key"),
api_base=config.get("api_base"),

View File

@@ -0,0 +1,128 @@
from unittest.mock import MagicMock, patch
import pytest
from crewai.utilities.embedding_configurator import EmbeddingConfigurator
# Shared Azure OpenAI embedder fixtures for the tests in this module.
# The base fixture intentionally has no "deployment_id" entry so that tests
# can exercise the missing-parameter path.
AZURE_BASE_CONFIG = {
    "provider": "azure",
    "config": {
        "model": "text-embedding-ada-002",
        "api_key": "test-key",
        "api_base": "https://test.openai.azure.com",
        "api_version": "2023-05-15",
        "api_type": "azure",
    },
}
# The complete fixture is the base fixture plus a "deployment_id" entry; it is
# built as a separate dict so the two fixtures never share their nested config.
AZURE_COMPLETE_CONFIG = {
    **AZURE_BASE_CONFIG,
    "config": {
        **AZURE_BASE_CONFIG["config"],
        "deployment_id": "text-embedding-ada-002",
    },
}
def test_azure_embedder_missing_deployment_id():
    """Check that an Azure config without deployment_id is rejected.

    Uses the base fixture as-is (it carries no ``deployment_id``) and expects
    ``configure_embedder`` to raise ``ValueError`` naming that parameter.
    """
    incomplete_config = AZURE_BASE_CONFIG.copy()
    configurator = EmbeddingConfigurator()

    with pytest.raises(ValueError) as excinfo:
        configurator.configure_embedder(incomplete_config)

    error_text = str(excinfo.value)
    assert "Missing required parameters" in error_text
    assert "deployment ID (deployment_id)" in error_text
def test_azure_embedder_missing_api_key():
    """Check that an Azure config without api_key is rejected.

    The config supplies ``deployment_id`` but drops ``api_key``, and the test
    expects ``configure_embedder`` to raise ``ValueError`` naming ``api_key``.
    """
    # Build a fresh nested config so the shared fixture is never mutated.
    azure_settings = {
        key: value
        for key, value in AZURE_BASE_CONFIG["config"].items()
        if key != "api_key"
    }
    azure_settings["deployment_id"] = "text-embedding-ada-002"
    embedder_config = {**AZURE_BASE_CONFIG, "config": azure_settings}
    configurator = EmbeddingConfigurator()

    with pytest.raises(ValueError) as excinfo:
        configurator.configure_embedder(embedder_config)

    error_text = str(excinfo.value)
    assert "Missing required parameters" in error_text
    assert "API key (api_key)" in error_text
def test_azure_embedder_missing_api_base():
    """Check that an Azure config without api_base is rejected.

    The config supplies ``deployment_id`` but drops ``api_base``, and the test
    expects ``configure_embedder`` to raise ``ValueError`` naming ``api_base``.
    """
    # Build a fresh nested config so the shared fixture is never mutated.
    azure_settings = {
        key: value
        for key, value in AZURE_BASE_CONFIG["config"].items()
        if key != "api_base"
    }
    azure_settings["deployment_id"] = "text-embedding-ada-002"
    embedder_config = {**AZURE_BASE_CONFIG, "config": azure_settings}
    configurator = EmbeddingConfigurator()

    with pytest.raises(ValueError) as excinfo:
        configurator.configure_embedder(embedder_config)

    error_text = str(excinfo.value)
    assert "Missing required parameters" in error_text
    assert "API base URL (api_base)" in error_text
def test_azure_embedder_missing_api_version():
    """Check that an Azure config without api_version is rejected.

    The config supplies ``deployment_id`` but drops ``api_version``, and the
    test expects ``configure_embedder`` to raise ``ValueError`` naming
    ``api_version``.
    """
    # Build a fresh nested config so the shared fixture is never mutated.
    azure_settings = {
        key: value
        for key, value in AZURE_BASE_CONFIG["config"].items()
        if key != "api_version"
    }
    azure_settings["deployment_id"] = "text-embedding-ada-002"
    embedder_config = {**AZURE_BASE_CONFIG, "config": azure_settings}
    configurator = EmbeddingConfigurator()

    with pytest.raises(ValueError) as excinfo:
        configurator.configure_embedder(embedder_config)

    error_text = str(excinfo.value)
    assert "Missing required parameters" in error_text
    assert "API version (api_version)" in error_text
def test_azure_embedder_empty_parameters():
    """Check that empty-string parameters are reported as missing.

    Both ``deployment_id`` and ``api_key`` are set to ``""``; the test expects
    ``configure_embedder`` to raise ``ValueError`` naming both of them.
    """
    # Overlay the blank values on a fresh copy of the nested config so the
    # shared fixture is never mutated.
    blank_settings = {
        **AZURE_BASE_CONFIG["config"],
        "deployment_id": "",
        "api_key": "",
    }
    embedder_config = {**AZURE_BASE_CONFIG, "config": blank_settings}
    configurator = EmbeddingConfigurator()

    with pytest.raises(ValueError) as excinfo:
        configurator.configure_embedder(embedder_config)

    error_text = str(excinfo.value)
    assert "Missing required parameters" in error_text
    assert "API key (api_key)" in error_text
    assert "deployment ID (deployment_id)" in error_text
@patch("chromadb.utils.embedding_functions.openai_embedding_function.OpenAIEmbeddingFunction")
def test_azure_embedder_with_all_required_parameters(mock_openai_embedding):
    """Check that a complete Azure config builds the embedding function.

    ``OpenAIEmbeddingFunction`` is patched, so the test only verifies that it
    is called exactly once, that its return value is handed back by
    ``configure_embedder``, and that the Azure parameters are forwarded as
    keyword arguments.
    """
    fake_embedder = MagicMock()
    mock_openai_embedding.return_value = fake_embedder
    complete_config = AZURE_COMPLETE_CONFIG.copy()
    configurator = EmbeddingConfigurator()

    embedder = configurator.configure_embedder(complete_config)

    assert embedder == fake_embedder
    mock_openai_embedding.assert_called_once()

    # Each required Azure parameter must reach the constructor unchanged.
    forwarded = mock_openai_embedding.call_args.kwargs
    expected_kwargs = {
        "api_key": "test-key",
        "api_base": "https://test.openai.azure.com",
        "api_version": "2023-05-15",
        "deployment_id": "text-embedding-ada-002",
    }
    for name, expected_value in expected_kwargs.items():
        assert forwarded[name] == expected_value