diff --git a/libs/partners/openai/langchain_openai/embeddings/azure.py b/libs/partners/openai/langchain_openai/embeddings/azure.py index 684689d92ac..0daabd40f92 100644 --- a/libs/partners/openai/langchain_openai/embeddings/azure.py +++ b/libs/partners/openai/langchain_openai/embeddings/azure.py @@ -99,10 +99,10 @@ class AzureOpenAIEmbeddings(OpenAIEmbeddings): values["azure_ad_token"] = ( convert_to_secret_str(azure_ad_token) if azure_ad_token else None ) - # Azure OpenAI embedding models allow a maximum of 16 texts + # Azure OpenAI embedding models allow a maximum of 2048 texts # at a time in each batch - # See: https://learn.microsoft.com/en-us/azure/ai-services/openai/reference#embeddings - values["chunk_size"] = min(values["chunk_size"], 16) + # See: https://learn.microsoft.com/en-us/azure/ai-services/openai/how-to/embeddings?tabs=console#best-practices + values["chunk_size"] = min(values["chunk_size"], 2048) # For backwards compatibility. Before openai v1, no distinction was made # between azure_endpoint and base_url (openai_api_base). openai_api_base = values["openai_api_base"]