add first-class support for Azure OpenAI

Author: Senko Rasic, 2024-06-05 09:53:46 +02:00 (committed by Senko Rašić)
parent 984caedfac · commit dbd3bec8b5
5 changed files with 59 additions and 5 deletions

core/config.py

@@ -1,6 +1,6 @@
 from enum import Enum
 from os.path import abspath, dirname, isdir, join
-from typing import Literal, Optional, Union
+from typing import Any, Literal, Optional, Union
 
 from pydantic import BaseModel, ConfigDict, Field, field_validator
 from typing_extensions import Annotated
@@ -55,6 +55,7 @@ class LLMProvider(str, Enum):
     ANTHROPIC = "anthropic"
     GROQ = "groq"
     LM_STUDIO = "lm-studio"
+    AZURE = "azure"
 
 
 class UIAdapter(str, Enum):
@@ -89,6 +90,10 @@ class ProviderConfig(_StrictModel):
         description="Timeout (in seconds) for receiving a new chunk of data from the response stream",
         ge=0.0,
     )
+    extra: Optional[dict[str, Any]] = Field(
+        None,
+        description="Extra provider-specific configuration",
+    )
 
 
 class AgentLLMConfig(_StrictModel):
@@ -140,6 +145,10 @@ class LLMConfig(_StrictModel):
         description="Timeout (in seconds) for receiving a new chunk of data from the response stream",
         ge=0.0,
     )
+    extra: Optional[dict[str, Any]] = Field(
+        None,
+        description="Extra provider-specific configuration",
+    )
 
     @classmethod
     def from_provider_and_agent_configs(cls, provider: ProviderConfig, agent: AgentLLMConfig):
@@ -151,6 +160,7 @@ class LLMConfig(_StrictModel):
             temperature=agent.temperature,
             connect_timeout=provider.connect_timeout,
             read_timeout=provider.read_timeout,
+            extra=provider.extra,
         )
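Taken together, the core/config.py changes thread an optional `extra` dict from the provider section of the config file through to the merged per-agent `LLMConfig`. A minimal standalone sketch of that flow (simplified models; the field names are taken from the hunks above):

```python
from typing import Any, Optional

from pydantic import BaseModel


# Simplified stand-ins for ProviderConfig / LLMConfig from the diff above.
class ProviderConfig(BaseModel):
    base_url: Optional[str] = None
    api_key: Optional[str] = None
    extra: Optional[dict[str, Any]] = None  # new in this commit


class LLMConfig(BaseModel):
    base_url: Optional[str] = None
    api_key: Optional[str] = None
    extra: Optional[dict[str, Any]] = None  # new in this commit


provider = ProviderConfig(
    base_url="https://your-resource-name.openai.azure.com/",
    extra={"azure_deployment": "your-azure-deployment-id", "api_version": "2024-02-01"},
)

# Mirrors from_provider_and_agent_configs(): `extra` is copied over unchanged.
llm = LLMConfig(base_url=provider.base_url, api_key=provider.api_key, extra=provider.extra)
assert llm.extra == {"azure_deployment": "your-azure-deployment-id", "api_version": "2024-02-01"}
```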

core/llm/azure_client.py (new file, 29 lines)

@@ -0,0 +1,29 @@
+from httpx import Timeout
+from openai import AsyncAzureOpenAI
+
+from core.config import LLMProvider
+from core.llm.openai_client import OpenAIClient
+from core.log import get_logger
+
+log = get_logger(__name__)
+
+
+class AzureClient(OpenAIClient):
+    provider = LLMProvider.AZURE
+    stream_options = None
+
+    def _init_client(self):
+        azure_deployment = self.config.extra.get("azure_deployment")
+        api_version = self.config.extra.get("api_version")
+        self.client = AsyncAzureOpenAI(
+            api_key=self.config.api_key,
+            azure_endpoint=self.config.base_url,
+            azure_deployment=azure_deployment,
+            api_version=api_version,
+            timeout=Timeout(
+                max(self.config.connect_timeout, self.config.read_timeout),
+                connect=self.config.connect_timeout,
+                read=self.config.read_timeout,
+            ),
+        )
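One caveat worth noting: `ProviderConfig.extra` defaults to `None`, so `_init_client()` above would raise `AttributeError` if the `azure` provider were configured without an `extra` block. A defensive variant of the two lookups (an editorial suggestion, not part of this commit):

```python
# Fall back to an empty dict so a missing "extra" config block surfaces as
# missing deployment/version arguments rather than an AttributeError on None.
extra = self.config.extra or {}
azure_deployment = extra.get("azure_deployment")
api_version = extra.get("api_version")
```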

core/llm/base.py

@@ -316,6 +316,7 @@ class BaseLLMClient:
         :return: Client class for the specified provider.
         """
         from .anthropic_client import AnthropicClient
+        from .azure_client import AzureClient
         from .groq_client import GroqClient
         from .openai_client import OpenAIClient
@@ -325,6 +326,8 @@ class BaseLLMClient:
             return AnthropicClient
         elif provider == LLMProvider.GROQ:
             return GroqClient
+        elif provider == LLMProvider.AZURE:
+            return AzureClient
         else:
             raise ValueError(f"Unsupported LLM provider: {provider.value}")
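After these two hunks, resolving a client class for the new provider would look roughly like this (`for_provider` is an assumed method name; the hunks show only the method's body and docstring):

```python
from core.config import LLMProvider
from core.llm.base import BaseLLMClient

# Hypothetical usage; the factory method's real name isn't visible in the diff.
client_class = BaseLLMClient.for_provider(LLMProvider.AZURE)
assert client_class.__name__ == "AzureClient"
```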

core/llm/openai_client.py

@@ -17,6 +17,7 @@ tokenizer = tiktoken.get_encoding("cl100k_base")
 
 class OpenAIClient(BaseLLMClient):
     provider = LLMProvider.OPENAI
+    stream_options = {"include_usage": True}
 
     def _init_client(self):
         self.client = AsyncOpenAI(
@@ -40,10 +41,10 @@ class OpenAIClient(BaseLLMClient):
             "messages": convo.messages,
             "temperature": self.config.temperature if temperature is None else temperature,
             "stream": True,
-            "stream_options": {
-                "include_usage": True,
-            },
         }
+        if self.stream_options:
+            completion_kwargs["stream_options"] = self.stream_options
+
         if json_mode:
             completion_kwargs["response_format"] = {"type": "json_object"}
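Design note: hoisting the previously hardcoded `stream_options` dict into a class attribute turns it into a per-provider switch. `OpenAIClient` keeps `{"include_usage": True}` so streamed responses still report token usage, while `AzureClient` (above) sets `stream_options = None` to omit the parameter entirely, presumably because the Azure endpoint at the pinned `api_version` does not accept it.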

example-config.json

@@ -1,6 +1,6 @@
{
// Configuration for the LLM providers that can be used. Pythagora supports
// OpenAI, Anthropic and Groq. Azure and OpenRouter and local LLMs (such as LM-Studio)
// OpenAI, Azure, Anthropic and Groq. OpenRouter and local LLMs (such as LM-Studio)
// also work, you can use "openai" provider to define these.
"llm": {
"openai": {
@@ -9,6 +9,17 @@
"api_key": null,
"connect_timeout": 60.0,
"read_timeout": 10.0
},
// Example config for Azure OpenAI (see https://learn.microsoft.com/en-us/azure/ai-services/openai/reference#chat-completions)
"azure": {
"base_url": "https://your-resource-name.openai.azure.com/",
"api_key": "your-api-key",
"connect_timeout": 60.0,
"read_timeout": 10.0,
"extra": {
"azure_deployment": "your-azure-deployment-id",
"api_version": "2024-02-01"
}
}
},
// Each agent can use a different model or configuration. The default, as before, is GPT4 Turbo
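For reference, here is how the example `azure` section above maps onto the SDK client built in core/llm/azure_client.py: `base_url` becomes `azure_endpoint`, and the two `extra` keys pass straight through (placeholder values copied from the config above):

```python
from openai import AsyncAzureOpenAI

client = AsyncAzureOpenAI(
    api_key="your-api-key",                                          # api_key
    azure_endpoint="https://your-resource-name.openai.azure.com/",   # base_url
    azure_deployment="your-azure-deployment-id",                     # extra.azure_deployment
    api_version="2024-02-01",                                        # extra.api_version
)
```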