fix(backend): correct LLM configurations (#10585)

## Summary Corrects the max output token limit for GPT5_CHAT, fixes the provider for CLAUDE_4_1_OPUS from 'openai' to 'anthropic', and adds a 600s timeout to the Anthropic client call in llm_call. ## Changes 🏗️ - Lowered GPT5_CHAT's max output tokens from 128000 to 16384 (16k); its 400000-token context window is unchanged - Changed CLAUDE_4_1_OPUS's provider from openai to anthropic - Added a 600s timeout to the Anthropic client call ## Checklist 📋 #### For code changes: - [x] I have clearly listed my changes in the PR description - [x] I have made a test plan - [x] I have tested my changes according to the test plan: - [x] Tested all models and confirmed they work
2026-02-09 14:25:25 -05:00 · 2025-08-08 16:45:18 +01:00
parent c1c5571fd5
commit b68e490868
1 changed files with 3 additions and 2 deletions
--- a/autogpt_platform/backend/backend/blocks/llm.py
+++ b/autogpt_platform/backend/backend/blocks/llm.py
@@ -183,7 +183,7 @@ MODEL_METADATA = {
    LlmModel.GPT5: ModelMetadata("openai", 400000, 128000),
    LlmModel.GPT5_MINI: ModelMetadata("openai", 400000, 128000),
    LlmModel.GPT5_NANO: ModelMetadata("openai", 400000, 128000),
-    LlmModel.GPT5_CHAT: ModelMetadata("openai", 400000, 128000),
+    LlmModel.GPT5_CHAT: ModelMetadata("openai", 400000, 16384),
    LlmModel.GPT41: ModelMetadata("openai", 1047576, 32768),
    LlmModel.GPT41_MINI: ModelMetadata("openai", 1047576, 32768),
    LlmModel.GPT4O_MINI: ModelMetadata(
@@ -196,7 +196,7 @@ MODEL_METADATA = {
    LlmModel.GPT3_5_TURBO: ModelMetadata("openai", 16385, 4096),  # gpt-3.5-turbo-0125
    # https://docs.anthropic.com/en/docs/about-claude/models
    LlmModel.CLAUDE_4_1_OPUS: ModelMetadata(
-        "openai", 200000, 32000
+        "anthropic", 200000, 32000
    ),  # claude-opus-4-1-20250805
    LlmModel.CLAUDE_4_OPUS: ModelMetadata(
        "anthropic", 200000, 8192
@@ -493,6 +493,7 @@ async def llm_call(
                messages=messages,
                max_tokens=max_tokens,
                tools=an_tools,
+                timeout=600,
            )

            if not resp.content: