3 changes: 2 additions & 1 deletion docs/my-website/docs/integrations/index.md
@@ -3,6 +3,7 @@
This section covers integrations with various tools and services that can be used with LiteLLM (either Proxy or SDK).

## AI Agent Frameworks
- **[AgentField](../tutorials/agentfield.md)** - Open-source control plane for building and orchestrating autonomous AI agents
- **[Letta](./letta.md)** - Build stateful LLM agents with persistent memory using LiteLLM Proxy

## Development Tools
@@ -15,4 +16,4 @@ This section covers integrations with various tools and services that can be use
- **[Datadog](../observability/datadog.md)**


Click into each section to learn more about the integrations.
124 changes: 124 additions & 0 deletions docs/my-website/docs/tutorials/agentfield.md
@@ -0,0 +1,124 @@
import Tabs from '@theme/Tabs';
import TabItem from '@theme/TabItem';

# AgentField with LiteLLM

Use [AgentField](https://agentfield.ai) with any LLM provider through LiteLLM.

AgentField is an open-source control plane for building and orchestrating autonomous AI agents, with SDKs for Python, TypeScript, and Go.

## Overview

AgentField's Python SDK uses `litellm.acompletion()` under the hood, giving you access to 100+ LLM providers out of the box:

- Use any LiteLLM-supported model (OpenAI, Anthropic, Azure, Bedrock, Ollama, etc.)
- Switch between providers by changing the model string
- All LiteLLM features (caching, fallbacks, routing) work automatically
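
As a rough illustration of the `provider/model` string convention these bullets rely on (the provider set and the OpenAI default below are assumptions for this sketch only; the real resolution happens inside LiteLLM):

```python
# Illustrative sketch of the "provider/model" naming convention.
# KNOWN_PROVIDERS and the "openai" fallback are assumptions for this example;
# LiteLLM performs the actual lookup internally.
KNOWN_PROVIDERS = {"anthropic", "azure", "bedrock", "ollama", "openai"}

def split_model_string(model: str):
    """Return (provider, bare_model); treat unprefixed names as OpenAI-style."""
    prefix, sep, rest = model.partition("/")
    if sep and prefix in KNOWN_PROVIDERS:
        return prefix, rest
    return "openai", model

assert split_model_string("anthropic/claude-sonnet-4-20250514") == (
    "anthropic", "claude-sonnet-4-20250514"
)
assert split_model_string("gpt-4o") == ("openai", "gpt-4o")
```

This is why switching providers is just a change to the model string: the prefix selects the backend, the remainder names the model.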

## Prerequisites

- Python 3.9+
- API keys for your LLM providers
- AgentField control plane (optional, for orchestration features)

## Installation

```bash
pip install agentfield
```

## Quick Start

### Basic Agent with OpenAI

```python
import asyncio

from agentfield import Agent, AgentConfig

config = AgentConfig(
    name="my-agent",
    model="gpt-4o",  # Any LiteLLM-supported model
    instructions="You are a helpful assistant."
)

agent = Agent(config)
response = asyncio.run(agent.run("Hello, world!"))
```

### Using Anthropic

```python
config = AgentConfig(
    name="claude-agent",
    model="anthropic/claude-sonnet-4-20250514",  # LiteLLM model format
    instructions="You are a helpful assistant."
)
```

### Using Ollama (Local Models)

```python
config = AgentConfig(
    name="local-agent",
    model="ollama/llama3.1",  # LiteLLM's ollama/ prefix
    instructions="You are a helpful assistant."
)
```

### Using Azure OpenAI

```python
config = AgentConfig(
    name="azure-agent",
    model="azure/gpt-4o",  # LiteLLM's azure/ prefix
    instructions="You are a helpful assistant."
)
```

### Using with LiteLLM Proxy

Point AgentField to a LiteLLM Proxy for centralized model management:

```python
import os

os.environ["OPENAI_API_BASE"] = "http://0.0.0.0:4000"  # LiteLLM Proxy URL
os.environ["OPENAI_API_KEY"] = "sk-1234"  # LiteLLM Proxy key

config = AgentConfig(
    name="proxy-agent",
    model="gpt-4o",  # Virtual model name from proxy config
    instructions="You are a helpful assistant."
)
```

## Multi-Agent Orchestration

AgentField's control plane orchestrates multiple agents, each potentially using different LLM providers:

```python
from agentfield import Agent, AgentConfig, ControlPlane

# Create agents with different providers
researcher = Agent(AgentConfig(
    name="researcher",
    model="anthropic/claude-sonnet-4-20250514",
    instructions="You research topics thoroughly."
))

writer = Agent(AgentConfig(
    name="writer",
    model="gpt-4o",
    instructions="You write clear, concise content."
))

# Register with control plane
cp = ControlPlane(server="http://localhost:8080")
cp.register(researcher)
cp.register(writer)
```

## Links

- [Documentation](https://agentfield.ai/docs)
- [GitHub](https://github.com/Agent-Field/agentfield)
- [Python SDK](https://github.com/Agent-Field/agentfield/tree/main/sdk/python)
1 change: 1 addition & 0 deletions docs/my-website/sidebars.js
@@ -185,6 +185,7 @@ const sidebars = {
slug: "/agent_sdks"
},
items: [
"tutorials/agentfield",
"tutorials/openai_agents_sdk",
"tutorials/claude_agent_sdk",
"tutorials/copilotkit_sdk",
1 change: 1 addition & 0 deletions litellm/__init__.py
@@ -1452,6 +1452,7 @@ def set_global_gitlab_config(config: Dict[str, Any]) -> None:
from .llms.perplexity.responses.transformation import PerplexityResponsesConfig as PerplexityResponsesConfig
from .llms.databricks.responses.transformation import DatabricksResponsesAPIConfig as DatabricksResponsesAPIConfig
from .llms.openrouter.responses.transformation import OpenRouterResponsesAPIConfig as OpenRouterResponsesAPIConfig
from .llms.ovhcloud.responses.transformation import OVHCloudResponsesAPIConfig as OVHCloudResponsesAPIConfig
from .llms.gemini.interactions.transformation import GoogleAIStudioInteractionsConfig as GoogleAIStudioInteractionsConfig
from .llms.openai.chat.o_series_transformation import OpenAIOSeriesConfig as OpenAIOSeriesConfig, OpenAIOSeriesConfig as OpenAIO1Config
from .llms.anthropic.skills.transformation import AnthropicSkillsConfig as AnthropicSkillsConfig
5 changes: 5 additions & 0 deletions litellm/_lazy_imports_registry.py
@@ -233,6 +233,7 @@
"PerplexityResponsesConfig",
"DatabricksResponsesAPIConfig",
"OpenRouterResponsesAPIConfig",
"OVHCloudResponsesAPIConfig",
"GoogleAIStudioInteractionsConfig",
"OpenAIOSeriesConfig",
"AnthropicSkillsConfig",
@@ -930,6 +931,10 @@
".llms.openrouter.responses.transformation",
"OpenRouterResponsesAPIConfig",
),
"OVHCloudResponsesAPIConfig": (
".llms.ovhcloud.responses.transformation",
"OVHCloudResponsesAPIConfig",
),
"GoogleAIStudioInteractionsConfig": (
".llms.gemini.interactions.transformation",
"GoogleAIStudioInteractionsConfig",
20 changes: 17 additions & 3 deletions litellm/cost_calculator.py
@@ -1095,6 +1095,19 @@ def completion_cost( # noqa: PLR0915
router_model_id=router_model_id,
)

# When base_model overrides model and carries its own provider prefix
# (e.g. base_model="gemini/gemini-2.0-flash" on an anthropic deployment),
# align custom_llm_provider so cost_per_token builds the correct key.
# Skip when custom_pricing is True (base_model is ignored in that path).
_provider_overridden = False
if base_model is not None and selected_model is not None and not custom_pricing:
_parts = selected_model.split("/", 1)
if len(_parts) > 1 and _parts[0] in LlmProvidersSet:
extracted = _parts[0]
if extracted != custom_llm_provider:
custom_llm_provider = extracted
_provider_overridden = True

potential_model_names = [
selected_model,
_get_response_model(completion_response),
@@ -1176,6 +1189,10 @@

hidden_params = getattr(completion_response, "_hidden_params", None)
if hidden_params is not None:
custom_llm_provider = hidden_params.get(
"custom_llm_provider", custom_llm_provider or None
)
if not _provider_overridden:
custom_llm_provider = hidden_params.get(
"custom_llm_provider", custom_llm_provider or None
)
region_name = hidden_params.get("region_name", region_name)

# For Gemini/Vertex AI responses, trafficType is stored in
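For illustration, the override logic in this hunk can be exercised in isolation. This is a sketch only, with `LlmProvidersSet` stubbed as a plain set (the real one lives in litellm):

```python
LlmProvidersSet = {"gemini", "anthropic", "openai"}  # stub for this sketch only

def resolve_provider(selected_model, custom_llm_provider, custom_pricing, base_model):
    """Mirror of the hunk: align the provider with a base_model-style prefix."""
    overridden = False
    if base_model is not None and selected_model is not None and not custom_pricing:
        parts = selected_model.split("/", 1)
        if len(parts) > 1 and parts[0] in LlmProvidersSet:
            if parts[0] != custom_llm_provider:
                custom_llm_provider = parts[0]
                overridden = True
    return custom_llm_provider, overridden

# gemini/ base_model on an anthropic deployment -> provider realigned
assert resolve_provider(
    "gemini/gemini-2.0-flash", "anthropic", False, "gemini/gemini-2.0-flash"
) == ("gemini", True)
# custom_pricing=True skips the override, as in the hunk
assert resolve_provider(
    "gemini/gemini-2.0-flash", "anthropic", True, "gemini/gemini-2.0-flash"
) == ("anthropic", False)
```

The returned flag corresponds to `_provider_overridden`, which later suppresses the `hidden_params` provider lookup so the override survives.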
11 changes: 10 additions & 1 deletion litellm/litellm_core_utils/audio_utils/utils.py
@@ -263,7 +263,16 @@ def calculate_request_duration(file: FileTypes) -> Optional[float]:
# Extract duration using soundfile
file_object = io.BytesIO(file_content)
with sf.SoundFile(file_object) as audio:
duration = len(audio) / audio.samplerate
frames = len(audio)
# Guard against sentinel/invalid frame counts (e.g., 2^63-1 from libsndfile)
if frames <= 0 or frames >= 2**63 - 1:
return None
if audio.samplerate <= 0:
return None
duration = frames / audio.samplerate
# Reject implausible durations (> 24 hours)
if duration > 86400:
return None
Comment on lines +266 to +275 (Contributor):

No unit tests for the sentinel guard and samplerate fix

The two new guards (frames >= 2**63 - 1 and samplerate <= 0) are described as the primary bug fix in the PR title, yet no corresponding test was added in tests/test_litellm/litellm_core_utils/test_audio_utils.py. The project's own pre-submission checklist states "Adding at least 1 test is a hard requirement". Without tests it's difficult to verify the sentinel-value path returns None and that the samplerate guard prevents a ZeroDivisionError.

return duration

except Exception:
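The guards the reviewer wants covered are straightforward to test once isolated from soundfile. A hedged sketch of such a test, re-stating the guard as a pure function (a real regression test would need soundfile and a crafted file reporting a sentinel frame count):

```python
from typing import Optional

LIBSNDFILE_SENTINEL = 2**63 - 1  # frame count libsndfile can report for corrupt input

def safe_duration(frames: int, samplerate: int) -> Optional[float]:
    """Pure re-statement of the hunk's guards, for testing in isolation."""
    if frames <= 0 or frames >= LIBSNDFILE_SENTINEL:
        return None  # sentinel / invalid frame count
    if samplerate <= 0:
        return None  # avoids ZeroDivisionError
    duration = frames / samplerate
    if duration > 86400:
        return None  # implausible (> 24 h)
    return duration

assert safe_duration(LIBSNDFILE_SENTINEL, 44100) is None
assert safe_duration(44100, 0) is None
assert safe_duration(44100 * 10, 44100) == 10.0
```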
@@ -46,6 +46,20 @@

from .get_headers import get_response_headers

def _normalize_images(
images: Optional[List[Dict[str, object]]],
) -> Optional[List[Dict[str, object]]]:
"""Normalize image items to include required 'index' field if missing."""
if images is None:
return None
normalized: List[Dict[str, object]] = []
for i, img in enumerate(images):
if isinstance(img, dict) and "index" not in img:
img = {**img, "index": i}
normalized.append(img)
return normalized
Comment on lines +49 to +60 (Contributor):

No unit tests for _normalize_images

This is the other primary bug fix in the PR title (OpenRouter/Gemini images missing index causing pydantic ValidationError), yet no test was added for _normalize_images in tests/test_litellm/. A simple test asserting that:

  • a list of dicts without index gets sequential indices backfilled
  • a list of dicts already having index is returned unchanged
  • None is returned as-is

…would greatly increase confidence in the fix and protect against regressions.

Comment on lines +49 to +60 (Contributor):

_normalize_images is dead code — never called

This function was added by the PR but is never invoked anywhere in the codebase. A grep of the whole repo confirms the only occurrence is its own definition at line 49.

The actual image-index fix is handled by the pre-existing _normalize_images_for_message() (lines 70–85), which was already present before this PR and is already called at line 627:

images=_normalize_images_for_message(
    choice["message"].get("images", None)
),

The two functions are nearly identical in behavior. Because _normalize_images is never reached by any call path, the stated bug fix is entirely carried by the pre-existing helper — not by this new function. Either remove this function or wire it up to an actual call site.



_MESSAGE_FIELDS: frozenset = frozenset(Message.model_fields.keys())
_CHOICES_FIELDS: frozenset = frozenset(Choices.model_fields.keys())
_MODEL_RESPONSE_FIELDS: frozenset = frozenset(ModelResponse.model_fields.keys()) | {
@@ -24,6 +24,10 @@
from litellm.types.router import GenericLiteLLMParams
from litellm.utils import ProviderConfigManager, client

from litellm.litellm_core_utils.prompt_templates.common_utils import (
DEFAULT_ASSISTANT_CONTINUE_MESSAGE,
)

from ..adapters.handler import LiteLLMMessagesToCompletionTransformationHandler
from ..responses_adapters.handler import LiteLLMMessagesToResponsesAPIHandler
from .utils import AnthropicMessagesRequestUtils, mock_response
@@ -49,6 +53,58 @@ def _should_route_to_responses_api(custom_llm_provider: Optional[str]) -> bool:
#################################################


def _sanitize_anthropic_messages(messages: List[Dict]) -> List[Dict]:
"""
Sanitize messages for the /v1/messages endpoint.

The Anthropic API can return assistant messages with empty text blocks
alongside tool_use blocks (e.g., {"type": "text", "text": ""}). While
the API returns these, it rejects them when sent back in subsequent
requests with "text content blocks must be non-empty".

This is particularly common in multi-turn tool-use conversations (e.g.,
Claude Code / Agent SDK) where the model starts a text block but
immediately switches to a tool_use block.

The /v1/chat/completions path already handles this via
process_empty_text_blocks() in factory.py, but the /v1/messages path
was missing sanitization.
"""
for i, message in enumerate(messages):
content = message.get("content")
if not isinstance(content, list):
continue

# Filter out empty text blocks, keeping non-empty text and other types.
# Use `(... or "")` to guard against None text values.
filtered = [
block
for block in content
if not (
isinstance(block, dict)
and block.get("type") == "text"
and not (block.get("text") or "").strip()
)
]

# Only update if we actually removed something.
# Avoid mutating the caller's dicts — create a shallow copy.
if len(filtered) < len(content):
if len(filtered) > 0:
messages[i] = {**message, "content": filtered}
else:
# All blocks were empty text — replace with a continuation
# message rather than leaving empty blocks that trigger 400
# errors. Matches behavior of process_empty_text_blocks()
# in factory.py.
messages[i] = {
**message,
"content": [{"type": "text", "text": DEFAULT_ASSISTANT_CONTINUE_MESSAGE.get("content", "Please continue.")}],
Comment on lines +75 to +102 (Contributor):

In-place mutation of the input messages list

The function docstring comment says "Avoid mutating the caller's dicts — create a shallow copy", but the function actually mutates the input messages list itself via messages[i] = .... Only the individual message dicts get shallow copies — the outer list is still modified in-place.

While each updated message dict is a new object ({**message, ...}), lines like:

    messages[i] = {**message, "content": filtered}

…write back into the original list. Any caller that holds a reference to the same list object (e.g. for retry logic, logging, or span attributes) will observe the sanitised content unexpectedly.

A safe alternative is to build a new list rather than modifying in place:

    def _sanitize_anthropic_messages(messages: List[Dict]) -> List[Dict]:
        result = []
        for message in messages:
            content = message.get("content")
            if not isinstance(content, list):
                result.append(message)
                continue
            filtered = [
                block
                for block in content
                if not (
                    isinstance(block, dict)
                    and block.get("type") == "text"
                    and not (block.get("text") or "").strip()
                )
            ]
            if len(filtered) < len(content):
                if len(filtered) > 0:
                    result.append({**message, "content": filtered})
                else:
                    result.append({
                        **message,
                        "content": [{"type": "text", "text": DEFAULT_ASSISTANT_CONTINUE_MESSAGE.get("content", "Please continue.")}],
                    })
            else:
                result.append(message)
        return result

}

Comment on lines +93 to +104 (Contributor):

The function mutates the input messages list in-place via messages[i] = ..., despite the comment at line 91 suggesting immutability ("Avoid mutating the caller's dicts"). While each dict is shallow-copied, the list structure itself is modified, which violates the documented contract.

To ensure immutability and prevent bugs in callers that hold references to the original list, build a new list instead:

    def _sanitize_anthropic_messages(messages: List[Dict]) -> List[Dict]:
        """..."""
        result = []
        for message in messages:
            content = message.get("content")
            if not isinstance(content, list):
                result.append(message)
                continue

            filtered = [
                block
                for block in content
                if not (
                    isinstance(block, dict)
                    and block.get("type") == "text"
                    and not (block.get("text") or "").strip()
                )
            ]

            if len(filtered) < len(content):
                if len(filtered) > 0:
                    result.append({**message, "content": filtered})
                else:
                    result.append({
                        **message,
                        "content": [{"type": "text", "text": DEFAULT_ASSISTANT_CONTINUE_MESSAGE.get("content", "Please continue.")}],
                    })
            else:
                result.append(message)

        return result

The call site already reassigns (messages = _sanitize_anthropic_messages(messages)), so this change is safe.

return messages


async def _execute_pre_request_hooks(
model: str,
messages: List[Dict],
@@ -137,6 +193,10 @@ async def anthropic_messages(
"""
Async: Make llm api request in Anthropic /messages API spec
"""
# Sanitize empty text blocks from messages before processing.
# See: https://github.com/BerriAI/litellm/issues/22930
messages = _sanitize_anthropic_messages(messages)

# Execute pre-request hooks to allow CustomLoggers to modify request
request_kwargs = await _execute_pre_request_hooks(
model=model,
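The aliasing both reviewers describe is easy to demonstrate. A minimal sketch, reduced to the filtering branch of the sanitizer (the all-empty continuation case is omitted for brevity):

```python
def sanitize_in_place(messages):
    # Reduced copy of the hunk's logic: each rewritten dict is a new object,
    # but messages[i] = ... still writes into the caller's own list.
    for i, message in enumerate(messages):
        content = message.get("content")
        if not isinstance(content, list):
            continue
        filtered = [
            block
            for block in content
            if not (
                isinstance(block, dict)
                and block.get("type") == "text"
                and not (block.get("text") or "").strip()
            )
        ]
        if len(filtered) < len(content) and filtered:
            messages[i] = {**message, "content": filtered}
    return messages

caller_list = [{
    "role": "assistant",
    "content": [{"type": "text", "text": ""}, {"type": "tool_use", "name": "search"}],
}]
sanitize_in_place(caller_list)
# The caller's own list now holds the sanitised message too.
assert caller_list[0]["content"] == [{"type": "tool_use", "name": "search"}]
```

This is the behavior the suggested build-a-new-list rewrite avoids.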
6 changes: 6 additions & 0 deletions litellm/llms/ollama/completion/transformation.py
@@ -238,6 +238,12 @@ def get_model_info(
or get_secret_str("OLLAMA_API_BASE")
or "http://localhost:11434"
)
# Strip any endpoint paths that may have been appended by get_complete_url()
# to avoid malformed URLs like /api/generate/api/show
for endpoint in ["/api/generate", "/api/chat", "/api/embed"]:
if api_base.endswith(endpoint):
api_base = api_base[: -len(endpoint)]
break
api_key = self.get_api_key()
headers = {"Authorization": f"Bearer {api_key}"} if api_key else {}

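The suffix stripping in this hunk is a good candidate for a small table-style unit test. A sketch of the same loop as a standalone helper (names here are illustrative, not the module's own):

```python
def strip_endpoint_suffix(api_base: str) -> str:
    # Mirrors the hunk: drop a trailing completion-endpoint path so the
    # caller can append /api/show without producing /api/generate/api/show.
    for endpoint in ("/api/generate", "/api/chat", "/api/embed"):
        if api_base.endswith(endpoint):
            return api_base[: -len(endpoint)]
    return api_base

assert strip_endpoint_suffix("http://localhost:11434/api/generate") == "http://localhost:11434"
assert strip_endpoint_suffix("http://localhost:11434/api/chat") == "http://localhost:11434"
assert strip_endpoint_suffix("http://localhost:11434") == "http://localhost:11434"
```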
1 change: 1 addition & 0 deletions litellm/llms/ovhcloud/responses/__init__.py
@@ -0,0 +1 @@
"""OVHCloud Responses API support"""