packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/span_utils.py
@@ -174,7 +174,7 @@ async def aset_input_attributes(span, kwargs):
    if schema:
        set_span_attribute(
            span,
-           SpanAttributes.LLM_REQUEST_STRUCTURED_OUTPUT_SCHEMA,
+           "gen_ai.request.structured_output_schema",

⚠️ Potential issue | 🟡 Minor

🧩 Analysis chain

🏁 Script executed:

rg -n "LLM_REQUEST_STRUCTURED_OUTPUT_SCHEMA\|structured_output_schema" \
  --type py \
  packages/opentelemetry-semantic-conventions-ai

Repository: traceloop/openllmetry

Length of output: 47


🏁 Script executed:

# Also check the imports and all attribute usages in the span_utils.py file
cat -n packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/span_utils.py | head -20

Repository: traceloop/openllmetry

Length of output: 689


🏁 Script executed:

# Check all attribute assignments in the file to understand the pattern
rg -n "SpanAttributes\.|GenAIAttributes\.|\"gen_ai\." \
  packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/span_utils.py \
  -A 1

Repository: traceloop/openllmetry

Length of output: 4042


🏁 Script executed:

# Check what constants are available in SpanAttributes
rg -n "LLM_REQUEST|structured" \
  --type py \
  packages/opentelemetry-semantic-conventions-ai

Repository: traceloop/openllmetry

Length of output: 642


🏁 Script executed:

# List all available files in the semantic-conventions-ai package
find packages/opentelemetry-semantic-conventions-ai -name "*.py" -type f | head -20

Repository: traceloop/openllmetry

Length of output: 515


🏁 Script executed:

# Check the main attributes file to see what constants are defined
cat -n packages/opentelemetry-semantic-conventions-ai/opentelemetry/semconv_ai/__init__.py

Repository: traceloop/openllmetry

Length of output: 15476


Add LLM_REQUEST_STRUCTURED_OUTPUT_SCHEMA constant to SpanAttributes or use the appropriate semantic convention constant.

The constant LLM_REQUEST_STRUCTURED_OUTPUT_SCHEMA does not exist in opentelemetry-semantic-conventions-ai. Line 177 uses a literal string "gen_ai.request.structured_output_schema" while all other attributes in this file reference named constants from SpanAttributes or GenAIAttributes (e.g., SpanAttributes.LLM_REQUEST_FUNCTIONS at line 159, SpanAttributes.LLM_USAGE_TOTAL_TOKENS at lines 337, 361).

Either define this constant in SpanAttributes to align with semantic conventions best practices and maintain consistency, or verify that this attribute name is correct and document why a literal string is necessary here.

🤖 Prompt for AI Agents
Verify each finding against the current code and only fix it if needed.

In
`packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/span_utils.py`
at line 177, replace the literal "gen_ai.request.structured_output_schema" with
a named semantic constant: add LLM_REQUEST_STRUCTURED_OUTPUT_SCHEMA =
"gen_ai.request.structured_output_schema" to SpanAttributes (where the other
constants are defined), then use
SpanAttributes.LLM_REQUEST_STRUCTURED_OUTPUT_SCHEMA in span_utils.py in place of
the literal; update imports if necessary so span_utils.py references the new
SpanAttributes constant instead of the hard-coded string.
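
As a sketch (not the committed code), the suggested change would look roughly like this; the class layout of SpanAttributes and the exact placement of the constant are assumptions:

```python
# packages/opentelemetry-semantic-conventions-ai/opentelemetry/semconv_ai/__init__.py
# (sketch: new constant added alongside the existing LLM_REQUEST_* attributes)
class SpanAttributes:
    LLM_REQUEST_STRUCTURED_OUTPUT_SCHEMA = "gen_ai.request.structured_output_schema"


# packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/span_utils.py
# (sketch: the call site references the named constant instead of the literal)
import json

from opentelemetry.semconv_ai import SpanAttributes

if schema:
    set_span_attribute(
        span,
        SpanAttributes.LLM_REQUEST_STRUCTURED_OUTPUT_SCHEMA,
        json.dumps(schema),
    )
```

Since the constant and the literal resolve to the same string, this is purely a naming/consistency change with no runtime effect.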

            json.dumps(schema),
        )

packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/streaming.py
@@ -94,6 +94,13 @@ def _set_token_usage(
    )
    set_span_attribute(span, SpanAttributes.LLM_USAGE_TOTAL_TOKENS, total_tokens)

+   set_span_attribute(
+       span, SpanAttributes.GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS, cache_read_tokens
+   )
+   set_span_attribute(
+       span, SpanAttributes.GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS, cache_creation_tokens
+   )
Comment on lines +97 to +102

⚠️ Potential issue | 🟠 Major

🧩 Analysis chain

🏁 Script executed:

# First, let's verify the streaming.py file content at the specified lines
echo "=== Content of streaming.py around lines 97-102 ==="
cat -n packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/streaming.py | sed -n '80,110p'

Repository: traceloop/openllmetry

Length of output: 1460


🏁 Script executed:

# Now check for cache token attributes in __init__.py
echo "=== Searching for cache token attributes in __init__.py ==="
rg -n "CACHE_READ_INPUT_TOKENS|CACHE_CREATION_INPUT_TOKENS" \
  --type py \
  packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/

Repository: traceloop/openllmetry

Length of output: 1227


🏁 Script executed:

# Check the set_span_attribute function implementation
echo "=== Checking set_span_attribute function in utils.py ==="
cat -n packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/utils.py | head -40

Repository: traceloop/openllmetry

Length of output: 1450


🏁 Script executed:

# Search for _set_token_usage and _aset_token_usage functions in __init__.py
echo "=== Searching for token usage functions in __init__.py ==="
rg -n "_set_token_usage|_aset_token_usage" \
  --type py \
  packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/__init__.py \
  -A 15

Repository: traceloop/openllmetry

Length of output: 2829


🏁 Script executed:

# Check the actual cache token attribute lines in __init__.py more closely
echo "=== Checking cache token attributes in _aset_token_usage (around line 286) ==="
cat -n packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/__init__.py | sed -n '280,295p'

echo ""
echo "=== Checking cache token attributes in _set_token_usage (around line 400) ==="
cat -n packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/__init__.py | sed -n '395,410p'

Repository: traceloop/openllmetry

Length of output: 1455


🏁 Script executed:

# Verify the SpanAttributes constants used in both files
echo "=== SpanAttributes imports and usage in streaming.py ==="
head -50 packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/streaming.py | grep -i "import\|SpanAttributes"

echo ""
echo "=== SpanAttributes imports in __init__.py ==="
head -50 packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/__init__.py | grep -i "import\|SpanAttributes"

Repository: traceloop/openllmetry

Length of output: 1867


🏁 Script executed:

# Let's verify the SpanAttributes constants to understand the difference
echo "=== Checking what SpanAttributes constants are available ==="
rg "LLM_USAGE_CACHE|GEN_AI_USAGE_CACHE" --type py

Repository: traceloop/openllmetry

Length of output: 2886


🏁 Script executed:

# Check if these are custom constants defined in the package
echo "=== Looking for SpanAttributes definition/import ==="
rg -n "class SpanAttributes|from.*SpanAttributes" --type py packages/opentelemetry-instrumentation-anthropic/ -B 2 -A 2

Repository: traceloop/openllmetry

Length of output: 2561


🏁 Script executed:

# Quick check to confirm cache_read_tokens and cache_creation_tokens extraction in __init__.py
echo "=== Checking cache token extraction in __init__.py _aset_token_usage ==="
cat -n packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/__init__.py | sed -n '200,230p'

Repository: traceloop/openllmetry

Length of output: 1619


Cache token attributes correctly restored, but SpanAttributes constants are inconsistently named across files.

The new set_span_attribute calls for cache tokens in streaming.py (lines 97-102) are correct and consistent with the existing token usage pattern. Cache tokens default to 0 (lines 82, 85), so these attributes will always be set, matching the behavior of LLM_USAGE_TOTAL_TOKENS on line 95.

The non-streaming path in __init__.py also sets cache token attributes in both _aset_token_usage() (lines 286, 290) and _set_token_usage() (lines 400, 404), as expected.

However, there's an inconsistency: streaming.py uses SpanAttributes.LLM_USAGE_CACHE_* constants while __init__.py uses SpanAttributes.GEN_AI_USAGE_CACHE_* constants. Both resolve to the same attribute names (e.g., "gen_ai.usage.cache_read_input_tokens"), so they function identically, but the naming should be consistent across the codebase. Use the same constant names in both files.

🤖 Prompt for AI Agents
Verify each finding against the current code and only fix it if needed.

In
`packages/opentelemetry-instrumentation-anthropic/opentelemetry/instrumentation/anthropic/streaming.py`
around lines 97-102, the cache token span attributes in streaming.py use
SpanAttributes.LLM_USAGE_CACHE_READ_INPUT_TOKENS and
SpanAttributes.LLM_USAGE_CACHE_CREATION_INPUT_TOKENS, which are inconsistent
with the rest of the codebase, which uses
SpanAttributes.GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS and
SpanAttributes.GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS (as seen in
__init__.py); update the set_span_attribute calls in streaming.py to use the
GEN_AI_USAGE_CACHE_* constants instead and confirm the SpanAttributes import
covers those names.
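
A sketch of the aligned calls in streaming.py; this matches the committed hunk shown above, and the point is only that the GEN_AI_USAGE_CACHE_* spelling is the one to standardize on (per the analysis, both spellings resolve to the same attribute strings):

```python
# streaming.py (sketch): use the GEN_AI_USAGE_CACHE_* spelling that
# __init__.py already uses. Both spellings resolve to
# "gen_ai.usage.cache_read_input_tokens" and
# "gen_ai.usage.cache_creation_input_tokens", so only the naming changes.
set_span_attribute(
    span, SpanAttributes.GEN_AI_USAGE_CACHE_READ_INPUT_TOKENS, cache_read_tokens
)
set_span_attribute(
    span,
    SpanAttributes.GEN_AI_USAGE_CACHE_CREATION_INPUT_TOKENS,
    cache_creation_tokens,
)
```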


    set_span_attribute(
        span, GenAIAttributes.GEN_AI_RESPONSE_MODEL, complete_response.get("model")
    )
@@ -13,7 +13,7 @@ requires-python = ">=3.10,<4"
dependencies = [
    "opentelemetry-api>=1.38.0,<2",
    "opentelemetry-instrumentation>=0.59b0",
-   "opentelemetry-semantic-conventions-ai>=0.4.13,<0.5.0",
+   "opentelemetry-semantic-conventions-ai>=0.4.14,<0.5.0",
    "opentelemetry-semantic-conventions>=0.59b0",
]

@@ -2,13 +2,51 @@

import pytest
from opentelemetry.sdk._logs import ReadableLogRecord
+from opentelemetry.sdk.trace import ReadableSpan
from opentelemetry.semconv._incubating.attributes import (
    gen_ai_attributes as GenAIAttributes,
)

from .utils import verify_metrics


+def _verify_caching_attributes(
+    cache_creation_span: ReadableSpan,
+    cache_read_span: ReadableSpan,
+    input_tokens: int,
+    cache_creation_span_output_tokens: int,
+    cache_read_span_output_tokens: int,
+    cached_tokens: int,
+):
+    assert (
+        cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
+        == cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"]
+    )
+
+    # first check that cache_creation_span only wrote to the cache and did not read from it
+    assert cache_creation_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 0
+    assert (
+        cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"] != 0
+    )
+
+    # then check the exact figures for the fixture/cassette
+    assert (
+        cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
+        == cached_tokens
+    )
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == input_tokens
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == cache_creation_span_output_tokens
+
+    # likewise, check that cache_read_span only read from the cache and did not write to it
+    assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
+    assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0
+
+    # then check the exact figures for the fixture/cassette
+    assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == cached_tokens
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == input_tokens
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == cache_read_span_output_tokens


@pytest.mark.vcr
def test_anthropic_prompt_caching_legacy(
instrument_legacy, anthropic_client, span_exporter, log_exporter, reader
@@ -70,6 +108,11 @@ def test_anthropic_prompt_caching_legacy(
    assert cache_read_span.attributes["gen_ai.prompt.1.role"] == "user"
    assert text == cache_read_span.attributes["gen_ai.prompt.1.content"]

+   assert (
+       cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
+       == cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"]
+   )
+
    assert (
        cache_creation_span.attributes.get("gen_ai.response.id")
        == "msg_01EF3r8zYyZntM4Sg9a5kc6k"
@@ -82,11 +125,7 @@ def test_anthropic_prompt_caching_legacy(
    assert cache_creation_span.attributes["gen_ai.completion.0.role"] == "assistant"
    assert cache_read_span.attributes["gen_ai.completion.0.role"] == "assistant"

-   # assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1167
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 187
-
-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1167
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 202
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1167, 187, 202, 1163)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -150,11 +189,7 @@ def test_anthropic_prompt_caching_with_events_with_content(
    cache_creation_span = spans[0]
    cache_read_span = spans[1]

-   assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1167
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 187
-
-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1167
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 202
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1167, 187, 202, 1163)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -316,11 +351,7 @@ def test_anthropic_prompt_caching_with_events_with_no_content(
    cache_creation_span = spans[0]
    cache_read_span = spans[1]

-   assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1167
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 187
-
-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1167
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 202
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1167, 187, 202, 1163)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -426,11 +457,7 @@ async def test_anthropic_prompt_caching_async_legacy(
    assert cache_creation_span.attributes["gen_ai.completion.0.role"] == "assistant"
    assert cache_read_span.attributes["gen_ai.completion.0.role"] == "assistant"

-   assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 207
-
-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 224
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1169, 207, 224, 1165)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -495,11 +522,7 @@ async def test_anthropic_prompt_caching_async_with_events_with_content(
    cache_creation_span = spans[0]
    cache_read_span = spans[1]

-   assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 207
-
-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 224
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1169, 207, 224, 1165)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -667,11 +690,12 @@ async def test_anthropic_prompt_caching_async_with_events_with_no_content(
    cache_creation_span = spans[0]
    cache_read_span = spans[1]

-   assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 207
+   assert (
+       cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
+       == cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"]
+   )

-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 224
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1169, 207, 224, 1165)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -780,11 +804,7 @@ def test_anthropic_prompt_caching_stream_legacy(
    assert cache_creation_span.attributes["gen_ai.completion.0.role"] == "assistant"
    assert cache_read_span.attributes["gen_ai.completion.0.role"] == "assistant"

-   assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 202
-
-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 222
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1169, 202, 222, 1165)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -852,11 +872,7 @@ def test_anthropic_prompt_caching_stream_with_events_with_content(
    cache_creation_span = spans[0]
    cache_read_span = spans[1]

-   assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 202
-
-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 222
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1169, 202, 222, 1165)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -1029,11 +1045,7 @@ def test_anthropic_prompt_caching_stream_with_events_with_no_content(
    cache_creation_span = spans[0]
    cache_read_span = spans[1]

-   assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 202
-
-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 222
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1169, 202, 222, 1165)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -1142,11 +1154,7 @@ async def test_anthropic_prompt_caching_async_stream_legacy(
    assert cache_read_span.attributes["gen_ai.prompt.1.role"] == "user"
    assert text == cache_read_span.attributes["gen_ai.prompt.1.content"]

-   assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1171
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 290
-
-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1171
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 257
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1171, 290, 257, 1167)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -1215,11 +1223,7 @@ async def test_anthropic_prompt_caching_async_stream_with_events_with_content(
    cache_creation_span = spans[0]
    cache_read_span = spans[1]

-   assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1171
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 290
-
-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1171
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 257
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1171, 290, 257, 1167)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -1403,11 +1407,7 @@ async def test_anthropic_prompt_caching_async_stream_with_events_with_no_content
    cache_creation_span = spans[0]
    cache_read_span = spans[1]

-   assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1171
-   assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 290
-
-   assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1171
-   assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 257
+   _verify_caching_attributes(cache_creation_span, cache_read_span, 1171, 290, 257, 1167)

    # verify metrics
    metrics_data = reader.get_metrics_data()
@@ -4,7 +4,6 @@
from opentelemetry.semconv._incubating.attributes import (
    gen_ai_attributes as GenAIAttributes,
)
-from opentelemetry.semconv_ai import SpanAttributes


JOKE_SCHEMA = {
@@ -65,9 +64,9 @@ def test_anthropic_structured_outputs_legacy(
        == "assistant"
    )

-   assert SpanAttributes.LLM_REQUEST_STRUCTURED_OUTPUT_SCHEMA in anthropic_span.attributes
+   assert "gen_ai.request.structured_output_schema" in anthropic_span.attributes
    schema_attr = json.loads(
-       anthropic_span.attributes[SpanAttributes.LLM_REQUEST_STRUCTURED_OUTPUT_SCHEMA]
+       anthropic_span.attributes["gen_ai.request.structured_output_schema"]
    )
    assert "properties" in schema_attr
    assert "joke" in schema_attr["properties"]