fix(instrumentation): updated GenAI token usage attributes #3138

Open · wants to merge 13 commits into main
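This PR migrates the instrumentation's token usage span attributes from the legacy names `gen_ai.usage.prompt_tokens` and `gen_ai.usage.completion_tokens` to the current OpenTelemetry GenAI semantic-convention names `gen_ai.usage.input_tokens` and `gen_ai.usage.output_tokens`; the diffs below update the test assertions accordingly. As a minimal sketch (not part of this PR) of what the rename means for span consumers, the hypothetical helper below reads usage under the new names first and falls back to the legacy ones:

    from typing import Mapping, Optional


    def _first_present(attrs: Mapping[str, int], *keys: str) -> Optional[int]:
        # Return the value for the first key present in attrs, else None.
        for key in keys:
            if key in attrs:
                return attrs[key]
        return None


    def get_token_usage(attrs: Mapping[str, int]) -> dict:
        # Prefer the new semconv names; fall back to the legacy ones.
        return {
            "input_tokens": _first_present(
                attrs, "gen_ai.usage.input_tokens", "gen_ai.usage.prompt_tokens"
            ),
            "output_tokens": _first_present(
                attrs, "gen_ai.usage.output_tokens", "gen_ai.usage.completion_tokens"
            ),
            "total_tokens": attrs.get("llm.usage.total_tokens"),
        }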
@@ -35,12 +35,12 @@ def test_alephalpha_completion(
         together_span.attributes.get("gen_ai.completion.0.content")
         == response.completions[0].completion
     )
-    assert together_span.attributes.get("gen_ai.usage.prompt_tokens") == 9
+    assert together_span.attributes.get("gen_ai.usage.input_tokens") == 9
     assert together_span.attributes.get(
         "llm.usage.total_tokens"
     ) == together_span.attributes.get(
-        "gen_ai.usage.completion_tokens"
-    ) + together_span.attributes.get("gen_ai.usage.prompt_tokens")
+        "gen_ai.usage.output_tokens"
+    ) + together_span.attributes.get("gen_ai.usage.input_tokens")

     logs = log_exporter.get_finished_logs()
     assert (
@@ -66,12 +66,12 @@ def test_alephalpha_completion_with_events_with_content(
     assert together_span.attributes.get("gen_ai.system") == "AlephAlpha"
     assert together_span.attributes.get("llm.request.type") == "completion"
     assert together_span.attributes.get("gen_ai.request.model") == "luminous-base"
-    assert together_span.attributes.get("gen_ai.usage.prompt_tokens") == 9
+    assert together_span.attributes.get("gen_ai.usage.input_tokens") == 9
     assert together_span.attributes.get(
         "llm.usage.total_tokens"
     ) == together_span.attributes.get(
-        "gen_ai.usage.completion_tokens"
-    ) + together_span.attributes.get("gen_ai.usage.prompt_tokens")
+        "gen_ai.usage.output_tokens"
+    ) + together_span.attributes.get("gen_ai.usage.input_tokens")

     logs = log_exporter.get_finished_logs()
     assert len(logs) == 2
@@ -116,12 +116,12 @@ def test_alephalpha_completion_with_events_with_no_content(
     assert together_span.attributes.get("gen_ai.system") == "AlephAlpha"
     assert together_span.attributes.get("llm.request.type") == "completion"
     assert together_span.attributes.get("gen_ai.request.model") == "luminous-base"
-    assert together_span.attributes.get("gen_ai.usage.prompt_tokens") == 9
+    assert together_span.attributes.get("gen_ai.usage.input_tokens") == 9
     assert together_span.attributes.get(
         "llm.usage.total_tokens"
     ) == together_span.attributes.get(
-        "gen_ai.usage.completion_tokens"
-    ) + together_span.attributes.get("gen_ai.usage.prompt_tokens")
+        "gen_ai.usage.output_tokens"
+    ) + together_span.attributes.get("gen_ai.usage.input_tokens")

     logs = log_exporter.get_finished_logs()
     assert len(logs) == 2
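The invariant these AlephAlpha tests assert is that the legacy `llm.usage.total_tokens` attribute equals the sum of the renamed input and output counts. A self-contained sketch of that check follows; only the input count of 9 is fixed by the cassette above, and the output and total values are assumed for illustration:

    def total_is_consistent(attrs: dict) -> bool:
        # llm.usage.total_tokens must equal input + output under the new names.
        return attrs["llm.usage.total_tokens"] == (
            attrs["gen_ai.usage.input_tokens"] + attrs["gen_ai.usage.output_tokens"]
        )


    # Illustrative values: 9 input tokens per the fixture; output count assumed.
    assert total_is_consistent(
        {
            "gen_ai.usage.input_tokens": 9,
            "gen_ai.usage.output_tokens": 3,
            "llm.usage.total_tokens": 12,
        }
    )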
@@ -1291,10 +1291,10 @@ def test_anthropic_tools_legacy(
     anthropic_span = spans[0]

     # verify usage
-    assert anthropic_span.attributes["gen_ai.usage.prompt_tokens"] == 514
+    assert anthropic_span.attributes["gen_ai.usage.input_tokens"] == 514
     assert (
-        anthropic_span.attributes["gen_ai.usage.completion_tokens"]
-        + anthropic_span.attributes["gen_ai.usage.prompt_tokens"]
+        anthropic_span.attributes["gen_ai.usage.output_tokens"]
+        + anthropic_span.attributes["gen_ai.usage.input_tokens"]
         == anthropic_span.attributes["llm.usage.total_tokens"]
     )

@@ -1466,10 +1466,10 @@ def test_anthropic_tools_with_events_with_content(
     anthropic_span = spans[0]

     # verify usage
-    assert anthropic_span.attributes["gen_ai.usage.prompt_tokens"] == 514
+    assert anthropic_span.attributes["gen_ai.usage.input_tokens"] == 514
     assert (
-        anthropic_span.attributes["gen_ai.usage.completion_tokens"]
-        + anthropic_span.attributes["gen_ai.usage.prompt_tokens"]
+        anthropic_span.attributes["gen_ai.usage.output_tokens"]
+        + anthropic_span.attributes["gen_ai.usage.input_tokens"]
         == anthropic_span.attributes["llm.usage.total_tokens"]
     )

@@ -1602,10 +1602,10 @@ def test_anthropic_tools_with_events_with_no_content(
     anthropic_span = spans[0]

     # verify usage
-    assert anthropic_span.attributes["gen_ai.usage.prompt_tokens"] == 514
+    assert anthropic_span.attributes["gen_ai.usage.input_tokens"] == 514
    assert (
-        anthropic_span.attributes["gen_ai.usage.completion_tokens"]
-        + anthropic_span.attributes["gen_ai.usage.prompt_tokens"]
+        anthropic_span.attributes["gen_ai.usage.output_tokens"]
+        + anthropic_span.attributes["gen_ai.usage.input_tokens"]
         == anthropic_span.attributes["llm.usage.total_tokens"]
     )

@@ -99,17 +99,17 @@ def test_anthropic_prompt_caching_legacy(
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1163
     )
-    # assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1167
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 187
+    # assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1167
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 187

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1163
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1167
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 202
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1167
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 202

     # verify metrics
     metrics_data = reader.get_metrics_data()
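In these caching fixtures the reported input-token count (1167) exceeds the cache-creation count (1163) by the handful of uncached tokens, which suggests the instrumentation reports a combined input figure. A hypothetical sketch of that arithmetic, under that assumption (the split of 4 uncached tokens is inferred, not asserted by the test):

    # Assumption: gen_ai.usage.input_tokens folds the cached portion in with
    # the uncached remainder (1163 + 4 == 1167 for this cassette).
    cache_creation_input_tokens = 1163
    uncached_input_tokens = 4  # assumed remainder for this cassette
    reported_input_tokens = cache_creation_input_tokens + uncached_input_tokens
    assert reported_input_tokens == 1167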
@@ -189,17 +189,17 @@ def test_anthropic_prompt_caching_with_events_with_content(
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1163
     )
-    assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1167
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 187
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1167
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 187

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1163
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1167
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 202
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1167
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 202

     # verify metrics
     metrics_data = reader.get_metrics_data()
@@ -377,17 +377,17 @@ def test_anthropic_prompt_caching_with_events_with_no_content(
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1163
     )
-    assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1167
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 187
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1167
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 187

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1163
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1167
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 202
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1167
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 202

     # verify metrics
     metrics_data = reader.get_metrics_data()
@@ -507,17 +507,17 @@ async def test_anthropic_prompt_caching_async_legacy(
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1165
     )
-    assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 207
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 207

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1165
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 224
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 224

     # verify metrics
     metrics_data = reader.get_metrics_data()
@@ -598,17 +598,17 @@ async def test_anthropic_prompt_caching_async_with_events_with_content(
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1165
     )
-    assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 207
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 207

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1165
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 224
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 224

     # verify metrics
     metrics_data = reader.get_metrics_data()
@@ -792,17 +792,17 @@ async def test_anthropic_prompt_caching_async_with_events_with_no_content(
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1165
     )
-    assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 207
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 207

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1165
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 224
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 224

     # verify metrics
     metrics_data = reader.get_metrics_data()
@@ -925,17 +925,17 @@ def test_anthropic_prompt_caching_stream_legacy(
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1165
     )
-    assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 202
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 202

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1165
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 222
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 222

     # verify metrics
     metrics_data = reader.get_metrics_data()
@@ -1019,17 +1019,17 @@ def test_anthropic_prompt_caching_stream_with_events_with_content(
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1165
     )
-    assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 202
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 202

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1165
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 222
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 222

     # verify metrics
     metrics_data = reader.get_metrics_data()
@@ -1218,17 +1218,17 @@ def test_anthropic_prompt_caching_stream_with_events_with_no_content(
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1165
     )
-    assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 202
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 202

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1165
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1169
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 222
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1169
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 222

     # verify metrics
     metrics_data = reader.get_metrics_data()
@@ -1352,17 +1352,17 @@ async def test_anthropic_prompt_caching_async_stream_legacy(
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1167
     )
-    assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1171
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 290
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1171
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 290

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1167
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1171
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 257
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1171
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 257

     # verify metrics
     metrics_data = reader.get_metrics_data()
@@ -1447,17 +1447,17 @@ async def test_anthropic_prompt_caching_async_stream_with_events_with_content(
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1167
     )
-    assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1171
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 290
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1171
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 290

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1167
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1171
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 257
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1171
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 257

     # verify metrics
     metrics_data = reader.get_metrics_data()
@@ -1657,17 +1657,17 @@ async def test_anthropic_prompt_caching_async_stream_with_events_with_no_content
         cache_creation_span.attributes["gen_ai.usage.cache_creation_input_tokens"]
         == 1167
     )
-    assert cache_creation_span.attributes["gen_ai.usage.prompt_tokens"] == 1171
-    assert cache_creation_span.attributes["gen_ai.usage.completion_tokens"] == 290
+    assert cache_creation_span.attributes["gen_ai.usage.input_tokens"] == 1171
+    assert cache_creation_span.attributes["gen_ai.usage.output_tokens"] == 290

     # first check that cache_read_span only read from the cache and did not write to it
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] != 0
     assert cache_read_span.attributes["gen_ai.usage.cache_creation_input_tokens"] == 0

     # then check for exact figures for the fixture/cassette
     assert cache_read_span.attributes["gen_ai.usage.cache_read_input_tokens"] == 1167
-    assert cache_read_span.attributes["gen_ai.usage.prompt_tokens"] == 1171
-    assert cache_read_span.attributes["gen_ai.usage.completion_tokens"] == 257
+    assert cache_read_span.attributes["gen_ai.usage.input_tokens"] == 1171
+    assert cache_read_span.attributes["gen_ai.usage.output_tokens"] == 257

     # verify metrics
     metrics_data = reader.get_metrics_data()