modelcontextprotocol · Kludex · Jun 25, 2026 · Jun 25, 2026 · Jun 25, 2026 · cubic-dev-ai
diff --git a/src/mcp/server/_otel.py b/src/mcp/server/_otel.py
@@ -59,8 +59,12 @@ async def __call__(self, ctx: ServerRequestContext[Any, Any], call_next: CallNex
                 span.set_status(StatusCode.ERROR, str(e))
                 raise
             if ctx.method == "tools/call":
+                # Tool errors are detected pre-serialization, so only shapes that reach the wire as an error
+                # count: the model, or the camelCase alias (`is_error` is dropped by the alias-only wire
+                # validation). A raw-dict `isError` is matched only as the literal `True`: coercible non-bool
+                # values (1, "true") would serialize to an error, but are rare enough to leave undetected.
                 match result:
-                    case CallToolResult(is_error=True) | {"isError": True} | {"is_error": True}:
+                    case CallToolResult(is_error=True) | {"isError": True}:
                         span.set_attribute("error.type", "tool_error")
                         span.set_status(StatusCode.ERROR)
                     case _:

diff --git a/tests/server/test_otel.py b/tests/server/test_otel.py
@@ -92,19 +92,22 @@ async def err_tool(ctx: Ctx, params: CallToolRequestParams) -> CallToolResult:
 
 
 @pytest.mark.anyio
-async def test_tool_error_snake_case_dict_result_sets_error_type(server: SrvT, spans: SpanCapture):
+async def test_snake_case_dict_result_is_not_a_tool_error(server: SrvT, spans: SpanCapture):
+    # The wire format accepts only the camelCase alias, so serialization drops `is_error`; the
+    # result reaches the client as a success and the span must not contradict that.
     async def err_tool(ctx: Ctx, params: CallToolRequestParams) -> dict[str, Any]:
         return {"content": [], "is_error": True}
 
     server.add_request_handler("tools/call", CallToolRequestParams, err_tool)
     server.middleware.append(OpenTelemetryMiddleware())
     async with connected_runner(server) as (client, _):
         spans.clear()
-        await client.send_raw_request("tools/call", {"name": "mytool", "arguments": {}})
+        result = await client.send_raw_request("tools/call", {"name": "mytool", "arguments": {}})
+    assert result == {"content": []}
     [span] = [s for s in spans.finished() if s.kind == SpanKind.SERVER]
     assert span.attributes is not None
-    assert span.attributes["error.type"] == "tool_error"
-    assert span.status.status_code == StatusCode.ERROR
+    assert "error.type" not in span.attributes
+    assert span.status.status_code == StatusCode.UNSET
 
 
 @pytest.mark.anyio