modelcontextprotocol
diff --git a/src/mcp/server/streamable_http.py b/src/mcp/server/streamable_http.py
Lines changed: 2 additions & 2 deletions
diff --git a/tests/interaction/README.md b/tests/interaction/README.md
Lines changed: 12 additions & 3 deletions
diff --git a/tests/interaction/_requirements.py b/tests/interaction/_requirements.py
Lines changed: 839 additions & 191 deletions
diff --git a/tests/interaction/auth/test_as_handlers.py b/tests/interaction/auth/test_as_handlers.py
Lines changed: 6 additions & 5 deletions
diff --git a/tests/interaction/auth/test_lifecycle.py b/tests/interaction/auth/test_lifecycle.py
Lines changed: 24 additions & 16 deletions
diff --git a/tests/interaction/conftest.py b/tests/interaction/conftest.py
Lines changed: 6 additions & 5 deletions
diff --git a/tests/interaction/lowlevel/test_cancellation.py b/tests/interaction/lowlevel/test_cancellation.py
Lines changed: 126 additions & 5 deletions
@@ -686,7 +686,7 @@ async def _handle_get_request(self, request: Request, send: Send) -> None:
             "Content-Type": CONTENT_TYPE_SSE,
         }
 
-        if self.mcp_session_id:  # pragma: no branch
+        if self.mcp_session_id:
             headers[MCP_SESSION_ID_HEADER] = self.mcp_session_id
 
         # Check if we already have an active GET stream
@@ -750,7 +750,7 @@ async def standalone_sse_writer():
     async def _handle_delete_request(self, request: Request, send: Send) -> None:
         """Handle DELETE requests for explicit session termination."""
         # Validate session ID
-        if not self.mcp_session_id:  # pragma: no cover
+        if not self.mcp_session_id:
             # If no session ID set, return Method Not Allowed
             response = self._create_error_response(
                 "Method Not Allowed: Session termination not supported",
 
@@ -118,6 +118,13 @@ be exercised by at least one test, every deferred requirement by none, and an un
 import time. A behaviour without a manifest entry cannot be silently half-tested, and a manifest
 entry without a test cannot be silently aspirational.
 
+Coverage is enforced per matrix cell as well: every (transport, spec version) cell that a
+requirement's own grid admits must appear among the cells of at least one test covering it. A
+version- or transport-bounded mark stacked onto a shared test therefore cannot silently strip
+cells — a whole era, a whole transport — from the other requirements that test covers. A covering
+test that does not use the `connect` fixture counts for every admitted cell: it runs
+unparametrized, so no stacked mark can strip anything from it.
+
 ### The divergence lifecycle
 
 1. A test reveals that the SDK does not do what the spec says. The test pins what the SDK
@@ -143,9 +150,11 @@ exercises. `SPEC_BASE_URL` (and `SPEC_2026_BASE_URL`) are pinned literals — no
 `SPEC_VERSIONS` — so growing the active axis never repoints existing `source` links. The
 `connect` fixture fans out over `CONNECTABLE_TRANSPORTS × SPEC_VERSIONS`, but the grid is
 filtered per test:
-`pytest_generate_tests` reads the test's stacked `@requirement` marks and calls `compute_cells()`,
-which intersects the admissible cells across every cited requirement — a cell survives only if
-**all** of the test's requirements admit it.
+`pytest_generate_tests` reads the test's stacked `@requirement` marks and calls `cells_for_test()`
+(a thin wrapper over `compute_cells()`), which intersects the admissible cells across every cited
+requirement — a cell survives only if **all** of the test's requirements admit it. A stack whose
+intersection is empty fails collection: a `connect` test that can never run on any cell is a
+manifest contradiction, not a skip.
 
 `streamable-http-stateless` is the fourth connectable transport: the 2025-era unofficial stateless
 mode where each request opens a fresh transport, no session id is issued, and there is no standalone
 
@@ -308,11 +308,12 @@ async def test_register_echoes_native_for_a_client_that_registered_application_t
     """A client registering `application_type: "web"` is told `"native"` in the registration echo.
 
     Pins the known gap recorded on the requirement (divergence): the registration handler's
-    field-by-field passthrough omits `application_type`, so the model default fills the echo
-    where RFC 7591 §3.2.1 requires the registered value -- and the SDK OAuth client adopts the
-    echo into persisted storage, so the corruption is client-visible end to end. When the
-    one-line passthrough fix lands this test fails: re-pin the echo to `"web"`, delete the
-    Divergence, and add the echo assertion to
+    field-by-field passthrough omits `application_type`, so the model default replaces the
+    submitted value in the stored record and the echo alike. That is wire-legal under RFC 7591
+    (a server may replace requested metadata values), but here it is an accident of the field
+    list rather than a policy. The SDK OAuth client adopts the echo into persisted storage, so
+    the corruption is client-visible end to end. When the one-line passthrough fix lands, this
+    test fails: re-pin the echo to `"web"`, delete the Divergence, and add the echo assertion to
     `test_dcr_sends_a_consumer_set_application_type_verbatim` (test_flow.py) per the
     requirement's note.
     """
 
@@ -175,14 +175,14 @@ async def test_a_refresh_response_without_a_refresh_token_preserves_the_stored_o
     """A refresh response that omits `refresh_token` leaves the stored one in place.
 
     RFC 6749 §6 lets the authorization server omit `refresh_token` from a refresh response, in
-    which case the client keeps the one it holds; the 2026 Refresh Tokens section (SEP-2207)
-    restates this as "MUST NOT assume refresh tokens will be issued". The provider models the
-    non-rotating AS: its refresh response carries only a new access token (`exclude_none`
-    serialization keeps the key genuinely absent from the wire) and the presented token stays
-    valid server-side. The preserved token alone could pass vacuously if the refresh response
-    were dropped entirely, so the adopted `expires_in` (the first token's was -3600) proves it
-    was not, and the single authorize/register pair proves the omission was treated as normal
-    rather than triggering a re-authorization.
+    which case the client keeps the one it holds. The 2026 Refresh Tokens section (SEP-2207)
+    states the same discipline for issuance generally: "MUST NOT assume refresh tokens will be
+    issued". The provider models the non-rotating AS: its refresh response carries only a new
+    access token (`exclude_none` serialization keeps the key genuinely absent from the wire) and
+    the presented token stays valid server-side. The preserved token alone could pass vacuously
+    if the refresh response were dropped entirely, so the adopted `expires_in` (the first
+    token's was -3600) proves it was not, and the single authorize/register pair proves the
+    omission was treated as normal rather than triggering a re-authorization.
     """
     recorded, on_request = record_requests()
     provider = InMemoryAuthorizationServerProvider(issue_expired_first=True, rotate_refresh_tokens=False)
@@ -260,8 +260,10 @@ async def test_a_403_step_up_re_authorizes_with_the_union_of_prior_and_challenge
     """The step-up re-authorize requests the union of the previously requested and challenged scopes.
 
     The first authorization requests `mcp`; the 403 challenges a disjoint `write` (not naming
-    `mcp`). Per SEP-2350 the client must re-authorize with `mcp write`, not drop `mcp`. The client
-    is pre-registered with both scopes so the server's authorize handler accepts the wider request.
+    `mcp`). The client re-authorizes with `mcp write`, not dropping `mcp` -- the SEP-2350 union,
+    spec-mandated at 2026-07-28; on this legacy flow it is the SDK's own choice anticipating that
+    mandate. The client is pre-registered with both scopes so the server's authorize handler
+    accepts the wider request.
     """
     provider = InMemoryAuthorizationServerProvider()
     storage = InMemoryTokenStorage(client_info=seeded_client(provider, scope="mcp write"))
@@ -325,11 +327,14 @@ async def test_tokens_from_the_previous_authorization_server_are_never_replayed_
 
     Choreography twin of the as-binding discard test above, pinning the token half of the same
     SEP-2352 branch: storage carries both an old-issuer client registration and that server's
-    tokens. The stale access token is presented once to the resource server (reload treats it
-    as live), the 401 triggers the binding check, and the discard drops tokens together with
-    the credentials -- so the stale refresh token reaches no endpoint of the new authorization
-    server and the only token exchange is the fresh authorization-code grant. The requirement's
-    note carries the refresh-ordering hazard this test is the regression net for.
+    tokens, with the access token seeded already expired. Reload loses the expiry clock, so the
+    stale access token is presented once to the resource server, the 401 triggers the binding
+    check, and the discard drops tokens together with the credentials -- the stale refresh token
+    reaches no endpoint of the new authorization server and the only token exchange is the fresh
+    authorization-code grant. The expired seed arms the net for a fix that re-anchors the expiry
+    clock at reload: the pre-discovery refresh branch then engages in this exact scenario, and
+    the replay sweep fails unless the discard still runs ahead of any refresh attempt. The
+    requirement's note carries the refresh-ordering hazard in full.
     """
     recorded, on_request = record_requests()
     provider = InMemoryAuthorizationServerProvider()
@@ -349,7 +354,10 @@ async def test_tokens_from_the_previous_authorization_server_are_never_replayed_
     storage.tokens = OAuthToken(
         access_token="stale-access-token",
         token_type="Bearer",
-        expires_in=3600,
+        # Seeded already expired: today reload loses the expiry clock and treats the token as
+        # live; if a fix re-anchors it, this seed drives the pre-discovery refresh branch --
+        # the ordering hazard the replay sweep below must catch.
+        expires_in=-3600,
         scope="mcp",
         refresh_token="stale-refresh-token",
     )
 
@@ -2,8 +2,9 @@
 
 The ``connect`` fixture is parametrized per-test from the ``@requirement`` marks the test
 carries: ``pytest_generate_tests`` looks up each cited requirement in the manifest and computes
-the (transport, spec_version) cells via :func:`compute_cells`, applying arm exclusions, version
-bounds, and known-failure xfails declaratively.
+the (transport, spec_version) cells via :func:`cells_for_test`, applying arm exclusions, version
+bounds, and known-failure xfails declaratively. A test whose stacked requirements intersect to
+zero cells fails collection instead of silently skipping.
 """
 
 from functools import partial
@@ -17,7 +18,7 @@
     connect_over_streamable_http,
     connect_over_streamable_http_stateless,
 )
-from tests.interaction._requirements import REQUIREMENTS, compute_cells
+from tests.interaction._requirements import cells_for_test
 
 _FACTORIES: dict[str, Connect] = {
     "in-memory": connect_in_memory,
@@ -31,8 +32,8 @@ def pytest_generate_tests(metafunc: pytest.Metafunc) -> None:
     """Parametrize ``connect`` from the test's stacked ``@requirement`` marks."""
     if "connect" not in metafunc.fixturenames:
         return
-    requirements = [REQUIREMENTS[mark.args[0]] for mark in metafunc.definition.iter_markers("requirement")]
-    metafunc.parametrize("connect", compute_cells(requirements), indirect=True)
+    requirement_ids = [mark.args[0] for mark in metafunc.definition.iter_markers("requirement")]
+    metafunc.parametrize("connect", cells_for_test(metafunc.definition.nodeid, requirement_ids), indirect=True)
 
 
 @pytest.fixture
 
@@ -1,9 +1,11 @@
 """Cancellation interactions against the low-level Server, driven through the public Client API.
 
-There is no client-side cancellation API: cancelling means sending a CancelledNotification
-carrying the request id, which only the server-side handler can observe (`ctx.request_id`), so
-these tests capture the id from inside the blocked handler before cancelling. The handler blocks
-on an Event rather than a sleep, and every wait is bounded by `anyio.fail_after`.
+Client-side cancellation is cancelling the caller's scope around an in-flight call; the
+dispatcher then sends the courtesy notifications/cancelled. The receiving-side tests instead
+drive the wire act directly -- sending a CancelledNotification carrying the request id, which
+only the server-side handler can observe (`ctx.request_id`) -- so they capture the id from
+inside the blocked handler before cancelling. Handlers block on an Event rather than a sleep,
+and every wait is bounded by `anyio.fail_after`.
 """
 
 import anyio
@@ -27,16 +29,64 @@
 
 from mcp import MCPError
 from mcp.client import ClientRequestContext, ClientSession
+from mcp.client._memory import InMemoryTransport
+from mcp.client.client import Client
 from mcp.server import Server, ServerRequestContext
 from mcp.shared.memory import MessageStream, create_client_server_memory_streams
 from mcp.shared.message import SessionMessage
 from tests.interaction._connect import Connect
-from tests.interaction._helpers import IncomingMessage
+from tests.interaction._helpers import IncomingMessage, RecordingTransport
 from tests.interaction._requirements import requirement
 
 pytestmark = pytest.mark.anyio
 
 
+@requirement("protocol:cancel:abort-signal")
+async def test_cancelling_the_callers_scope_sends_cancelled_and_abandons_the_call() -> None:
+    """Cancelling the scope around an in-flight call sends notifications/cancelled and the call never returns.
+
+    Spec-mandated (cancellation flow): the sender of a cancelled request issues
+    notifications/cancelled referencing its id. Legacy-era act: at 2026-07-28 the wire act splits
+    by transport (see the manifest entry's note). The wire is observed at the recording-transport
+    seam; the reason string is the SDK's own deliberate output.
+    """
+    handler_started = anyio.Event()
+
+    async def call_tool(ctx: ServerRequestContext, params: types.CallToolRequestParams) -> CallToolResult:
+        assert params.name == "block"
+        handler_started.set()
+        await anyio.Event().wait()  # blocks until the courtesy cancellation interrupts it
+        raise NotImplementedError  # unreachable: the wait above never completes normally
+
+    server = Server("blocker", on_call_tool=call_tool)
+    recording = RecordingTransport(InMemoryTransport(server))
+
+    async with Client(recording, mode="legacy") as client:
+        with anyio.fail_after(5):
+            async with anyio.create_task_group() as task_group:  # pragma: no branch
+
+                async def call() -> None:
+                    await client.call_tool("block", {})
+                    raise NotImplementedError  # unreachable: the surrounding scope is cancelled mid-flight
+
+                task_group.start_soon(call)
+                await handler_started.wait()
+                task_group.cancel_scope.cancel()
+
+    (call_request,) = [
+        item.message
+        for item in recording.sent
+        if isinstance(item.message, JSONRPCRequest) and item.message.method == "tools/call"
+    ]
+    (cancellation,) = [
+        item.message
+        for item in recording.sent
+        if isinstance(item.message, JSONRPCNotification) and item.message.method == "notifications/cancelled"
+    ]
+    assert cancellation.params == snapshot({"requestId": 2, "reason": "caller cancelled"})
+    assert cancellation.params is not None and cancellation.params["requestId"] == call_request.id
+
+
 @requirement("protocol:cancel:in-flight")
 @requirement("protocol:cancel:handler-abort-propagates")
 async def test_cancellation_stops_in_flight_handler(connect: Connect) -> None:
@@ -87,6 +137,77 @@ async def call_and_capture_error() -> None:
     assert errors == snapshot([ErrorData(code=0, message="Request cancelled")])
 
 
+@requirement("protocol:cancel:in-flight")
+async def test_client_answers_a_cancelled_server_initiated_request_with_the_code_zero_error(connect: Connect) -> None:
+    """The client answers a cancelled server-initiated request with the code-0 error.
+
+    Cancelling interrupts the client's callback; the answer is the client half of the divergence
+    on this requirement (the spec says the receiver should not respond at all). The server cancels
+    its own sampling request while still awaiting it, so the answer is observed as the awaited
+    call's failure. One fail_after bounds the exchange, so a silent client is a failed test, not a hang.
+    """
+    callback_started = anyio.Event()
+    callback_cancelled = anyio.Event()
+    client_request_ids: list[types.RequestId] = []
+    errors: list[ErrorData] = []
+
+    async def sampling_callback(
+        context: ClientRequestContext, params: types.CreateMessageRequestParams
+    ) -> types.CreateMessageResult:
+        client_request_ids.append(context.request_id)
+        callback_started.set()
+        try:
+            await anyio.Event().wait()  # blocks until the cancellation interrupts it
+        except anyio.get_cancelled_exc_class():
+            callback_cancelled.set()
+            raise
+        raise NotImplementedError  # unreachable
+
+    async def list_tools(
+        ctx: ServerRequestContext, params: types.PaginatedRequestParams | None
+    ) -> types.ListToolsResult:
+        return types.ListToolsResult(tools=[types.Tool(name="canceller", input_schema={"type": "object"})])
+
+    async def call_tool(ctx: ServerRequestContext, params: types.CallToolRequestParams) -> CallToolResult:
+        assert params.name == "canceller"
+        request = types.CreateMessageRequest(
+            params=types.CreateMessageRequestParams(
+                messages=[types.SamplingMessage(role="user", content=TextContent(text="Say hello."))],
+                max_tokens=8,
+            )
+        )
+        with anyio.fail_after(5):
+            async with anyio.create_task_group() as task_group:
+
+                async def sample_and_capture_error() -> None:
+                    with pytest.raises(MCPError) as exc_info:
+                        await ctx.session.send_request(request, types.CreateMessageResult)
+                    errors.append(exc_info.value.error)
+
+                task_group.start_soon(sample_and_capture_error)
+                await callback_started.wait()
+                await ctx.session.send_notification(
+                    types.CancelledNotification(
+                        params=types.CancelledNotificationParams(
+                            request_id=client_request_ids[0], reason="user aborted"
+                        )
+                    ),
+                    related_request_id=ctx.request_id,
+                )
+            # The join above completes only when the client's answer arrives; the enclosing
+            # fail_after turns a silent client into a TimeoutError -- a failed test, not a hang.
+            await callback_cancelled.wait()
+        return CallToolResult(content=[TextContent(text="cancelled")])
+
+    server = Server("canceller", on_list_tools=list_tools, on_call_tool=call_tool)
+
+    async with connect(server, sampling_callback=sampling_callback) as client:
+        result = await client.call_tool("canceller", {})
+
+    assert result == snapshot(CallToolResult(content=[TextContent(text="cancelled")]))
+    assert errors == snapshot([ErrorData(code=0, message="Request cancelled")])
+
+
 @requirement("protocol:cancel:no-further-notifications")
 async def test_no_notifications_for_a_request_arrive_after_its_cancellation(connect: Connect) -> None:
     """After a request is cancelled, no further notifications for it reach the wire (spec-mandated).