grafana · sd2k · Feb 6, 2025 · Feb 6, 2025 · Feb 10, 2025 · Feb 10, 2025
@@ -21,8 +21,10 @@ mcp-grafana = "mcp_grafana.cli:app"
 
 [dependency-groups]
 dev = [
+    "httpx-sse>=0.4.0",
     "pytest>=8.3.4",
     "pytest-asyncio>=0.25.2",
+    "pytest-httpserver>=1.1.1",
 ]
 lint = [
     "ruff>=0.8.5",

@@ -1,7 +1,6 @@
 import enum
 from types import MethodType
 
-from mcp.server import FastMCP
 import typer
 
 from . import mcp
@@ -17,57 +16,12 @@ class Transport(enum.StrEnum):
 @app.command()
 def run(transport: Transport = Transport.stdio, header_auth: bool = False):
+    # Start the MCP server on the requested transport. The middleware
+    # patch below is applied only when the SSE transport is selected AND
+    # header_auth is set; every other combination runs the server as-is.
     if transport == Transport.sse and header_auth:
+        # Imported here rather than at module level; only this branch uses it.
+        from .middleware import run_sse_async_with_middleware
+
         # Monkeypatch the run_sse_async method to inject a Grafana middleware.
         # This is a bit of a hack, but fastmcp doesn't have a way of adding
         # middleware. It's not unreasonable to do this really, since fastmcp
         # is just a thin wrapper around the low level mcp server.
-        mcp.run_sse_async = MethodType(run_sse_async, mcp)
+        mcp.run_sse_async = MethodType(run_sse_async_with_middleware, mcp)
 
+    # The server's run method is given the enum member's string value.
     mcp.run(transport.value)
-
-
-async def run_sse_async(self: FastMCP) -> None:
-    """
-    Run the server using SSE transport, with a middleware that extracts
-    Grafana authentication information from the request headers.
-
-    The vast majority of this code is the same as the original run_sse_async
-    method (see https://github.com/modelcontextprotocol/python-sdk/blob/44c0004e6c69e336811bb6793b7176e1eda50015/src/mcp/server/fastmcp/server.py#L436-L468).
-    """
-
-    from mcp.server.sse import SseServerTransport
-    from starlette.applications import Starlette
-    from starlette.routing import Mount, Route
-    import uvicorn
-
-    from .middleware import GrafanaMiddleware
-
-    sse = SseServerTransport("/messages/")
-
-    async def handle_sse(request):
-        async with GrafanaMiddleware(request):
-            async with sse.connect_sse(
-                request.scope, request.receive, request._send
-            ) as streams:
-                await self._mcp_server.run(
-                    streams[0],
-                    streams[1],
-                    self._mcp_server.create_initialization_options(),
-                )
-
-    starlette_app = Starlette(
-        debug=self.settings.debug,
-        routes=[
-            Route("/sse", endpoint=handle_sse),
-            Mount("/messages/", app=sse.handle_post_message),
-        ],
-    )
-
-    config = uvicorn.Config(
-        starlette_app,
-        host=self.settings.host,
-        port=self.settings.port,
-        log_level=self.settings.log_level.lower(),
-    )
-    server = uvicorn.Server(config)
-    await server.serve()
@@ -1,5 +1,6 @@
 from dataclasses import dataclass
 
+from mcp.server import FastMCP
 from starlette.datastructures import Headers
 
 from .client import GrafanaClient, grafana_client
@@ -55,3 +56,48 @@ async def __aenter__(self):
     async def __aexit__(self, exc_type, exc_val, exc_tb):
+        # Reset grafana_settings using the stored token. A token of None
+        # means there is nothing to undo (presumably no override was applied
+        # on entry - confirm against __aenter__, which is not shown here).
         if self.token is not None:
             grafana_settings.reset(self.token)
+
+
+async def run_sse_async_with_middleware(self: FastMCP) -> None:
+    """
+    Serve this FastMCP instance over the SSE transport, with each SSE
+    connection wrapped in GrafanaMiddleware so that Grafana authentication
+    information is taken from the request headers.
+
+    Intended to be bound onto a FastMCP instance in place of its own
+    run_sse_async. The vast majority of this code is the same as that
+    original method (see https://github.com/modelcontextprotocol/python-sdk/blob/44c0004e6c69e336811bb6793b7176e1eda50015/src/mcp/server/fastmcp/server.py#L436-L468).
+    """
+
+    import uvicorn
+    from mcp.server.sse import SseServerTransport
+    from starlette.applications import Starlette
+    from starlette.routing import Mount, Route
+
+    transport = SseServerTransport("/messages/")
+
+    async def handle_sse(request):
+        # The middleware context stays open for as long as the SSE
+        # connection (and the MCP server loop running on it) is alive.
+        async with GrafanaMiddleware(request), transport.connect_sse(
+            request.scope, request.receive, request._send
+        ) as streams:
+            mcp_server = self._mcp_server
+            read_stream, write_stream = streams[0], streams[1]
+            await mcp_server.run(
+                read_stream,
+                write_stream,
+                mcp_server.create_initialization_options(),
+            )
+
+    # GET /sse opens the event stream; client messages are POSTed to
+    # the transport's handler mounted under /messages/.
+    routes = [
+        Route("/sse", endpoint=handle_sse),
+        Mount("/messages/", app=transport.handle_post_message),
+    ]
+    starlette_app = Starlette(debug=self.settings.debug, routes=routes)
+
+    server = uvicorn.Server(
+        uvicorn.Config(
+            starlette_app,
+            host=self.settings.host,
+            port=self.settings.port,
+            log_level=self.settings.log_level.lower(),
+        )
+    )
+    await server.serve()
@@ -0,0 +1,222 @@
+import asyncio
+import json
+from types import MethodType
+from typing import AsyncIterator
+
+import anyio
+import httpx
+from mcp.types import (
+    LATEST_PROTOCOL_VERSION,
+    CallToolResult,
+    ClientCapabilities,
+    ClientNotification,
+    Implementation,
+    InitializeRequest,
+    InitializeRequestParams,
+    InitializedNotification,
+    JSONRPCNotification,
+    JSONRPCRequest,
+    JSONRPCResponse,
+)
+import pytest
+from httpx_sse import aconnect_sse
+
+from mcp_grafana import mcp
+from mcp_grafana.middleware import run_sse_async_with_middleware
+
+from pytest_httpserver import HTTPServer
+
+
+class TestMiddleware:
+    """
+    Test that our injected starlette middleware extracts headers and
+    overrides settings per-request, as expected.
+
+    Also ensure that the contextvars do not leak across requests.
+    """
+
+    @staticmethod
+    async def _wait_until_listening(
+        host: str, port: int, timeout: float = 5.0
+    ) -> None:
+        """
+        Poll until a TCP connection to host:port succeeds.
+
+        Used instead of a fixed sleep so the test does not race a slow
+        server start. Raises TimeoutError if no connection could be made
+        within `timeout` seconds.
+        """
+        loop = asyncio.get_running_loop()
+        deadline = loop.time() + timeout
+        while True:
+            try:
+                _, writer = await asyncio.open_connection(host, port)
+            except OSError:
+                # Nothing is accepting connections yet.
+                if loop.time() >= deadline:
+                    raise TimeoutError(
+                        f"nothing listening on {host}:{port} after {timeout}s"
+                    )
+                await asyncio.sleep(0.05)
+            else:
+                writer.close()
+                await writer.wait_closed()
+                return
+
+    @pytest.mark.asyncio
+    async def test_multiple_requests(self):
+        """
+        Ensure that the contextvars do not leak across requests.
+
+        This is a bit of a tricky test, since we're not actually
+        testing the middleware itself, but rather the contextvars
+        that it uses.
+
+        We need to:
+            1. Start a couple of mock Grafana servers
+            2. Start our MCP server
+            3. Send a request to the MCP server pointing to the first
+               Grafana server (using the X-Grafana-Url header)
+            4. Send a different request to the MCP server pointing to
+               the second Grafana server (using the X-Grafana-Url header)
+            5. Ensure that the right request goes to the right server
+        """
+
+        # Start a couple of mock Grafana servers.
+        with HTTPServer(port=10000) as g1, HTTPServer(port=10001) as g2:
+            # Set up some responses from those servers.
+
+            g1.expect_oneshot_request("/api/datasources").respond_with_json([{"id": 1}])
+            g1.expect_oneshot_request(
+                "/api/plugins/grafana-incident-app/resources/api/IncidentsService.CreateIncident",
+                method="POST",
+                # TODO: add proper request body.
+            ).respond_with_json({})  # TODO: add response body
+
+            g2.expect_oneshot_request(
+                "/api/datasources/proxy/uid/foo/api/v1/label/__name__/values"
+            ).respond_with_json({
+                "status": "success",
+                "data": [
+                    "metric1",
+                    "metric2",
+                ],
+            })
+
+            # Hardcode a port for the MCP server.
+            mcp.settings.host = "127.0.0.1"
+            mcp.settings.port = 10002
+            base_url = f"http://{mcp.settings.host}:{mcp.settings.port}"
+
+            # Monkeypatch the MCP server to use our middleware.
+            mcp.run_sse_async = MethodType(run_sse_async_with_middleware, mcp)
+
+            # Create clients for each server.
+            # Note these clients send requests to the MCP server, not the Grafana server.
+            # The initial SSE request includes headers that tell the server which
+            # Grafana server to send tool requests to.
+            # Entering the clients as context managers guarantees they are
+            # closed, even when an assertion below fails. The task group is
+            # listed last so that it is torn down before the clients are.
+            async with (
+                httpx.AsyncClient(base_url=base_url) as g1_client,
+                httpx.AsyncClient(base_url=base_url) as g2_client,
+                anyio.create_task_group() as tg,
+            ):
+                tg.start_soon(mcp.run_sse_async, name="mcp")
+                # Wait for the server to start accepting connections.
+                await self._wait_until_listening(
+                    mcp.settings.host, mcp.settings.port
+                )
+
+                # Send SSE requests to the MCP server, one for each Grafana server.
+                # We can access tool call results over the SSE stream.
+                async with (
+                    aconnect_sse(
+                        g1_client,
+                        "GET",
+                        "/sse",
+                        headers={
+                            "X-Grafana-Url": f"http://{g1.host}:{g1.port}",
+                            "X-Grafana-Api-Key": "abcd123",
+                        },
+                    ) as g1_source,
+                    aconnect_sse(
+                        g2_client,
+                        "GET",
+                        "/sse",
+                        headers={
+                            "X-Grafana-Url": f"http://{g2.host}:{g2.port}",
+                            "X-Grafana-Api-Key": "efgh456",
+                        },
+                    ) as g2_source,
+                ):
+                    g1_iter = g1_source.aiter_sse()
+                    g2_iter = g2_source.aiter_sse()
+                    # The URL to use is in the first SSE message.
+                    g1_url = (await anext(g1_iter)).data
+                    g2_url = (await anext(g2_iter)).data
+
+                    # The MCP protocol requires us to send an initialize request
+                    # before we can send any other requests.
+                    await initialize(g1_client, g1_url, g1_iter)
+                    await initialize(g2_client, g2_url, g2_iter)
+
+                    # Send a tool call request using the first URL.
+                    resp = await g1_client.post(
+                        g1_url,
+                        json={
+                            "jsonrpc": "2.0",
+                            "id": 2,
+                            "method": "tools/call",
+                            "params": {"name": "list_datasources"},
+                        },
+                    )
+                    # Fail here, rather than hang on the stream read below,
+                    # if the server rejected the message.
+                    resp.raise_for_status()
+                    result = await jsonrpc_result(g1_iter)
+                    # This must have come from the first Grafana server.
+                    # NOTE(review): the decoded text is compared against an
+                    # indented JSON *string*, not a list. Presumably the tool
+                    # returns Grafana's raw body and the mock server emits
+                    # indent=4 JSON - confirm against both.
+                    assert json.loads(result.content[0].text) == json.dumps(  # type: ignore
+                        [{"id": 1}], indent=4
+                    )
+
+                    # Send a tool call request using the second URL.
+                    resp = await g2_client.post(
+                        g2_url,
+                        json={
+                            "jsonrpc": "2.0",
+                            "id": 2,
+                            "method": "tools/call",
+                            "params": {
+                                "name": "list_prometheus_metric_names",
+                                "arguments": {"datasource_uid": "foo", "regex": ".*"},
+                            },
+                        },
+                    )
+                    resp.raise_for_status()
+                    result = await jsonrpc_result(g2_iter)
+                    metrics = [x.text for x in result.content]  # type: ignore
+                    # This must have come from the second Grafana server.
+                    assert metrics == ["metric1", "metric2"]
+
+                # As ridiculous as it sounds, there is no way to stop the uvicorn
+                # server other than raising a signal (sigint or sigterm), which would
+                # also cause the test to fail. Instead, we just cancel the task group
+                # and let the test finish.
+                # The annoying part of this is that there are tons of extra logs emitted
+                # by uvicorn which can't be captured by pytest...
+                tg.cancel_scope.cancel()
+
+
+async def initialize(
+    client: httpx.AsyncClient, url: str, stream: AsyncIterator
+) -> None:
+    """
+    Handle the initialization handshake with the MCP server.
+
+    POSTs an `initialize` request and then a `notifications/initialized`
+    notification to `url`, and finally reads one event from `stream`,
+    asserting that it carries a JSON-RPC `result`.
+
+    Raises httpx.HTTPStatusError if either POST returns an error status.
+    """
+    init_request = InitializeRequest(
+        method="initialize",
+        params=InitializeRequestParams(
+            protocolVersion=LATEST_PROTOCOL_VERSION,
+            capabilities=ClientCapabilities(
+                sampling=None,
+                experimental=None,
+            ),
+            clientInfo=Implementation(name="mcp-grafana", version="0.1.2"),
+        ),
+    )
+    init_envelope = JSONRPCRequest(
+        jsonrpc="2.0",
+        id=1,
+        **init_request.model_dump(by_alias=True, mode="json"),
+    )
+    resp = await client.post(url, json=init_envelope.model_dump(by_alias=True))
+    resp.raise_for_status()
+
+    initialized = ClientNotification(
+        InitializedNotification(method="notifications/initialized")
+    )
+    initialized_envelope = JSONRPCNotification(
+        jsonrpc="2.0",
+        **initialized.model_dump(by_alias=True, mode="json"),
+    )
+    resp = await client.post(
+        url, json=initialized_envelope.model_dump(by_alias=True)
+    )
+    # Check this POST as well, so a rejected notification fails here
+    # instead of surfacing later as a confusing stream error.
+    resp.raise_for_status()
+
+    # Consume the stream to ensure that the initialization handshake
+    # is complete.
+    sse = await anext(stream)
+    data = json.loads(sse.data)
+    assert "result" in data
+
+
+async def jsonrpc_result(stream: AsyncIterator) -> CallToolResult:
+    """
+    Read the next event from the SSE stream and return the tool-call
+    result it carries.
+
+    The event data is validated as a JSON-RPC response, and that
+    response's `result` is validated as a CallToolResult.
+    """
+    event = await anext(stream)
+    response = JSONRPCResponse.model_validate_json(event.data)
+    return CallToolResult.model_validate(response.result)