microsoft · joshimai · Apr 12, 2024 · Mar 26, 2024 · Mar 27, 2024 · Mar 28, 2024
diff --git a/pccommon/pccommon/middleware.py b/pccommon/pccommon/middleware.py
@@ -1,96 +1,123 @@
 import asyncio
 import logging
 import time
-from typing import Awaitable, Callable
+from functools import wraps
+from typing import Any, Callable
 
 from fastapi import HTTPException, Request, Response
 from fastapi.applications import FastAPI
-from starlette.middleware.base import BaseHTTPMiddleware
-from starlette.responses import PlainTextResponse
+from fastapi.dependencies.utils import (
+    get_body_field,
+    get_dependant,
+    get_parameterless_sub_dependant,
+)
+from fastapi.responses import PlainTextResponse
+from fastapi.routing import APIRoute, request_response
 from starlette.status import HTTP_504_GATEWAY_TIMEOUT
-from starlette.types import Message
+from starlette.types import ASGIApp, Receive, Scope, Send
 
 from pccommon.logging import get_custom_dimensions
 from pccommon.tracing import trace_request
 
 logger = logging.getLogger(__name__)
 
 
-async def handle_exceptions(
-    request: Request,
-    call_next: Callable[[Request], Awaitable[Response]],
-) -> Response:
-    try:
-        return await call_next(request)
-    except HTTPException:
+async def http_exception_handler(request: Request, exc: Exception) -> Any:
+    """Log an exception raised while handling a request, then re-raise it.
+
+    Every exception is logged once with its traceback. An HTTPException is
+    then re-raised as-is; any other exception is logged a second time with
+    the request's custom dimensions (the exception text is attached as
+    ``stackTrace``) before being re-raised. No response is ever returned.
+
+    NOTE(review): the bare ``raise`` statements only work while an exception
+    is actively being handled, so this presumably has to be invoked from
+    inside an ``except`` block -- confirm against how it is registered.
+    """
+    # Always log the exception together with its traceback
+    logger.exception("Exception when handling request", exc_info=exc)
+    # HTTPExceptions are propagated unchanged
+    if isinstance(exc, HTTPException):
         raise
-    except Exception as e:
+    # Anything else is logged again with request dimensions, then propagated
+    else:
         logger.exception(
             "Exception when handling request",
-            extra=get_custom_dimensions({"stackTrace": f"{e}"}, request),
+            extra=get_custom_dimensions({"stackTrace": f"{exc}"}, request),
         )
         raise
 
 
-class RequestTracingMiddleware(BaseHTTPMiddleware):
-    """Custom middleware to use opencensus request traces
-
-    Middleware implementations that access a Request object directly
-    will cause subsequent middleware or route handlers to hang. See
-
-    https://github.com/tiangolo/fastapi/issues/394
-
-    for more details on this implementation.
-
-    An alternative approach is to use dependencies on the APIRouter, but
-    the stac-fast api implementation makes that difficult without having
-    to override much of the app initialization.
-    """
-
-    def __init__(self, app: FastAPI, service_name: str):
-        super().__init__(app)
+def with_timeout(
+    timeout_seconds: float,
+) -> Callable[[Callable[..., Any]], Callable[..., Any]]:
+    """Build a decorator that caps the run time of a coroutine function.
+
+    The decorated coroutine is awaited under ``asyncio.wait_for``. If it does
+    not finish within ``timeout_seconds`` the timeout is logged together with
+    the elapsed time and a plain-text 504 response is returned instead of the
+    coroutine's result. Callables that are not coroutine functions are
+    returned unchanged, i.e. they get no timeout.
+
+    Args:
+        timeout_seconds: Maximum time, in seconds, the wrapped coroutine may
+            run before it is cancelled by ``asyncio.wait_for``.
+
+    Returns:
+        A decorator taking the callable to wrap.
+    """
+
+    def with_timeout_(func: Callable[..., Any]) -> Callable[..., Any]:
+        # Only coroutine functions can be awaited under asyncio.wait_for;
+        # anything else is handed back untouched.
+        if not asyncio.iscoroutinefunction(func):
+            return func
+
+        logger.debug("Adding timeout to function %s", func.__name__)
+
+        @wraps(func)
+        async def inner(*args: Any, **kwargs: Any) -> Any:
+            start_time = time.monotonic()
+            try:
+                return await asyncio.wait_for(
+                    func(*args, **kwargs), timeout=timeout_seconds
+                )
+            except asyncio.TimeoutError as e:
+                process_time = time.monotonic() - start_time
+                # don't have a request object here to get custom dimensions,
+                # so there is no ref_id to surface in the response either.
+                logger.exception(
+                    "Request timeout %s",
+                    e,
+                    extra={"request_time": process_time},
+                )
+
+                return PlainTextResponse(
+                    "The request exceeded the maximum allowed time, please"
+                    " try again. If the issue persists, please contact "
+                    "[email protected]."
+                    "\n\n",
+                    status_code=HTTP_504_GATEWAY_TIMEOUT,
+                )
+
+        return inner
+
+    return with_timeout_
+
+
+def add_timeout(app: FastAPI, timeout_seconds: float) -> None:
+    """Apply ``with_timeout`` to every APIRoute currently registered on *app*.
+
+    Only routes present in ``app.router.routes`` at call time are touched, and
+    only those that are ``APIRoute`` instances. After an endpoint is swapped
+    for its wrapped version, the route's dependant, body field and ASGI app
+    are rebuilt from the new endpoint.
+
+    Args:
+        app: Application whose routes are modified in place.
+        timeout_seconds: Timeout, in seconds, handed to ``with_timeout``.
+    """
+    apply_timeout = with_timeout(timeout_seconds)
+
+    for route in app.router.routes:
+        if not isinstance(route, APIRoute):
+            continue
+
+        route.endpoint = apply_timeout(route.endpoint)
+
+        # Recompute the dependency tree for the wrapped endpoint.
+        route.dependant = get_dependant(path=route.path_format, call=route.endpoint)
+        # Walk the route-level dependencies back to front, inserting each at
+        # index 0, so they end up ahead of the endpoint's own dependencies in
+        # their original order.
+        for depends in reversed(route.dependencies):
+            sub_dependant = get_parameterless_sub_dependant(
+                depends=depends, path=route.path_format
+            )
+            route.dependant.dependencies.insert(0, sub_dependant)
+
+        route.body_field = get_body_field(
+            dependant=route.dependant, name=route.unique_id
+        )
+        route.app = request_response(route.get_route_handler())
+
+
+class TraceMiddleware:
+    """ASGI middleware that runs HTTP requests through ``trace_request``.
+
+    Scopes whose type is not ``"http"`` are forwarded to the wrapped app
+    without any tracing.
+    """
+
+    def __init__(self, app: ASGIApp, service_name: str):
+        self.app = app
         self.service_name = service_name
 
-    async def set_body(self, request: Request) -> None:
-        receive_ = await request._receive()
-
-        async def receive() -> Message:
-            return receive_
-
-        request._receive = receive
+    async def __call__(self, scope: Scope, receive: Receive, send: Send) -> None:
+        """Trace HTTP requests; pass every other scope type straight through."""
+        if scope["type"] == "http":
+            request: Request = Request(scope, receive)
 
-    async def dispatch(
-        self, request: Request, call_next: Callable[[Request], Awaitable[Response]]
-    ) -> Response:
-        await self.set_body(request)
-        response = await trace_request(self.service_name, request, call_next)
-        return response
+            async def call_next(request: Request) -> Response:
+                # Create a response object to mimic trace_requests call_next
+                # argument
+                # NOTE(review): the wrapped app writes the real response via
+                # `send`; the object returned here is a blank placeholder, so
+                # trace_request presumably cannot observe the real status
+                # code -- confirm.
+                response = Response()
+                await self.app(scope, receive, send)
+                return response
 
+            await trace_request(self.service_name, request, call_next)
 
-async def timeout_middleware(
-    request: Request,
-    call_next: Callable[[Request], Awaitable[Response]],
-    timeout: int,
-) -> Response:
-    try:
-        start_time = time.time()
-        return await asyncio.wait_for(call_next(request), timeout=timeout)
-
-    except asyncio.TimeoutError:
-        process_time = time.time() - start_time
-        log_dimensions = get_custom_dimensions({"request_time": process_time}, request)
-
-        logger.exception(
-            "Request timeout",
-            extra=log_dimensions,
-        )
-
-        ref_id = log_dimensions["custom_dimensions"].get("ref_id")
-        debug_msg = f"Debug information for support: {ref_id}" if ref_id else ""
-
-        return PlainTextResponse(
-            f"The request exceeded the maximum allowed time, please try again."
-            " If the issue persists, please contact [email protected]."
-            f"\n\n{debug_msg}",
-            status_code=HTTP_504_GATEWAY_TIMEOUT,
-        )
+        else:
+            await self.app(scope, receive, send)
diff --git a/pccommon/pccommon/tracing.py b/pccommon/pccommon/tracing.py
@@ -3,11 +3,13 @@
 import re
 from typing import Awaitable, Callable, List, Optional, Tuple, Union, cast
 
+import fastapi
 from fastapi import Request, Response
 from opencensus.ext.azure.trace_exporter import AzureExporter
 from opencensus.trace.samplers import ProbabilitySampler
 from opencensus.trace.span import SpanKind
 from opencensus.trace.tracer import Tracer
+from starlette.datastructures import QueryParams
 
 from pccommon.config import get_apis_config
 from pccommon.constants import (
@@ -249,3 +251,63 @@ def _iter_cql(cql: dict, property_name: str) -> Optional[Union[str, List[str]]]:
                             return result
     # No collection was found
     return None
+
+
+def add_stac_attributes_from_search(search_json: str, request: fastapi.Request) -> None:
+    """
+    Record the collection and item ids of a search request on a trace span.
+
+    The JSON search body is decoded and handed, together with the request's
+    method and query parameters, to ``parse_collection_from_search``. A new
+    tracer then opens a span named "main". When ``request.state.parent_span``
+    exists and is not None it is replaced by that span, and the collection id
+    (plus the item id, if any) is attached as span attributes. Otherwise a
+    warning is logged and nothing is attached.
+    """
+    search_body = json.loads(search_json)
+    collection_id, item_id = parse_collection_from_search(
+        search_body, request.method, request.query_params
+    )
+    tracer = Tracer(exporter=exporter, sampler=ProbabilitySampler(1.0))
+
+    with tracer.span("main") as span:
+        # A missing attribute and an explicit None are treated the same way.
+        if getattr(request.state, "parent_span", None) is None:
+            logger.warning("No 'parent_span' attribute found in request.state")
+            return
+
+        request.state.parent_span = span
+
+        # The item id is only recorded alongside a collection id.
+        if collection_id is None:
+            return
+
+        tracer.add_attribute_to_current_span(
+            attribute_key="collection", attribute_value=collection_id
+        )
+        if item_id is not None:
+            tracer.add_attribute_to_current_span(
+                attribute_key="item", attribute_value=item_id
+            )
+
+
+def parse_collection_from_search(
+    body: dict,
+    method: str,
+    query_params: QueryParams,
+) -> Tuple[Optional[str], Optional[str]]:
+    """
+    Parse the collection and item ids from a search request.
+
+    The search endpoint is a bit of a special case. If it's a GET, the collection
+    and item ids are in the querystring. If it's a POST, the collection and item may
+    be in either a CQL-JSON or CQL2-JSON filter body, or a query/stac-ql body.
+
+    The method is compared case-insensitively. Returns a
+    ``(collection_id, item_id)`` tuple; either element may be None, and both
+    are None for any other method or for a POST body that has neither a
+    "collections" nor a "filter" key.
+    """
+    http_method = method.lower()
+
+    if http_method == "get":
+        return (query_params.get("collections"), query_params.get("ids"))
+
+    if http_method == "post":
+        try:
+            if "collections" in body:
+                return _parse_queryjson(body)
+            if "filter" in body:
+                return _parse_cqljson(body["filter"])
+        except json.JSONDecodeError as e:
+            # NOTE(review): `body` arrives here already decoded, so this
+            # handler looks unreachable unless the _parse_* helpers decode
+            # JSON themselves -- confirm before removing.
+            logger.warning(
+                "Unable to parse search body as JSON. Ignoring collection "
+                f"parameter. {e}"
+            )
+
+    return (None, None)
diff --git a/pccommon/tests/test_timeouts.py b/pccommon/tests/test_timeouts.py
@@ -1,14 +1,14 @@
 import asyncio
-import random
-from typing import Awaitable, Callable
+from typing import Any
 
 import pytest
-from fastapi import FastAPI, Request, Response
-from fastapi.responses import PlainTextResponse
+from fastapi import FastAPI
+
+# from fastapi.responses import PlainTextResponse
 from httpx import AsyncClient
-from starlette.status import HTTP_200_OK, HTTP_504_GATEWAY_TIMEOUT
+from starlette.status import HTTP_504_GATEWAY_TIMEOUT
 
-from pccommon.middleware import timeout_middleware
+from pccommon.middleware import add_timeout
 
 TIMEOUT_SECONDS = 2
 BASE_URL = "http://test"
@@ -20,80 +20,22 @@
 app.state.service_name = "test"
 
 
-@app.middleware("http")
-async def _timeout_middleware(
-    request: Request, call_next: Callable[[Request], Awaitable[Response]]
-) -> Response:
-    """Add a timeout to all requests."""
-    return await timeout_middleware(request, call_next, timeout=TIMEOUT_SECONDS)
-
-
-# Test endpoint to sleep for a configurable amount of time, which may exceed the
-# timeout middleware setting
-@app.get("/sleep", response_class=PlainTextResponse)
-async def route_for_test(t: int) -> str:
-    await asyncio.sleep(t)
-    return "Done"
-
-
-# Test endpoint to sleep and confirm that the task is cancelled after the timeout
-@app.get("/cancel", response_class=PlainTextResponse)
-async def route_for_cancel_test(t: int) -> str:
-    for i in range(t):
-        await asyncio.sleep(1)
-        if i > TIMEOUT_SECONDS:
-            raise Exception("Task should have been cancelled")
-
-    return "Done"
-
-
-# Test middleware
-# ===============
-
-
-async def success_response(client: AsyncClient, timeout: int) -> None:
-    print("making request")
-    response = await client.get("/sleep", params={"t": timeout})
-    assert response.status_code == HTTP_200_OK
-    assert response.text == "Done"
+@app.get("/asleep")
+async def asleep() -> Any:
+    """Test route: sleep for one second, then answer with an empty object."""
+    nap_seconds = 1
+    await asyncio.sleep(nap_seconds)
+    empty_payload: dict = {}
+    return empty_payload
 
 
-async def timeout_response(client: AsyncClient, timeout: int) -> None:
-    response = await client.get("/sleep", params={"t": timeout})
-    assert response.status_code == HTTP_504_GATEWAY_TIMEOUT
-
-
-@pytest.mark.asyncio
-async def test_timeout() -> None:
-    async with AsyncClient(app=app, base_url=BASE_URL) as client:
-        await timeout_response(client, 10)
-
+# add_timeout only wraps routes that already exist, so call it after registering them
 
-@pytest.mark.asyncio
-async def test_no_timeout() -> None:
-    async with AsyncClient(app=app, base_url=BASE_URL) as client:
-        await success_response(client, 1)
+add_timeout(app, timeout_seconds=0.001)
 
 
 @pytest.mark.asyncio
-async def test_multiple_requests() -> None:
-    async with AsyncClient(app=app, base_url=BASE_URL) as client:
-        timeout_tasks = []
-        for _ in range(100):
-            t = TIMEOUT_SECONDS + random.randint(1, 10)
-            timeout_tasks.append(asyncio.ensure_future(timeout_response(client, t)))
-
-        await asyncio.gather(*timeout_tasks)
-
-        success_tasks = []
-        for _ in range(100):
-            t = TIMEOUT_SECONDS - 1
-            success_tasks.append(asyncio.ensure_future(success_response(client, t)))
+async def test_add_timeout() -> None:
+    """A route slower than the configured timeout must answer with a 504."""
 
-        await asyncio.gather(*success_tasks)
+    # Use the client as a context manager so it is always closed, even when
+    # the request raises.
+    async with AsyncClient(app=app, base_url=BASE_URL) as client:
+        response = await client.get("/asleep")
 
 
-@pytest.mark.asyncio
-async def test_request_cancelled() -> None:
-    async with AsyncClient(app=app, base_url=BASE_URL) as client:
-        await client.get("/cancel", params={"t": 10})
+    assert response.status_code == HTTP_504_GATEWAY_TIMEOUT