"""Regression tests for Gateway lifespan shutdown. These tests guard the invariant that lifespan shutdown is *bounded*: a misbehaving channel whose ``stop()`` blocks forever must not keep the uvicorn worker alive. A hung worker is the precondition for the signal-reentrancy deadlock described in ``app.gateway.app._SHUTDOWN_HOOK_TIMEOUT_SECONDS``. """ from __future__ import annotations import asyncio from contextlib import asynccontextmanager from unittest.mock import MagicMock, patch from fastapi import FastAPI @asynccontextmanager async def _noop_langgraph_runtime(_app): yield async def _run_lifespan_with_hanging_stop() -> float: """Drive the lifespan context with stop_channel_service hanging forever. Returns the elapsed wall-clock seconds. """ from app.gateway.app import _SHUTDOWN_HOOK_TIMEOUT_SECONDS, lifespan async def hang_forever() -> None: await asyncio.sleep(3600) app = FastAPI() fake_service = MagicMock() fake_service.get_status = MagicMock(return_value={}) async def fake_start(): return fake_service with ( patch("app.gateway.app.get_app_config"), patch("app.gateway.app.get_gateway_config", return_value=MagicMock(host="x", port=0)), patch("app.gateway.app.langgraph_runtime", _noop_langgraph_runtime), patch("app.channels.service.start_channel_service", side_effect=fake_start), patch("app.channels.service.stop_channel_service", side_effect=hang_forever), ): loop = asyncio.get_event_loop() start = loop.time() async with lifespan(app): pass elapsed = loop.time() - start assert _SHUTDOWN_HOOK_TIMEOUT_SECONDS < 30.0, "Timeout constant must stay modest" return elapsed def test_shutdown_is_bounded_when_channel_stop_hangs(): """Lifespan exit must complete near the configured timeout, not hang.""" from app.gateway.app import _SHUTDOWN_HOOK_TIMEOUT_SECONDS elapsed = asyncio.run(_run_lifespan_with_hanging_stop()) # Generous upper bound: timeout + 2s slack for scheduling overhead. assert elapsed < _SHUTDOWN_HOOK_TIMEOUT_SECONDS + 2.0, f"Lifespan shutdown took {elapsed:.2f}s; expected <= {_SHUTDOWN_HOOK_TIMEOUT_SECONDS + 2.0:.1f}s" # Lower bound: the wait_for should actually have waited. assert elapsed >= _SHUTDOWN_HOOK_TIMEOUT_SECONDS - 0.5, f"Lifespan exited too quickly ({elapsed:.2f}s); wait_for may not have been invoked."