AndyMik90 · Rex-Arnab · Feb 18, 2026 · Feb 18, 2026 · Feb 18, 2026 · Feb 18, 2026
diff --git a/apps/backend/agents/session.py b/apps/backend/agents/session.py
@@ -648,6 +648,27 @@ async def run_agent_session(
 
                         current_tool = None
 
+            # Handle rate_limit_event SystemMessage from sdk_patches
+            elif (
+                msg_type == "SystemMessage"
+                and getattr(msg, "subtype", None) == "rate_limit_event"
+            ):
+                debug(
+                    "session",
+                    "Rate limit event received — Claude Code is paused, stream remains open",
+                )
+                print(
+                    "[Rate limit] Claude Code is waiting for rate limit reset...",
+                    flush=True,
+                )
+                if task_logger:
+                    task_logger.log(
+                        "Rate limit reached — waiting for reset (stream remains open)",
+                        LogEntryType.INFO,
+                        phase,
+                        print_to_console=False,
+                    )
+
         print("\n" + "-" * 70 + "\n")
 
         # Check if build is complete

diff --git a/apps/backend/core/error_utils.py b/apps/backend/core/error_utils.py
@@ -56,6 +56,7 @@ def is_rate_limit_error(error: Exception) -> bool:
         for p in [
             "limit reached",
             "rate limit",
+            "rate_limit",  # Catches "Unknown message type: rate_limit_event" from claude_agent_sdk
             "too many requests",
             "usage limit",
             "quota exceeded",

diff --git a/apps/backend/core/sdk_patches.py b/apps/backend/core/sdk_patches.py
@@ -0,0 +1,56 @@
+"""Runtime patches for third-party SDK bugs."""
+
+import logging
+
+logger = logging.getLogger(__name__)
+
+
+def apply_claude_agent_sdk_patches() -> None:
+    """Patch claude_agent_sdk to handle rate_limit_event gracefully.
+
+    The bundled SDK raises MessageParseError for unknown message types including
+    rate_limit_event. This patch returns a SystemMessage instead of raising,
+    allowing the message loop in session.py to handle it and keep the stream open
+    while Claude Code waits for the rate limit to reset.
+
+    Patches both:
+    - message_parser.parse_message (the module attribute)
+    - _internal.client.parse_message (the already-bound module-level name that
+      the client's receive_response() generator actually calls via
+      `from .message_parser import parse_message` at import time)
+
+    Idempotent — safe to call multiple times from different entry points.
+    """
+    try:
+        from claude_agent_sdk._internal import client as _ic
+        from claude_agent_sdk._internal import message_parser as _mp
+        from claude_agent_sdk.types import SystemMessage as _SystemMessage
+
+        if getattr(_mp, "_rate_limit_patched", False):
+            logger.debug("claude_agent_sdk already patched — skipping")
+            return
+
+        _orig_parse = _mp.parse_message
+
+        def _patched_parse(data: dict) -> object:
+            if isinstance(data, dict) and data.get("type") == "rate_limit_event":
+                logger.warning(
+                    "Rate limit event received from Claude Code — "
+                    "returning as SystemMessage so the stream stays open: %s",
+                    data,
+                )
+                return _SystemMessage(subtype="rate_limit_event", data=data)
+            return _orig_parse(data)
+
+        _patched_parse.__wrapped__ = _orig_parse  # type: ignore[attr-defined]
+
+        _mp.parse_message = _patched_parse
+        _ic.parse_message = _patched_parse
+        _mp._rate_limit_patched = True  # type: ignore[attr-defined]
+        logger.debug("claude_agent_sdk patched to handle rate_limit_event")
+    except Exception:
+        logger.warning(
+            "Failed to apply claude_agent_sdk rate_limit_event patch — "
+            "rate limit events may cause unexpected session failures",
+            exc_info=True,
+        )
diff --git a/apps/backend/run.py b/apps/backend/run.py
@@ -70,6 +70,11 @@
     if "_new_stream" in dir():
         del _new_stream
 
+from core.sdk_patches import apply_claude_agent_sdk_patches  # pragma: no cover
+
+apply_claude_agent_sdk_patches()  # pragma: no cover
+
+
 # Validate platform-specific dependencies BEFORE any imports that might
 # trigger graphiti_core -> real_ladybug -> pywintypes import chain (ACS-253)
 from core.dependency_validator import validate_platform_dependencies

diff --git a/apps/backend/runners/github/runner.py b/apps/backend/runners/github/runner.py
@@ -62,6 +62,10 @@
 
 validate_platform_dependencies()
 
+from core.sdk_patches import apply_claude_agent_sdk_patches  # pragma: no cover
+
+apply_claude_agent_sdk_patches()  # pragma: no cover
+
 # Load .env file with centralized error handling
 from cli.utils import import_dotenv
 

diff --git a/apps/backend/runners/gitlab/runner.py b/apps/backend/runners/gitlab/runner.py
@@ -32,6 +32,10 @@
 
 validate_platform_dependencies()
 
+from core.sdk_patches import apply_claude_agent_sdk_patches  # pragma: no cover
+
+apply_claude_agent_sdk_patches()  # pragma: no cover
+
 # Load .env file with centralized error handling
 from cli.utils import import_dotenv
 

diff --git a/apps/backend/runners/ideation_runner.py b/apps/backend/runners/ideation_runner.py
@@ -32,6 +32,10 @@
 
 validate_platform_dependencies()
 
+from core.sdk_patches import apply_claude_agent_sdk_patches  # pragma: no cover
+
+apply_claude_agent_sdk_patches()  # pragma: no cover
+
 # Load .env file with centralized error handling
 from cli.utils import import_dotenv
 

diff --git a/apps/backend/runners/insights_runner.py b/apps/backend/runners/insights_runner.py
@@ -21,6 +21,10 @@
 
 validate_platform_dependencies()
 
+from core.sdk_patches import apply_claude_agent_sdk_patches  # pragma: no cover
+
+apply_claude_agent_sdk_patches()  # pragma: no cover
+
 # Load .env file with centralized error handling
 from cli.utils import import_dotenv
 

diff --git a/apps/backend/runners/roadmap_runner.py b/apps/backend/runners/roadmap_runner.py
@@ -27,6 +27,10 @@
 
 validate_platform_dependencies()
 
+from core.sdk_patches import apply_claude_agent_sdk_patches  # pragma: no cover
+
+apply_claude_agent_sdk_patches()  # pragma: no cover
+
 # Load .env file with centralized error handling
 from cli.utils import import_dotenv
 

diff --git a/apps/backend/runners/spec_runner.py b/apps/backend/runners/spec_runner.py
@@ -83,6 +83,11 @@
 # Add auto-claude to path (parent of runners/)
 sys.path.insert(0, str(Path(__file__).parent.parent))
 
+
+from core.sdk_patches import apply_claude_agent_sdk_patches  # pragma: no cover
+
+apply_claude_agent_sdk_patches()  # pragma: no cover
+
 # Validate platform-specific dependencies BEFORE any imports that might
 # trigger graphiti_core -> real_ladybug -> pywintypes import chain (ACS-253)
 from core.dependency_validator import validate_platform_dependencies

diff --git a/tests/test_sdk_patches.py b/tests/test_sdk_patches.py
@@ -0,0 +1,212 @@
+#!/usr/bin/env python3
+"""
+Tests for core.sdk_patches
+============================
+
+Covers:
+- apply_claude_agent_sdk_patches() happy path
+- Idempotency guard (no double-wrapping)
+- rate_limit_event returns SystemMessage
+- Other unknown message types still raise
+- Graceful failure when SDK internals are unavailable
+"""
+
+import sys
+
+# Ensure backend is on the path
+from pathlib import Path
+from unittest.mock import MagicMock, patch
+
+import pytest
+
+sys.path.insert(0, str(Path(__file__).parent.parent / "apps" / "backend"))
+
+
+# ---------------------------------------------------------------------------
+# Helpers
+# ---------------------------------------------------------------------------
+
+
+def _make_sdk_mocks():
+    """Build a minimal fake claude_agent_sdk module tree."""
+
+    class _FakeMessageParseError(Exception):
+        pass
+
+    class _FakeSystemMessage:
+        def __init__(self, subtype: str, data: dict):
+            self.subtype = subtype
+            self.data = data
+
+    def _real_parse(data):
+        msg_type = data.get("type") if isinstance(data, dict) else None
+        if msg_type == "rate_limit_event":
+            raise _FakeMessageParseError(f"Unknown message type: {msg_type}")
+        if msg_type == "assistant":
+            return MagicMock(type="assistant")
+        raise _FakeMessageParseError(f"Unknown message type: {msg_type}")
+
+    # Build fake module objects
+    mp_mod = MagicMock()
+    mp_mod.parse_message = _real_parse
+    del mp_mod._rate_limit_patched  # ensure sentinel absent at start
+
+    ic_mod = MagicMock()
+    ic_mod.parse_message = _real_parse
+
+    types_mod = MagicMock()
+    types_mod.SystemMessage = _FakeSystemMessage
+
+    sdk_mod = MagicMock()
+
+    internal_mod = MagicMock()
+    internal_mod.message_parser = mp_mod
+    internal_mod.client = ic_mod
+
+    return sdk_mod, internal_mod, mp_mod, ic_mod, types_mod, _FakeMessageParseError
+
+
+# ---------------------------------------------------------------------------
+# Fixtures
+# ---------------------------------------------------------------------------
+
+
+@pytest.fixture(autouse=True)
+def _clean_patch_sentinel():
+    """Remove any leftover _rate_limit_patched sentinel between tests."""
+    yield
+    # Remove sdk_patches from sys.modules so each test gets a fresh import
+    sys.modules.pop("core.sdk_patches", None)
+
+
+# ---------------------------------------------------------------------------
+# Tests for apply_claude_agent_sdk_patches
+# ---------------------------------------------------------------------------
+
+
+class TestApplyClaudeAgentSdkPatches:
+    def _build_modules(self):
+        sdk, internal, mp, ic, types, err = _make_sdk_mocks()
+        modules = {
+            "claude_agent_sdk": sdk,
+            "claude_agent_sdk._internal": internal,
+            "claude_agent_sdk._internal.message_parser": mp,
+            "claude_agent_sdk._internal.client": ic,
+            "claude_agent_sdk.types": types,
+        }
+        return modules, mp, ic, types, err
+
+    def test_patches_both_call_sites(self):
+        """parse_message is replaced on both _mp and _ic after patching."""
+        modules, mp, ic, types, _ = self._build_modules()
+        original = mp.parse_message
+
+        with patch.dict(sys.modules, modules):
+            from core.sdk_patches import apply_claude_agent_sdk_patches
+
+            apply_claude_agent_sdk_patches()
+
+        assert mp.parse_message is not original
+        assert ic.parse_message is not original
+        assert mp.parse_message is ic.parse_message
+
+    def test_rate_limit_event_returns_system_message(self):
+        """rate_limit_event data is converted to a SystemMessage without raising."""
+        modules, mp, ic, types, _ = self._build_modules()
+
+        with patch.dict(sys.modules, modules):
+            from core.sdk_patches import apply_claude_agent_sdk_patches
+
+            apply_claude_agent_sdk_patches()
+
+        result = ic.parse_message({"type": "rate_limit_event", "retry_after": 30})
+        assert type(result).__name__ == "_FakeSystemMessage"
+        assert result.subtype == "rate_limit_event"
+
+    def test_other_unknown_types_still_raise(self):
+        """Non-rate-limit unknown message types still propagate MessageParseError."""
+        modules, mp, ic, types, FakeErr = self._build_modules()
+
+        with patch.dict(sys.modules, modules):
+            from core.sdk_patches import apply_claude_agent_sdk_patches
+
+            apply_claude_agent_sdk_patches()
+
+        with pytest.raises(FakeErr, match="Unknown message type: totally_unknown"):
+            ic.parse_message({"type": "totally_unknown"})
+
+    def test_valid_messages_pass_through(self):
+        """Known message types are delegated to the original parser unchanged."""
+        modules, mp, ic, types, _ = self._build_modules()
+
+        with patch.dict(sys.modules, modules):
+            from core.sdk_patches import apply_claude_agent_sdk_patches
+
+            apply_claude_agent_sdk_patches()
+
+        result = ic.parse_message({"type": "assistant"})
+        assert result is not None
+
+    def test_idempotent_second_call_skips_rewrap(self):
+        """Calling apply_claude_agent_sdk_patches twice does not double-wrap."""
+        modules, mp, ic, types, _ = self._build_modules()
+
+        with patch.dict(sys.modules, modules):
+            from core.sdk_patches import apply_claude_agent_sdk_patches
+
+            apply_claude_agent_sdk_patches()
+            patched_once = ic.parse_message
+            apply_claude_agent_sdk_patches()
+            patched_twice = ic.parse_message
+
+        assert patched_once is patched_twice
+
+    def test_sets_rate_limit_patched_sentinel(self):
+        """_rate_limit_patched sentinel is set on the message_parser module."""
+        modules, mp, ic, types, _ = self._build_modules()
+
+        with patch.dict(sys.modules, modules):
+            from core.sdk_patches import apply_claude_agent_sdk_patches
+
+            apply_claude_agent_sdk_patches()
+
+        assert getattr(mp, "_rate_limit_patched", False) is True
+
+    def test_wrapped_attribute_preserves_original(self):
+        """__wrapped__ on the patched function points to the original parser."""
+        modules, mp, ic, types, _ = self._build_modules()
+        original = mp.parse_message
+
+        with patch.dict(sys.modules, modules):
+            from core.sdk_patches import apply_claude_agent_sdk_patches
+
+            apply_claude_agent_sdk_patches()
+
+        assert mp.parse_message.__wrapped__ is original
+
+    def test_graceful_failure_when_sdk_unavailable(self, caplog):
+        """Patch fails silently with a warning when the SDK is not installed."""
+        import logging
+
+        broken = {"claude_agent_sdk._internal": None}
+        with patch.dict(sys.modules, broken):
+            sys.modules.pop("core.sdk_patches", None)
+            with caplog.at_level(logging.WARNING, logger="core.sdk_patches"):
+                from core.sdk_patches import apply_claude_agent_sdk_patches
+
+                apply_claude_agent_sdk_patches()
+
+        assert any("Failed to apply" in r.message for r in caplog.records)
+
+    def test_non_dict_data_passes_to_original(self):
+        """Non-dict data skips the rate_limit check and goes to original parser."""
+        modules, mp, ic, types, FakeErr = self._build_modules()
+
+        with patch.dict(sys.modules, modules):
+            from core.sdk_patches import apply_claude_agent_sdk_patches
+
+            apply_claude_agent_sdk_patches()
+
+        # Original parser raises for non-dict / unknown input
+        with pytest.raises(FakeErr):
+            ic.parse_message("not-a-dict")