matdev83
diff --git a/‎AGENTS.md‎
Lines changed: 1 addition & 0 deletions b/‎AGENTS.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎dev/scripts/demo_gemini_api_key_loading_fix.py‎
Lines changed: 3 additions & 3 deletions b/‎dev/scripts/demo_gemini_api_key_loading_fix.py‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎dev/scripts/run_pycycle.py‎
Lines changed: 108 additions & 0 deletions b/‎dev/scripts/run_pycycle.py‎
Lines changed: 108 additions & 0 deletions
diff --git a/‎pyproject.toml‎
Lines changed: 11 additions & 0 deletions b/‎pyproject.toml‎
Lines changed: 11 additions & 0 deletions
diff --git a/‎src/connectors/openai_codex/codex_quota_notifications.py‎
Lines changed: 10 additions & 1 deletion b/‎src/connectors/openai_codex/codex_quota_notifications.py‎
Lines changed: 10 additions & 1 deletion
diff --git a/‎src/connectors/openai_codex/credentials.py‎
Lines changed: 14 additions & 2 deletions b/‎src/connectors/openai_codex/credentials.py‎
Lines changed: 14 additions & 2 deletions
diff --git a/‎src/connectors/openai_codex/managed_oauth_models.py‎
Lines changed: 2 additions & 1 deletion b/‎src/connectors/openai_codex/managed_oauth_models.py‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎src/connectors/openai_codex/managed_oauth_selector.py‎
Lines changed: 14 additions & 1 deletion b/‎src/connectors/openai_codex/managed_oauth_selector.py‎
Lines changed: 14 additions & 1 deletion
diff --git a/‎src/connectors/openai_codex/payload.py‎
Lines changed: 6 additions & 70 deletions b/‎src/connectors/openai_codex/payload.py‎
Lines changed: 6 additions & 70 deletions
@@ -84,6 +84,7 @@ When working on specs, the user will invoke `/kiro:*` commands. Follow the instr
 | **Lint/Fix** | `./.venv/Scripts/python.exe -m ruff check --fix .` |
 | **Format** | `./.venv/Scripts/python.exe -m black .` |
 | **Boundary Type Check** | `./.venv/Scripts/python.exe dev/scripts/check_boundary_types.py` |
+| **Circular import scan (pycycle)** | `./.venv/Scripts/python.exe dev/scripts/run_pycycle.py` |
 | **Inspect CBOR wire captures** | `./.venv/Scripts/python.exe scripts/inspect_cbor_capture.py <file> --detect-issues` |
 
 ## Quality & Testing Standards
 
@@ -153,7 +153,7 @@ def demo_full_integration(monkeypatch) -> None:
             return_value=["gemini"],
         ),
         patch(
-            "src.core.config.models.backends.backend_registry.get_registered_backends",
+            "src.core.services.backend_registry.backend_registry.get_registered_backends",
             return_value=["gemini"],
         ),
     ):
@@ -232,7 +232,7 @@ def demo_single_base_key_only(monkeypatch) -> None:
             return_value=["gemini"],
         ),
         patch(
-            "src.core.config.models.backends.backend_registry.get_registered_backends",
+            "src.core.services.backend_registry.backend_registry.get_registered_backends",
             return_value=["gemini"],
         ),
     ):
@@ -271,7 +271,7 @@ def demo_single_numbered_key_only(monkeypatch) -> None:
             return_value=["gemini"],
         ),
         patch(
-            "src.core.config.models.backends.backend_registry.get_registered_backends",
+            "src.core.services.backend_registry.backend_registry.get_registered_backends",
             return_value=["gemini"],
         ),
     ):
 
@@ -0,0 +1,108 @@
+#!/usr/bin/env python3
+"""
+Run pycycle using settings from ``[tool.pycycle]`` in the repository ``pyproject.toml``.
+
+Upstream ``pycycle --source <path>`` is unusable with current Click (the option is typed as a
+boolean), so this script invokes ``pycycle --here`` with the working directory set to
+``resolve_dir`` (typically ``src`` for this layout).
+
+Usage::
+
+    ./.venv/Scripts/python.exe dev/scripts/run_pycycle.py
+    ./.venv/Scripts/python.exe dev/scripts/run_pycycle.py --verbose
+"""
+
+from __future__ import annotations
+
+import argparse
+import shutil
+import subprocess
+import sys
+from collections.abc import Mapping
+from pathlib import Path
+from typing import Any
+
+import tomli
+
+
+def _find_pyproject(start: Path) -> Path:
+    """Locate the nearest ``pyproject.toml`` at or above ``start``.
+
+    ``start`` itself is checked first, then each parent directory from the
+    closest to the farthest; the first candidate that is an existing file wins.
+
+    Raises:
+        SystemExit: If no directory in that chain contains ``pyproject.toml``.
+    """
+    search_chain = [start, *start.parents]
+    # Generator keeps the lookup lazy: stop touching the filesystem at the first hit.
+    candidates = (folder / "pyproject.toml" for folder in search_chain)
+    located = next((path for path in candidates if path.is_file()), None)
+    if located is None:
+        raise SystemExit(
+            "pyproject.toml not found (expected an ancestor of this script)."
+        )
+    return located
+
+
+def _load_pycycle_config(pyproject_path: Path) -> dict[str, Any]:
+    """Read the ``[tool.pycycle]`` table from ``pyproject_path``.
+
+    Returns a plain ``dict`` copy of that table, or an empty dict when either
+    ``tool`` or ``tool.pycycle`` is missing, falsy, or not a mapping.
+    """
+    with pyproject_path.open("rb") as stream:
+        document = tomli.load(stream)
+
+    # Descend ``tool`` -> ``pycycle``; bail out as soon as a level is not a table.
+    section: Any = document
+    for table_name in ("tool", "pycycle"):
+        section = section.get(table_name) or {}
+        if not isinstance(section, Mapping):
+            return {}
+    return dict(section)
+
+
+def _pycycle_executable() -> str:
+    """Return the path of the ``pycycle`` launcher to invoke.
+
+    The directory of the running interpreter is searched first
+    (``pycycle.exe``, then ``pycycle``); if neither file exists there, the
+    lookup falls back to ``shutil.which``.
+
+    Raises:
+        SystemExit: If neither lookup finds the executable.
+    """
+    interpreter_dir = Path(sys.executable).resolve().parent
+    beside_interpreter = [
+        interpreter_dir / launcher for launcher in ("pycycle.exe", "pycycle")
+    ]
+    for launcher_path in beside_interpreter:
+        if launcher_path.is_file():
+            return str(launcher_path)
+
+    on_path = shutil.which("pycycle")
+    if not on_path:
+        raise SystemExit(
+            "pycycle executable not found. Install dev dependencies, for example: "
+            "pip install -e .[dev]"
+        )
+    return on_path
+
+
+def main() -> int:
+    """Run ``pycycle --here`` inside the configured analysis directory.
+
+    Settings come from ``[tool.pycycle]`` in the nearest ``pyproject.toml``
+    above this script: ``resolve_dir`` (default ``"src"``), ``encoding``,
+    ``ignore`` (a comma-separated string, or a list of names that is joined
+    with commas) and ``verbose``. The ``--verbose`` command-line flag turns
+    verbose output on even when the table leaves it off.
+
+    Returns:
+        The exit code of the ``pycycle`` process.
+
+    Raises:
+        SystemExit: If ``resolve_dir`` points outside the repository root, if
+            the resolved directory does not exist, or if a helper cannot find
+            ``pyproject.toml`` or the ``pycycle`` executable.
+    """
+    parser = argparse.ArgumentParser(description=__doc__)
+    parser.add_argument(
+        "--verbose",
+        action="store_true",
+        help="Verbose pycycle output (overrides [tool.pycycle].verbose when set).",
+    )
+    args = parser.parse_args()
+
+    script_path = Path(__file__).resolve()
+    pyproject_path = _find_pyproject(script_path.parent)
+    repo_root = pyproject_path.parent
+    cfg = _load_pycycle_config(pyproject_path)
+
+    resolve_dir = str(cfg.get("resolve_dir") or "src")
+    encoding = cfg.get("encoding")
+    raw_ignore = cfg.get("ignore") or ""
+    if isinstance(raw_ignore, (list, tuple)):
+        # A TOML array is the natural spelling for several names; pycycle wants
+        # one comma-separated string, so join instead of passing a list repr.
+        names = (str(entry).strip() for entry in raw_ignore)
+        ignore = ",".join(name for name in names if name)
+    else:
+        ignore = str(raw_ignore)
+    verbose = bool(cfg.get("verbose")) or args.verbose
+
+    target = (repo_root / resolve_dir).resolve()
+    try:
+        # relative_to raises ValueError when target is not below the repo root.
+        target.relative_to(repo_root.resolve())
+    except ValueError:
+        msg = f"resolve_dir {resolve_dir!r} escapes repository root."
+        # The ValueError is an implementation detail; do not chain it.
+        raise SystemExit(msg) from None
+    if not target.is_dir():
+        msg = f"Analysis directory does not exist: {target}"
+        raise SystemExit(msg)
+
+    cmd: list[str] = [_pycycle_executable(), "--here"]
+    if encoding:
+        cmd.extend(["--encoding", str(encoding)])
+    stripped_ignore = ignore.strip()
+    if stripped_ignore:
+        cmd.extend(["--ignore", stripped_ignore])
+    if verbose:
+        cmd.append("--verbose")
+
+    # check=False: a non-zero pycycle status is returned to the caller, not raised.
+    completed = subprocess.run(cmd, cwd=target, check=False)
+    return int(completed.returncode)
+
+
+# Script entry point: exit with the integer status returned by main().
+if __name__ == "__main__":
+    raise SystemExit(main())
@@ -91,6 +91,7 @@ dev = [
     "respx",
     "dependency-injector",
     "vulture",
+    "pycycle==0.0.8",
     "pytest-snapshot==0.9.0",
     "mypy==1.10.0",
     "hypothesis==6.112.1",
@@ -448,6 +449,16 @@ ignore_names = [
     "tool_name"
 ]
 
+# Circular import scan (bndr/pycycle). Upstream does not read this table; dev/scripts/run_pycycle.py does.
+# Note: `pycycle --source <path>` is broken with modern Click (option is inferred as boolean), so the
+# wrapper runs `pycycle --here` with cwd set to `resolve_dir`.
+[tool.pycycle]
+resolve_dir = "src"
+encoding = "utf-8"
+# Comma-separated directory basenames excluded during traversal (passed to pycycle --ignore).
+ignore = ""
+verbose = false
+
 [tool.testmon]
 run_variant_expression = "','.join(sorted(str(v) for v in [sys.version_info[:2], sys.platform]))"
 historian = "git"
 
@@ -20,6 +20,10 @@
 
 _CODEX_QUOTA_NOTIFICATION_TITLE = "OpenAI Codex: Quota reached"
 
+# Dedupe key component when every managed account is simultaneously unavailable:
+# one desktop alert per quota window, not one per account that hits 429 last.
+_CODEX_QUOTA_ALL_ACCOUNTS_DEDUPE_ID = "__all_managed_accounts__"
+
 _EXTENDED_WINDOW = "extended (~weekly_or_plan_quota)"
 
 
@@ -96,7 +100,12 @@ async def maybe_notify_codex_quota_reached(
     until_display = until_iso if until_iso else "unknown"
     dedupe_until = until_iso if until_iso else "none"
 
-    key = (managed_account_id, quota_type, dedupe_until)
+    dedupe_account_id = (
+        _CODEX_QUOTA_ALL_ACCOUNTS_DEDUPE_ID
+        if all_accounts_exhausted
+        else managed_account_id
+    )
+    key = (dedupe_account_id, quota_type, dedupe_until)
     if key in dedupe_keys:
         return
 
 
@@ -541,12 +541,21 @@ async def _load_managed_auth(self, force_reload: bool = False) -> bool:
         if not self._managed_enabled():
             return False
 
+        # Skip managed path when nothing is on disk — avoids selector/refresh work
+        # and prevents long rate-limit polling loops during bootstrap (tests/CI).
+        if not await self._managed_has_accounts():
+            return False
+
         if force_reload:
             await self._managed_selector.reload_accounts()
 
         account = self._managed_selector.get_current_account()
         if account is None or account.needs_reauth:
-            account = await self._managed_selector.get_next_account()
+            # Initial bootstrap must not block on rate-limit recovery sleeps
+            # (see ManagedOAuthAccountSelector.get_next_account); fall back to legacy.
+            account = await self._managed_selector.get_next_account(
+                wait_for_rate_limit_recovery=False,
+            )
 
         if account is None:
             return False
@@ -862,7 +871,10 @@ async def refresh_access_token(self) -> bool:
     async def _refresh_managed_access_token(self) -> bool:
         account = self._managed_selector.get_current_account()
         if account is None:
-            account = await self._managed_selector.get_next_account()
+            # Refresh path should also avoid blocking on rate-limit recovery sleeps.
+            account = await self._managed_selector.get_next_account(
+                wait_for_rate_limit_recovery=False,
+            )
         if account is None:
             return False
 
 
@@ -227,7 +227,8 @@ class ManagedOAuthConfig(BaseModel):
     #: when upstream sends very large ``resets_in_seconds``. Full upstream metadata is
     #: still stored on ``last_codex_usage_limit``.
     rate_limit_local_cooldown_cap_seconds: float = 1800.0
-    #: Max idle polls (sleeps) while all accounts are rate-limited before giving up.
+    #: Max idle polls (sleeps) while all accounts are rate-limited before giving up
+    #: (only when ``get_next_account`` is invoked with ``wait_for_rate_limit_recovery=True``).
     max_rate_limit_idle_polls: int = 48
 
     @classmethod
 
@@ -237,8 +237,17 @@ async def get_next_account(
         *,
         session_id: str | None = None,
         ignore_session_affinity: bool = False,
+        wait_for_rate_limit_recovery: bool = True,
     ) -> ManagedOAuthAccount | None:
-        """Return next usable account and perform proactive refresh."""
+        """Return next usable account and perform proactive refresh.
+
+        When every available account is currently rate-limited, the default
+        behaviour is to sleep (bounded by ``max_rate_limit_wait_seconds``) and
+        poll until one becomes eligible again or ``max_rate_limit_idle_polls``
+        is exceeded. Callers that must not block in-flight requests (for example
+        :meth:`rotate_on_rate_limit`) should pass ``wait_for_rate_limit_recovery=False``
+        to return ``None`` immediately in that situation.
+        """
         await self._ensure_accounts_loaded()
 
         rate_limit_idle_polls = 0
@@ -250,6 +259,8 @@ async def get_next_account(
                 return None
 
             if not eligible:
+                if not wait_for_rate_limit_recovery:
+                    return None
                 rate_limit_idle_polls += 1
                 if rate_limit_idle_polls > self._max_rate_limit_idle_polls:
                     return None
@@ -381,6 +392,7 @@ async def rotate_on_rate_limit(
         return await self.get_next_account(
             session_id=session_id,
             ignore_session_affinity=True,
+            wait_for_rate_limit_recovery=False,
         )
 
     async def rotate_on_auth_failure(
@@ -398,4 +410,5 @@ async def rotate_on_auth_failure(
         return await self.get_next_account(
             session_id=session_id,
             ignore_session_affinity=True,
+            wait_for_rate_limit_recovery=False,
         )
@@ -5,7 +5,6 @@
 
 from __future__ import annotations
 
-import json
 import logging
 import uuid
 from copy import deepcopy
@@ -665,75 +664,12 @@ def convert_dict_to_payload(
     @staticmethod
     def _sanitize_responses_input(input_value: Any) -> list[dict[str, Any] | Any]:
         """Make a Responses `input` array safe for ChatGPT Codex backend.
-
-        - Removes `item_reference` entries (AI SDK/OpenCode server-state references)
-        - Strips per-item `id` fields for stateless mode (`store: false`)
-        - Removes unsupported per-item `metadata` blocks
-        - Converts orphaned `function_call_output` entries into assistant messages
-          to preserve context while avoiding backend validation errors
+
+        Note: We must NOT drop `item_reference` entries, strip `id` or `metadata`
+        fields, or rewrite `function_call_output` entries. The Codex backend relies
+        on the exact shape of these items (including their `id`s) to perform context
+        (write) caching. Altering them causes cache misses and rapid quota exhaustion.
         """
         if not isinstance(input_value, list):
             return []
-
-        filtered: list[dict[str, Any]] = []
-        for item in input_value:
-            if not isinstance(item, dict):
-                continue
-
-            item_type = item.get("type")
-            if item_type == "item_reference":
-                continue
-
-            item_dict = dict(item)
-            item_dict.pop("id", None)
-            item_dict.pop("metadata", None)
-            filtered.append(item_dict)
-
-        function_call_ids: set[str] = set()
-        for item in filtered:
-            if item.get("type") == "function_call":
-                call_id = item.get("call_id")
-                if isinstance(call_id, str) and call_id:
-                    function_call_ids.add(call_id)
-
-        safe: list[dict[str, Any]] = []
-        for item in filtered:
-            if item.get("type") == "function_call_output":
-                call_id = item.get("call_id")
-                if (
-                    isinstance(call_id, str)
-                    and call_id
-                    and call_id not in function_call_ids
-                ):
-                    tool_name = item.get("name")
-                    if not isinstance(tool_name, str) or not tool_name:
-                        tool_name = "tool"
-                    output_val = item.get("output")
-                    if isinstance(output_val, str):
-                        output_text = output_val
-                    else:
-                        try:
-                            output_text = json.dumps(output_val)
-                        except Exception:
-                            output_text = str(output_val)
-
-                    if len(output_text) > 16000:
-                        output_text = output_text[:16000] + "\n...[truncated]"
-
-                    safe.append(
-                        {
-                            "type": "message",
-                            "role": "assistant",
-                            "content": [
-                                {
-                                    "type": "output_text",
-                                    "text": f"[Previous {tool_name} result; call_id={call_id}]: {output_text}",
-                                }
-                            ],
-                        }
-                    )
-                    continue
-
-            safe.append(item)
-
-        return safe
+        return [dict(item) if isinstance(item, dict) else item for item in input_value]