feat(runtime-usage): add provider usage scrapers as optional local adapters (batch 3, #32)

2026-05-20 20:55:05 -05:00 · 2026-05-20 20:55:05 -05:00 · 1a847133ce
parent 609d04095d
commit 1a847133ce
5 changed files with 971 additions and 1 deletions
--- a/backend/app/api/gateways.py
+++ b/backend/app/api/gateways.py
@ -10,6 +10,8 @@ from sqlmodel import col

 from app.api.deps import require_org_admin, require_org_member
 from app.core.auth import AuthContext, get_auth_context
+from app.core.config import settings
+from app.core.time import utcnow
 from app.db import crud
 from app.db.pagination import paginate
 from app.db.session import get_session
@ -26,8 +28,13 @@ from app.schemas.gateways import (
    GatewayTemplatesSyncResult,
    GatewayUpdate,
 )
-from app.schemas.runtime_usage import RuntimeUsageResponse
+from app.schemas.runtime_usage import (
+    ProviderUsageResponse,
+    ProviderUsageScrapeResult,
+    RuntimeUsageResponse,
+)
 from app.services.openclaw.runtime_usage import get_runtime_usage
+from app.services.openclaw.usage_scrapers import get_provider_usage
 from app.schemas.pagination import DefaultLimitOffsetPage
 from app.services.openclaw.admin_service import GatewayAdminLifecycleService
 from app.services.openclaw.session_service import GatewayTemplateSyncQuery
@ -272,6 +279,79 @@ async def get_gateway_runtime_usage(
    )


+@router.get(
+    "/{gateway_id}/provider-usage",
+    response_model=ProviderUsageResponse,
+    summary="Gateway provider-native usage (opt-in scraper)",
+    description=(
+        "Return provider-native subscription usage data scraped from the CLI "
+        "(e.g. ``claude /usage``).  Returns an empty results list when "
+        "USAGE_SCRAPER_ENABLED=false (the default).  "
+        "Enable with USAGE_SCRAPER_ENABLED=true and ensure the required "
+        "prerequisites (tmux, claude binary) are accessible from the backend process."
+    ),
+)
+async def get_gateway_provider_usage(
+    gateway_id: UUID,
+    session: AsyncSession = SESSION_DEP,
+    ctx: OrganizationContext = ORG_MEMBER_DEP,
+) -> ProviderUsageResponse:
+    """Return scraped provider usage for one gateway of the caller's organization.
+
+    The gateway is looked up first via ``require_gateway``.  When the scraper
+    feature flag is off the response carries ``scraper_enabled=False`` and an
+    empty ``results`` list; otherwise every configured adapter result is
+    flattened into a ``ProviderUsageScrapeResult``.
+    """
+    await GatewayAdminLifecycleService(session).require_gateway(
+        gateway_id=gateway_id,
+        organization_id=ctx.organization.id,
+    )
+    generated_at = utcnow()
+    scraper_on = bool(settings.usage_scraper_enabled)
+
+    payload: list[ProviderUsageScrapeResult] = []
+    if scraper_on:
+        # Comma-separated setting -> list of non-empty, trimmed adapter names.
+        trimmed = (chunk.strip() for chunk in settings.usage_scraper_providers.split(","))
+        provider_names = [name for name in trimmed if name]
+
+        scraped = await get_provider_usage(
+            gateway_id=str(gateway_id),
+            enabled_providers=provider_names,
+            tmux_socket=settings.usage_scraper_tmux_socket,
+            include_raw=settings.usage_scraper_include_raw,
+        )
+        for item in scraped:
+            usage = item.parsed
+            payload.append(
+                ProviderUsageScrapeResult(
+                    provider=item.provider,
+                    source_name=item.source_name,
+                    scraped_at=item.scraped_at,
+                    fresh=item.fresh,
+                    freshness_ttl_seconds=item.freshness_ttl_seconds,
+                    current_pct=usage.current_pct,
+                    remaining_ms=usage.remaining_ms,
+                    remaining_label=usage.remaining_label,
+                    weekly_messages_used=usage.weekly_messages_used,
+                    weekly_messages_limit=usage.weekly_messages_limit,
+                    weekly_tokens_used=usage.weekly_tokens_used,
+                    weekly_cost_usd=usage.weekly_cost_usd,
+                    raw_text=usage.raw_text,
+                    # Scrape-level failure wins over a parser-level one.
+                    error=item.error or usage.error,
+                )
+            )
+
+    return ProviderUsageResponse(
+        gateway_id=gateway_id,
+        generated_at=generated_at,
+        scraper_enabled=scraper_on,
+        results=payload,
+    )
+
+
+
+
@router.delete("/{gateway_id}", response_model=OkResponse)
 async def delete_gateway(
    gateway_id: UUID,
--- a/backend/app/core/config.py
+++ b/backend/app/core/config.py
@ -89,6 +89,21 @@ class Settings(BaseSettings):
    # OpenClaw gateway runtime compatibility
    gateway_min_version: str = "2026.02.9"

+    # Provider usage scrapers (opt-in; off by default)
+    usage_scraper_enabled: bool = False
+    # Comma-separated list of enabled provider adapters, e.g. "claude_cli_tmux"
+    usage_scraper_providers: str = "claude_cli_tmux"
+    # TTL in seconds before a cached scrape result is considered stale
+    usage_scraper_cache_ttl_seconds: int = 300
+    # Directory for scraper output cache files (defaults to system temp)
+    usage_scraper_cache_dir: str = ""
+    # Full path to the claude binary (empty = auto-detect on PATH)
+    usage_scraper_claude_bin: str = ""
+    # Tmux socket path (empty = default tmux socket)
+    usage_scraper_tmux_socket: str = ""
+    # Include raw CLI output in API response (useful for debugging; off by default)
+    usage_scraper_include_raw: bool = False
+
    # Logging
    log_level: str = "INFO"
    log_format: str = "text"
--- a/backend/app/schemas/runtime_usage.py
+++ b/backend/app/schemas/runtime_usage.py
@ -72,6 +72,42 @@ class TopSession(SQLModel):
    updated_at: str | None = None


+class ProviderUsageScrapeResult(SQLModel):
+    """Structured result from one provider-native usage scrape (e.g. Claude CLI /usage).
+
+    Returned by GET /gateways/{id}/provider-usage.
+    The identity/freshness fields (``provider`` through
+    ``freshness_ttl_seconds``) are required.  Every parsed metric below them
+    is optional — partial data is still useful and expected
+    when CLI output format changes or the session is quiet.
+    """
+
+    provider: str          # "anthropic", "openai", "google"
+    source_name: str       # "claude_cli_tmux", "gemini_scrape", etc.
+    scraped_at: datetime
+    fresh: bool            # True if within the freshness window
+    freshness_ttl_seconds: int
+
+    current_pct: float | None = None       # 0–100 % of current window used
+    remaining_ms: int | None = None        # ms until window resets
+    remaining_label: str | None = None     # human-readable "2h 47m"
+
+    weekly_messages_used: int | None = None
+    weekly_messages_limit: int | None = None
+    weekly_tokens_used: int | None = None
+    weekly_cost_usd: float | None = None
+
+    # Raw CLI text; the endpoint forwards it only when the
+    # usage_scraper_include_raw setting is enabled, otherwise it is None.
+    raw_text: str | None = None
+    error: str | None = None      # set when scrape or parse failed
+
+
+
+
+class ProviderUsageResponse(SQLModel):
+    """Response envelope for GET /gateways/{id}/provider-usage."""
+
+    gateway_id: UUID
+    # Timestamp taken by the endpoint when it builds the response.
+    generated_at: datetime
+    # False when the scraper feature flag is off; ``results`` is then empty.
+    scraper_enabled: bool
+    # One entry per adapter that ran (or was served from cache).
+    results: list[ProviderUsageScrapeResult]
+
+
+
 class RuntimeUsageResponse(SQLModel):
    """Complete runtime usage payload returned by GET /gateways/{id}/runtime-usage."""

--- a/backend/app/services/openclaw/usage_scrapers.py
+++ b/backend/app/services/openclaw/usage_scrapers.py
@ -0,0 +1,550 @@
+"""Provider-native usage scrapers for supplemental limit/percentage data.
+
+Design principles:
+- Opt-in only: all scrapers are disabled by default (USAGE_SCRAPER_ENABLED=false).
+- Supplemental: scraper data enriches JSONL-based metrics; it is never the
+  primary source of truth for tokens or spend.
+- Isolated: each provider adapter is independent and can fail without
+  affecting the rest of the system.
+- Testable: parse_claude_usage() is a pure function with no side effects.
+- Fragile by nature: CLI text output changes — treat results as best-effort.
+
+Tmux requirement for ClaudeTmuxScraper:
+  The backend process must have access to the host's tmux socket.  For
+  Docker-based local installs, mount the socket:
+    -v /tmp/tmux-1000:/tmp/tmux-1000 (or whatever $TMUX uses)
+  For bare-metal runs, no extra config is needed.
+"""
+
+from __future__ import annotations
+
+import asyncio
+import os
+import re
+import tempfile
+from abc import ABC, abstractmethod
+from dataclasses import dataclass, field
+from datetime import datetime, timedelta
+from pathlib import Path
+from typing import ClassVar
+
+from app.core.logging import get_logger
+from app.core.time import utcnow
+
+logger = get_logger(__name__)
+
+# ---------------------------------------------------------------------------
+# Internal result dataclass (not a schema — stays inside the service layer)
+# ---------------------------------------------------------------------------
+
+@dataclass
+class ParsedClaudeUsage:
+    """Structured result from parsing one block of ``claude /usage`` text.
+
+    Only ``raw_text`` must be supplied; every metric defaults to ``None`` and
+    stays ``None`` when the parser cannot find it.
+    """
+
+    # Text that was parsed.  ``None`` is allowed because callers blank this
+    # field out when raw output must not be exposed.
+    raw_text: str | None
+    current_pct: float | None = None          # percent of the current window used
+    remaining_ms: int | None = None           # milliseconds until the window resets
+    remaining_label: str | None = None        # compact label such as "2h 47m"
+    weekly_messages_used: int | None = None
+    weekly_messages_limit: int | None = None
+    weekly_tokens_used: int | None = None
+    weekly_cost_usd: float | None = None
+    error: str | None = None                  # set when nothing usable was parsed
+
+
+
+@dataclass
+class ScrapeResult:
+    """Complete result from one scraper invocation (parsed + metadata)."""
+
+    provider: str                 # adapter's ``provider`` class attribute
+    source_name: str              # adapter's ``source_name``; also part of the cache key
+    scraped_at: datetime          # timestamp taken when the scrape started
+    fresh: bool                   # False when the scrape raised
+    freshness_ttl_seconds: int
+    parsed: ParsedClaudeUsage     # parser output (carries its own ``error``)
+    error: str | None = None      # scrape-level failure message, if any
+
+
+
+# ---------------------------------------------------------------------------
+# Parser — pure function, no I/O
+# ---------------------------------------------------------------------------
+
+def _strip_commas(s: str) -> str:
+    """Return *s* with every comma (thousands separator) removed."""
+    return "".join(s.split(","))
+
+
+def _parse_int(s: str) -> int:
+    """Parse an integer that may be padded and use comma thousands separators."""
+    digits = s.strip().replace(",", "")
+    return int(digits)
+
+
+def _parse_float(s: str) -> float:
+    """Parse a float that may be padded and use comma thousands separators."""
+    digits = s.strip().replace(",", "")
+    return float(digits)
+
+
+# Matches a number followed by "%" ("67%", "67.5 %") when the number sits at
+# the start of a line or directly after whitespace or "(".  Group 1 is the
+# numeric part.
+_PCT_RE = re.compile(
+    r"(?:^|[\s(])(\d+(?:\.\d+)?)\s*%",
+    re.MULTILINE,
+)
+
+# Matches "reset(s) in", "remaining", "time remaining" or "next reset ... in"
+# and lazily captures what follows, up to the first ")" or the end of the
+# line.  Note: "resets at <clock time>" is NOT covered by this pattern.
+_RESET_LINE_RE = re.compile(
+    r"(?:resets?\s+in[:\s]*|remaining[:\s]*|time\s+remaining[:\s]*|next\s+reset[:\s]*in[:\s]*)"
+    r"(.+?)(?:\)|$)",
+    re.IGNORECASE | re.MULTILINE,
+)
+
+# Matches the parenthesised form "(resets in 2h 47m)" embedded in longer
+# lines; group 1 is the time expression between "in" and ")".
+_INLINE_RESET_RE = re.compile(
+    r"\(\s*resets?\s+in\s+(.+?)\s*\)",
+    re.IGNORECASE,
+)
+
+# Time components: optional days, optional hours, optional minutes
+# (groups 1-3).  Every component of the first alternative is optional, so it
+# can match the empty string; as a result the "< 1m" alternative after "|" is
+# effectively never selected — _parse_remaining_ms handles "< 1m" itself
+# before consulting this pattern.
+_TIME_PARTS_RE = re.compile(
+    r"(?:(\d+)\s*d(?:ay)?s?)?"          # days
+    r"\s*(?:(\d+)\s*h(?:our)?s?)?"      # hours
+    r"\s*(?:(\d+)\s*m(?:in(?:ute)?s?)?)?"  # minutes
+    r"|(<?)\s*1\s*m",                   # "< 1m" edge case
+    re.IGNORECASE,
+)
+
+# Weekly/daily usage lines.
+# Groups: 1 = count after "messages:", 2 = optional limit after "/",
+# 3 = count in the "N messages" form.
+_WEEKLY_MSGS_RE = re.compile(
+    # "messages: 234 / 500"  OR  "234 messages"  OR  "Messages: 234"
+    r"(?:messages?[:\s]+(\d[\d,]*)(?:\s*/\s*(\d[\d,]*))?)"
+    r"|(?:(\d[\d,]*)\s+messages?)",
+    re.IGNORECASE,
+)
+# Token counts; group 1 may contain comma thousands separators.
+_WEEKLY_INPUT_RE = re.compile(r"input\s+tokens?[:\s]+([\d,]+)", re.IGNORECASE)
+_WEEKLY_OUTPUT_RE = re.compile(r"output\s+tokens?[:\s]+([\d,]+)", re.IGNORECASE)
+_WEEKLY_TOKENS_RE = re.compile(r"(?:total\s+)?tokens?[:\s]+([\d,]+)", re.IGNORECASE)
+# Dollar amount with 1-4 decimal places, e.g. "$4.23"; group 1 is the number.
+_WEEKLY_COST_RE = re.compile(r"\$\s*([\d]+\.[\d]{1,4})", re.IGNORECASE)
+
+
+def _parse_remaining_ms(time_str: str) -> tuple[int, str] | None:
+    """Turn a duration such as '2h 47m', '1 day 4h' or '< 1m' into milliseconds.
+
+    Returns:
+        ``(milliseconds, compact_label)``, or ``None`` when the text is empty,
+        does not start with a recognisable duration, or adds up to zero.
+    """
+    text = time_str.strip()
+    if not text:
+        return None
+
+    # "< 1m" / "< 1 minute" is reported as a fixed 30 seconds.
+    if re.match(r"<\s*1\s*m", text, re.IGNORECASE):
+        return 30_000, "< 1m"
+
+    match = _TIME_PARTS_RE.search(text)
+    if match is None:
+        return None
+
+    # Missing components come back as None and count as zero.
+    day_count, hour_count, minute_count = (
+        int(piece or 0) for piece in match.group(1, 2, 3)
+    )
+    total_seconds = day_count * 86400 + hour_count * 3600 + minute_count * 60
+    if total_seconds == 0:
+        return None
+
+    # Compact label built from the non-zero components only, e.g. "1d 4h".
+    units = ((day_count, "d"), (hour_count, "h"), (minute_count, "m"))
+    label = " ".join(f"{amount}{suffix}" for amount, suffix in units if amount)
+
+    return total_seconds * 1000, label
+
+
+
+def parse_claude_usage(raw: str) -> ParsedClaudeUsage:
+    """Parse a block of text from ``claude /usage`` into structured fields.
+
+    This is a pure function — no I/O, no side effects.  It never raises;
+    on failure it sets ``error`` and leaves numeric fields as None.
+
+    Args:
+        raw: Captured CLI text (may be empty or unrelated output).
+
+    Returns:
+        A ``ParsedClaudeUsage`` whose ``raw_text`` is *raw* unchanged.
+        ``error`` is ``"empty output"`` for blank input and
+        ``"no parseable usage data found"`` when neither percentage,
+        remaining time, weekly messages nor weekly tokens could be extracted.
+    """
+    result = ParsedClaudeUsage(raw_text=raw)
+
+    if not raw or not raw.strip():
+        result.error = "empty output"
+        return result
+
+    # ---- percentage --------------------------------------------------------
+    # Values outside 0-100 are skipped; the scan continues to the next match.
+    for m in _PCT_RE.finditer(raw):
+        pct = float(m.group(1))
+        if 0.0 <= pct <= 100.0:
+            result.current_pct = pct
+            break  # take the first plausible percentage
+
+    # ---- remaining time ----------------------------------------------------
+    time_str: str | None = None
+
+    # Try inline "(resets in X)" pattern first (most specific)
+    inline = _INLINE_RESET_RE.search(raw)
+    if inline:
+        time_str = inline.group(1)
+
+    # Fall back to line-level patterns
+    if not time_str:
+        line_m = _RESET_LINE_RE.search(raw)
+        if line_m:
+            time_str = line_m.group(1).strip()
+
+    if time_str:
+        parsed_time = _parse_remaining_ms(time_str)
+        if parsed_time:
+            result.remaining_ms, result.remaining_label = parsed_time
+
+    # ---- weekly stats  -----------------------------------------------------
+    # Try to find a "weekly" or "this week" section; without one the whole
+    # text is searched.  The section starts at the keyword itself (not at the
+    # start of its line) and runs to the next blank line or the end of text.
+    weekly_section = raw
+    week_header = re.search(
+        r"(?:this\s+week|weekly|week\b)[^\n]*\n(.+?)(?=\n\s*\n|\Z)",
+        raw, re.IGNORECASE | re.DOTALL
+    )
+    if week_header:
+        weekly_section = week_header.group(0)
+
+    # messages (with optional limit)
+    msgs_m = _WEEKLY_MSGS_RE.search(weekly_section)
+    if msgs_m:
+        try:
+            # group(1) = "messages: N", group(3) = "N messages"
+            used_str = msgs_m.group(1) or msgs_m.group(3)
+            if used_str:
+                result.weekly_messages_used = _parse_int(used_str)
+            if msgs_m.group(2):
+                result.weekly_messages_limit = _parse_int(msgs_m.group(2))
+        except (ValueError, TypeError):
+            # Best-effort: an unparsable count leaves the field as None.
+            pass
+
+    # tokens — prefer input+output sum if both present
+    input_m  = _WEEKLY_INPUT_RE.search(weekly_section)
+    output_m = _WEEKLY_OUTPUT_RE.search(weekly_section)
+    if input_m and output_m:
+        try:
+            result.weekly_tokens_used = (
+                _parse_int(input_m.group(1)) + _parse_int(output_m.group(1))
+            )
+        except (ValueError, TypeError):
+            pass
+    # weekly_tokens_used has not been assigned before this point, so this
+    # branch runs whenever the input/output pair is incomplete.
+    elif not result.weekly_tokens_used:
+        tok_m = _WEEKLY_TOKENS_RE.search(weekly_section)
+        if tok_m:
+            try:
+                result.weekly_tokens_used = _parse_int(tok_m.group(1))
+            except (ValueError, TypeError):
+                pass
+
+    # Alt-key patterns: "weekly tokens: 9,876,543" anywhere in the text
+    if result.weekly_tokens_used is None:
+        alt_tok = re.search(
+            r"weekly\s+tokens?[:\s]+([\d,]+)", raw, re.IGNORECASE
+        )
+        if alt_tok:
+            try:
+                result.weekly_tokens_used = _parse_int(alt_tok.group(1))
+            except (ValueError, TypeError):
+                pass
+
+    # cost
+    cost_m = _WEEKLY_COST_RE.search(weekly_section)
+    if cost_m:
+        try:
+            result.weekly_cost_usd = _parse_float(cost_m.group(1))
+        except (ValueError, TypeError):
+            pass
+
+    # ---- validation --------------------------------------------------------
+    # NOTE(review): weekly_cost_usd and weekly_messages_limit are not part of
+    # this check, so a result holding only a cost is still flagged as an
+    # error — confirm that is intended.
+    all_none = (
+        result.current_pct is None
+        and result.remaining_ms is None
+        and result.weekly_messages_used is None
+        and result.weekly_tokens_used is None
+    )
+    if all_none:
+        result.error = "no parseable usage data found"
+
+    return result
+
+
+
+# ---------------------------------------------------------------------------
+# Adapter interface
+# ---------------------------------------------------------------------------
+
+class RuntimeUsageProviderAdapter(ABC):
+    """Base class every provider-native usage scraper derives from.
+
+    Subclasses set ``provider`` / ``source_name`` and implement ``fetch_raw``
+    and ``parse``; ``scrape`` combines the two and converts failures into a
+    ``ScrapeResult`` instead of letting them propagate.
+    """
+
+    provider: ClassVar[str]
+    source_name: ClassVar[str]
+    freshness_ttl_seconds: ClassVar[int] = 300
+
+    @abstractmethod
+    async def fetch_raw(self) -> str:
+        """Fetch the provider's raw usage text."""
+
+    @abstractmethod
+    def parse(self, raw: str) -> ParsedClaudeUsage:
+        """Convert raw usage text into a ``ParsedClaudeUsage``."""
+
+    def is_available(self) -> bool:
+        """Tell whether this adapter can run on the current host (default: yes)."""
+        return True
+
+    async def scrape(self) -> ScrapeResult:
+        """Fetch and parse once; any exception becomes an error result."""
+        started_at = utcnow()
+        failure: str | None = None
+        try:
+            parsed = self.parse(await self.fetch_raw())
+        except Exception as exc:
+            logger.warning(
+                "usage_scraper.fetch_failed provider=%s source=%s error=%s",
+                self.provider, self.source_name, exc,
+            )
+            failure = str(exc)
+            # Placeholder parse result so callers can always read ``parsed``.
+            parsed = ParsedClaudeUsage(raw_text="", error=failure)
+
+        return ScrapeResult(
+            provider=self.provider,
+            source_name=self.source_name,
+            scraped_at=started_at,
+            fresh=failure is None,
+            freshness_ttl_seconds=self.freshness_ttl_seconds,
+            parsed=parsed,
+            error=failure,
+        )
+
+
+
+# ---------------------------------------------------------------------------
+# Claude CLI tmux adapter
+# ---------------------------------------------------------------------------
+
+# Default pause between sending the command and capturing the pane.
+_TMUX_WAIT_SECONDS = 2.0     # seconds to wait after sending /usage
+# NOTE(review): not referenced by any code visible in this module — confirm
+# whether capture-pane was meant to be limited to this many lines.
+_TMUX_CAPTURE_LINES = 80     # lines to capture from the tmux pane
+
+
+async def _run(
+    *args: str,
+    timeout: float = 5.0,
+) -> tuple[str, str]:
+    """Run a subprocess and return its decoded ``(stdout, stderr)``.
+
+    Args:
+        *args: Program followed by its arguments; executed directly via
+            ``asyncio.create_subprocess_exec`` (no shell).
+        timeout: Seconds to wait for the process to finish.
+
+    Returns:
+        stdout and stderr decoded as UTF-8 with undecodable bytes replaced.
+        The exit status is not inspected.
+
+    Raises:
+        asyncio.TimeoutError: The process did not finish in time.  The child
+            is killed and reaped before the error propagates.
+        OSError: The program could not be started (e.g. FileNotFoundError).
+    """
+    proc = await asyncio.create_subprocess_exec(
+        *args,
+        stdout=asyncio.subprocess.PIPE,
+        stderr=asyncio.subprocess.PIPE,
+    )
+    try:
+        stdout, stderr = await asyncio.wait_for(proc.communicate(), timeout=timeout)
+    except asyncio.TimeoutError:
+        # wait_for() only cancels communicate(); without an explicit kill the
+        # child would keep running after we give up on it.
+        try:
+            proc.kill()
+        except ProcessLookupError:
+            pass  # the process exited between the timeout and the kill
+        await proc.wait()
+        raise
+    return stdout.decode("utf-8", errors="replace"), stderr.decode("utf-8", errors="replace")
+
+
+
+async def _find_claude_tmux_pane(tmux_socket: str = "") -> str | None:
+    """Return the id of the first tmux pane whose command contains "claude".
+
+    ``None`` is returned when no pane qualifies or when tmux cannot be run
+    (missing binary, OS error, timeout).
+    """
+    tmux_cmd = ["tmux", "-S", tmux_socket] if tmux_socket else ["tmux"]
+    try:
+        listing, _ = await _run(
+            *tmux_cmd,
+            "list-panes", "-a",
+            "-F", "#{pane_id}:#{pane_current_command}",
+        )
+    except (OSError, asyncio.TimeoutError):
+        # FileNotFoundError is an OSError, so a missing tmux lands here too.
+        return None
+
+    for row in listing.splitlines():
+        # Each row is "<pane_id>:<command>"; rows without ":" are ignored.
+        pane_id, colon, running = row.strip().partition(":")
+        if colon and "claude" in running.lower():
+            return pane_id
+    return None
+
+
+
+async def _tmux_send_and_capture(
+    pane_id: str,
+    command: str = "/usage",
+    tmux_socket: str = "",
+    wait_seconds: float = _TMUX_WAIT_SECONDS,
+) -> str:
+    """Type *command* into a tmux pane, wait, and return the pane's text.
+
+    The captured text has the common ANSI colour/cursor sequences removed.
+    """
+    tmux_cmd = ["tmux", "-S", tmux_socket] if tmux_socket else ["tmux"]
+
+    # Drop the pane's history before sending anything.
+    await _run(*tmux_cmd, "clear-history", "-t", pane_id)
+    # Type the command followed by Enter.
+    await _run(*tmux_cmd, "send-keys", "-t", pane_id, command, "Enter")
+    # Give the CLI time to render its answer.
+    await asyncio.sleep(wait_seconds)
+    # -J joins wrapped lines; -e asks tmux to include escape sequences,
+    # which are stripped again just below.
+    captured, _ = await _run(
+        *tmux_cmd,
+        "capture-pane", "-pt", pane_id,
+        "-J",
+        "-e",
+    )
+    return re.sub(r"\x1b\[[0-9;]*[mGKHF]", "", captured)
+
+
+
+class ClaudeTmuxScraper(RuntimeUsageProviderAdapter):
+    """Adapter that types ``/usage`` into a running Claude tmux pane.
+
+    Prerequisites:
+    - the ``tmux`` binary is reachable from the backend process;
+    - some tmux pane is currently running the ``claude`` CLI;
+    - Docker installs mount the host tmux socket into the container.
+
+    The CLI's text format changes over time, so the output is a supplemental
+    hint rather than accounting truth.
+    """
+
+    provider: ClassVar[str] = "anthropic"
+    source_name: ClassVar[str] = "claude_cli_tmux"
+    freshness_ttl_seconds: ClassVar[int] = 300
+
+    def __init__(
+        self,
+        tmux_socket: str = "",
+        wait_seconds: float = _TMUX_WAIT_SECONDS,
+    ) -> None:
+        """Remember the tmux socket path and the post-send wait time."""
+        self.tmux_socket = tmux_socket
+        self.wait_seconds = wait_seconds
+
+    def is_available(self) -> bool:
+        """Report whether a ``tmux`` executable is on PATH."""
+        from shutil import which
+
+        return which("tmux") is not None
+
+    async def fetch_raw(self) -> str:
+        """Capture the ``/usage`` output of the first Claude pane.
+
+        Raises:
+            RuntimeError: No tmux pane running ``claude`` was found.
+        """
+        pane = await _find_claude_tmux_pane(self.tmux_socket)
+        if pane is not None:
+            return await _tmux_send_and_capture(
+                pane,
+                tmux_socket=self.tmux_socket,
+                wait_seconds=self.wait_seconds,
+            )
+        raise RuntimeError(
+            "No tmux pane found running 'claude'. "
+            "Start a Claude session before enabling the tmux scraper."
+        )
+
+    def parse(self, raw: str) -> ParsedClaudeUsage:
+        """Delegate to the module-level ``parse_claude_usage``."""
+        return parse_claude_usage(raw)
+
+
+
+# ---------------------------------------------------------------------------
+# Simple TTL cache
+# ---------------------------------------------------------------------------
+
+class UsageScraperCache:
+    """In-memory TTL cache for scrape results, keyed by gateway and source.
+
+    A cache directory is resolved and stored on the instance, but no method
+    of this class reads from or writes to it: entries live only in process
+    memory.
+    """
+
+    def __init__(
+        self,
+        ttl_seconds: int = 300,
+        cache_dir: str = "",
+    ) -> None:
+        """Store the TTL and resolve the cache directory (system temp by default)."""
+        self.ttl_seconds = ttl_seconds
+        self._memory: dict[str, tuple[datetime, ScrapeResult]] = {}
+        if cache_dir:
+            self._cache_dir = Path(cache_dir)
+        else:
+            self._cache_dir = Path(tempfile.gettempdir()) / "pipeline-usage-cache"
+
+    def _key(self, gateway_id: str, source_name: str) -> str:
+        """Build the ``"<gateway_id>:<source_name>"`` lookup key."""
+        return "{}:{}".format(gateway_id, source_name)
+
+    def get(self, gateway_id: str, source_name: str) -> ScrapeResult | None:
+        """Return the cached result, or ``None`` if absent or older than the TTL."""
+        slot = self._key(gateway_id, source_name)
+        if slot not in self._memory:
+            return None
+        stored_at, value = self._memory[slot]
+        if (utcnow() - stored_at).total_seconds() > self.ttl_seconds:
+            # Expired entries are evicted lazily, on lookup.
+            del self._memory[slot]
+            return None
+        return value
+
+    def set(self, gateway_id: str, source_name: str, result: ScrapeResult) -> None:
+        """Store *result* stamped with the current time."""
+        self._memory[self._key(gateway_id, source_name)] = (utcnow(), result)
+
+
+
+# Module-level singleton cache used by the endpoint.
+# NOTE(review): built with the constructor defaults, so the
+# usage_scraper_cache_ttl_seconds / usage_scraper_cache_dir settings are not
+# applied here — confirm whether they should be wired in.
+_cache = UsageScraperCache()
+
+
+# ---------------------------------------------------------------------------
+# Public entry point
+# ---------------------------------------------------------------------------
+
+def build_adapters(
+    enabled_providers: list[str],
+    tmux_socket: str = "",
+) -> list[RuntimeUsageProviderAdapter]:
+    """Instantiate enabled adapters from a list of provider names.
+
+    Args:
+        enabled_providers: Adapter names; matching ignores case and
+            surrounding whitespace.
+        tmux_socket: Socket path handed to the tmux-based adapter.
+
+    Returns:
+        Adapters whose ``is_available()`` is true, in input order.  Unknown
+        names are logged and skipped.
+    """
+    registry: dict[str, type[RuntimeUsageProviderAdapter]] = {
+        "claude_cli_tmux": ClaudeTmuxScraper,
+    }
+    adapters: list[RuntimeUsageProviderAdapter] = []
+    for name in enabled_providers:
+        # Normalise once so the registry lookup and the kwargs selection
+        # below agree (e.g. "Claude_CLI_Tmux" still receives tmux_socket).
+        key = name.strip().lower()
+        cls = registry.get(key)
+        if cls is None:
+            logger.warning("usage_scraper.unknown_provider name=%s", name)
+            continue
+        kwargs: dict[str, str] = {}
+        if key == "claude_cli_tmux":
+            kwargs["tmux_socket"] = tmux_socket
+        adapter = cls(**kwargs)
+        if adapter.is_available():
+            adapters.append(adapter)
+        else:
+            logger.info("usage_scraper.not_available provider=%s", name)
+    return adapters
+
+
+
+async def get_provider_usage(
+    gateway_id: str,
+    enabled_providers: list[str],
+    tmux_socket: str = "",
+    include_raw: bool = False,
+) -> list[ScrapeResult]:
+    """Run all enabled adapters for a gateway, using cache where fresh.
+
+    Args:
+        gateway_id: Gateway identifier; part of the cache key.
+        enabled_providers: Adapter names to run (see ``build_adapters``).
+        tmux_socket: Socket path forwarded to tmux-based adapters.
+        include_raw: When false, ``parsed.raw_text`` is ``None`` in every
+            returned result, including results served from the cache.
+
+    Returns:
+        One ScrapeResult per available adapter; scrape failures are reported
+        inside the result rather than raised.
+    """
+    # Local import: the module header imports only ``dataclass`` and ``field``.
+    from dataclasses import replace
+
+    adapters = build_adapters(enabled_providers, tmux_socket=tmux_socket)
+    results: list[ScrapeResult] = []
+    for adapter in adapters:
+        result = _cache.get(gateway_id, adapter.source_name)
+        if result is None:
+            result = await adapter.scrape()
+            _cache.set(gateway_id, adapter.source_name, result)
+            logger.info(
+                "usage_scraper.result gateway_id=%s provider=%s source=%s "
+                "pct=%s remaining_ms=%s error=%s",
+                gateway_id,
+                result.provider,
+                result.source_name,
+                result.parsed.current_pct,
+                result.parsed.remaining_ms,
+                result.error,
+            )
+        if not include_raw and result.parsed is not None:
+            # Strip on a copy: the cached entry stays intact, and cache hits
+            # honour include_raw exactly like fresh scrapes do.
+            result = replace(result, parsed=replace(result.parsed, raw_text=None))
+        results.append(result)
+    return results
--- a/backend/tests/test_runtime_usage_scrapers.py
+++ b/backend/tests/test_runtime_usage_scrapers.py
@ -0,0 +1,289 @@
+# ruff: noqa: INP001
+"""Tests for provider usage scraper parsers.
+
+All tests are pure-Python — no subprocess, no tmux, no gateway connection.
+Each fixture string represents a realistic sample of `claude /usage` output.
+Tests are written first and drive the parser implementation.
+"""
+
+from __future__ import annotations
+
+import pytest
+
+# We import the parse function directly — it is pure and has no side effects.
+from app.services.openclaw.usage_scrapers import parse_claude_usage
+
+
+# ---------------------------------------------------------------------------
+# Fixture text samples
+# ---------------------------------------------------------------------------
+
+# Standard output from `claude /usage` in Claude Code (subscription plan)
+FIXTURE_STANDARD = """
+╭──────────────────────────────────────────────────────────────────╮
+│                       Claude Code Usage                          │
+╰──────────────────────────────────────────────────────────────────╯
+
+ Usage window (resets in 2h 47m):
+   67% of limit used
+
+ This week (Mon – Sun):
+   Messages:      234
+   Input tokens:  1,234,567
+   Output tokens:   456,789
+   Est. cost:     $4.23
+"""
+
+# Minimal output — just the percentage and reset time
+FIXTURE_MINIMAL = """
+Rate limit: 45% used
+Resets in: 3h 15m
+"""
+
+# Output with messages limit shown as X/Y
+FIXTURE_WITH_LIMIT = """
+Usage window resets in 1h 5m:
+  Messages: 178 / 500  (35% used)
+  Input tokens: 890,123
+  Output tokens: 234,567
+
+Weekly usage:
+  Messages: 892
+  Cost: $8.76
+"""
+
+# Under an hour remaining (window almost exhausted)
+FIXTURE_ALMOST_RESET = """
+Usage: 99% of window used
+Resets in: 42m
+"""
+
+# Only minutes remaining without hours
+FIXTURE_MINUTES_ONLY = """
+Context: 72% used
+Time remaining: 28m
+"""
+
+# Days + hours format
+FIXTURE_DAYS_HOURS = """
+Next reset: in 1 day 4h
+Current usage: 12%
+"""
+
+# "< 1 minute" edge case
+FIXTURE_UNDER_ONE_MINUTE = """
+Usage: 100%
+Resets in: < 1m
+"""
+
+# Output without any percentage but with reset time
+FIXTURE_NO_PCT = """
+Session active.
+Window resets in: 4h 0m
+No usage data available.
+"""
+
+# Output with zero usage
+FIXTURE_ZERO_USAGE = """
+Usage window (resets in 5h 0m):
+  0% of limit used
+
+Weekly: 0 messages, $0.00
+"""
+
+# Completely empty
+FIXTURE_EMPTY = ""
+
+# Garbage / error text
+FIXTURE_ERROR = "Error: claude: command not found"
+
+# Multi-line noise around the real data
+FIXTURE_NOISY = """
+...
+Checking session...
+Fetching usage stats...
+
+Usage (resets in 2h 0m): 55% used
+
+Messages this week: 301
+
+...Done.
+"""
+
+# Alternate key casing variants that some versions might use
+FIXTURE_ALT_KEYS = """
+rate limit window: 89% Used
+RESETS IN: 0h 30m
+weekly messages: 412
+weekly tokens: 9,876,543
+"""
+
+
+# ---------------------------------------------------------------------------
+# Tests
+# ---------------------------------------------------------------------------
+
+class TestParseClaudeUsagePercentage:
+    """``current_pct`` extraction across the fixture variants."""
+
+    def test_standard_percentage(self):
+        r = parse_claude_usage(FIXTURE_STANDARD)
+        assert r.current_pct == pytest.approx(67.0)
+
+    def test_minimal_percentage(self):
+        r = parse_claude_usage(FIXTURE_MINIMAL)
+        assert r.current_pct == pytest.approx(45.0)
+
+    def test_with_limit_percentage(self):
+        # The percentage appears in parentheses: "(35% used)".
+        r = parse_claude_usage(FIXTURE_WITH_LIMIT)
+        assert r.current_pct == pytest.approx(35.0)
+
+    def test_near_full_percentage(self):
+        r = parse_claude_usage(FIXTURE_ALMOST_RESET)
+        assert r.current_pct == pytest.approx(99.0)
+
+    def test_zero_percentage(self):
+        r = parse_claude_usage(FIXTURE_ZERO_USAGE)
+        assert r.current_pct == pytest.approx(0.0)
+
+    def test_no_percentage_returns_none(self):
+        r = parse_claude_usage(FIXTURE_NO_PCT)
+        assert r.current_pct is None
+
+    def test_empty_returns_none(self):
+        r = parse_claude_usage(FIXTURE_EMPTY)
+        assert r.current_pct is None
+
+    def test_error_text_returns_none(self):
+        r = parse_claude_usage(FIXTURE_ERROR)
+        assert r.current_pct is None
+
+    def test_alt_key_casing(self):
+        r = parse_claude_usage(FIXTURE_ALT_KEYS)
+        assert r.current_pct == pytest.approx(89.0)
+
+    def test_noisy_output(self):
+        r = parse_claude_usage(FIXTURE_NOISY)
+        assert r.current_pct == pytest.approx(55.0)
+
+
+
+class TestParseClaudeUsageRemainingTime:
+    """``remaining_ms`` / ``remaining_label`` extraction across the fixtures."""
+
+    def test_hours_and_minutes(self):
+        r = parse_claude_usage(FIXTURE_STANDARD)
+        # 2h 47m = 10020 seconds = 10,020,000 ms
+        assert r.remaining_ms == pytest.approx(10_020_000, rel=1e-3)
+        assert r.remaining_label == "2h 47m"
+
+    def test_hours_and_minutes_variant(self):
+        r = parse_claude_usage(FIXTURE_MINIMAL)
+        # 3h 15m = 11700 seconds
+        assert r.remaining_ms == pytest.approx(11_700_000, rel=1e-3)
+
+    def test_minutes_only(self):
+        r = parse_claude_usage(FIXTURE_MINUTES_ONLY)
+        # 28m = 1680 seconds
+        assert r.remaining_ms == pytest.approx(1_680_000, rel=1e-3)
+        assert r.remaining_label == "28m"
+
+    def test_days_and_hours(self):
+        r = parse_claude_usage(FIXTURE_DAYS_HOURS)
+        # 1 day 4h = 28 hours = 100800 seconds
+        assert r.remaining_ms == pytest.approx(100_800_000, rel=1e-3)
+
+    def test_under_one_minute(self):
+        # "< 1m" has no exact value; only the upper bound is checked.
+        r = parse_claude_usage(FIXTURE_UNDER_ONE_MINUTE)
+        assert r.remaining_ms is not None
+        assert r.remaining_ms < 60_000  # less than 1 minute
+
+    def test_short_reset(self):
+        r = parse_claude_usage(FIXTURE_ALMOST_RESET)
+        # 42m = 2520 seconds
+        assert r.remaining_ms == pytest.approx(2_520_000, rel=1e-3)
+
+    def test_no_time_returns_none(self):
+        r = parse_claude_usage(FIXTURE_ERROR)
+        assert r.remaining_ms is None
+        assert r.remaining_label is None
+
+    def test_empty_returns_none(self):
+        r = parse_claude_usage(FIXTURE_EMPTY)
+        assert r.remaining_ms is None
+
+    def test_with_limit_time(self):
+        r = parse_claude_usage(FIXTURE_WITH_LIMIT)
+        # 1h 5m = 3900 seconds
+        assert r.remaining_ms == pytest.approx(3_900_000, rel=1e-3)
+
+    def test_hours_only(self):
+        r = parse_claude_usage(FIXTURE_NO_PCT)
+        # 4h 0m = 14400 seconds
+        assert r.remaining_ms == pytest.approx(14_400_000, rel=1e-3)
+
+    def test_alt_keys_30m(self):
+        r = parse_claude_usage(FIXTURE_ALT_KEYS)
+        # "0h 30m" = 30m = 1800s
+        assert r.remaining_ms == pytest.approx(1_800_000, rel=1e-3)
+
+
+
+class TestParseClaudeUsageWeeklyStats:
+    """Weekly message, token and cost extraction."""
+
+    def test_weekly_messages_no_limit(self):
+        r = parse_claude_usage(FIXTURE_STANDARD)
+        assert r.weekly_messages_used == 234
+        assert r.weekly_messages_limit is None  # no limit shown
+
+    def test_weekly_messages_with_limit(self):
+        # In this fixture the "178 / 500" pair sits in the usage-window
+        # block; the weekly block lists 892 messages without a limit.
+        r = parse_claude_usage(FIXTURE_WITH_LIMIT)
+        assert r.weekly_messages_used == 892
+
+    def test_weekly_tokens(self):
+        r = parse_claude_usage(FIXTURE_STANDARD)
+        # Input + output = 1,234,567 + 456,789 = 1,691,356
+        assert r.weekly_tokens_used == 1_691_356
+
+    def test_weekly_cost(self):
+        r = parse_claude_usage(FIXTURE_STANDARD)
+        assert r.weekly_cost_usd == pytest.approx(4.23, rel=1e-3)
+
+    def test_zero_weekly(self):
+        r = parse_claude_usage(FIXTURE_ZERO_USAGE)
+        assert r.weekly_messages_used == 0
+        assert r.weekly_cost_usd == pytest.approx(0.0)
+
+    def test_no_weekly_returns_none(self):
+        r = parse_claude_usage(FIXTURE_MINIMAL)
+        assert r.weekly_messages_used is None
+        assert r.weekly_cost_usd is None
+
+    def test_alt_keys_weekly_tokens(self):
+        r = parse_claude_usage(FIXTURE_ALT_KEYS)
+        assert r.weekly_tokens_used == 9_876_543
+
+
+
+class TestParseClaudeUsageEdgeCases:
+    """Contract checks: always returns a result, error flag, raw text."""
+
+    def test_returns_dataclass_always(self):
+        """parse_claude_usage never raises — it always returns a result."""
+        for fixture in [
+            FIXTURE_STANDARD, FIXTURE_MINIMAL, FIXTURE_EMPTY,
+            FIXTURE_ERROR, FIXTURE_NOISY, FIXTURE_ALT_KEYS,
+        ]:
+            result = parse_claude_usage(fixture)
+            assert result is not None
+
+    def test_error_field_on_empty(self):
+        r = parse_claude_usage(FIXTURE_EMPTY)
+        assert r.error is not None  # signals "no parseable content"
+
+    def test_no_error_on_good_output(self):
+        r = parse_claude_usage(FIXTURE_STANDARD)
+        assert r.error is None
+
+    def test_raw_text_preserved(self):
+        r = parse_claude_usage(FIXTURE_MINIMAL)
+        assert r.raw_text == FIXTURE_MINIMAL
+
+    def test_messages_comma_separated_numbers(self):
+        """Numbers like 1,234,567 must be parsed correctly."""
+        # Same expectation as test_weekly_tokens; kept to pin comma handling.
+        r = parse_claude_usage(FIXTURE_STANDARD)
+        assert r.weekly_tokens_used == 1_691_356  # 1,234,567 + 456,789