codex-meter 0.3.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
codex_meter/pricing.py ADDED
@@ -0,0 +1,311 @@
1
+ """Embedded Codex rate card + RateCard resolver (offline-first)."""
2
+
3
+ from __future__ import annotations
4
+
5
+ import json
6
+ from dataclasses import dataclass, replace
7
+ from decimal import Decimal
8
+ from pathlib import Path
9
+
10
+ from codex_meter.models import (
11
+ CostTotals,
12
+ LongContextRule,
13
+ PricingSource,
14
+ Rates,
15
+ Usage,
16
+ decimal_value,
17
+ )
18
+
19
# Input-token count above which the long-context surcharge applies.
LONG_CONTEXT_INPUT_THRESHOLD = 272_000
# Reusable Decimal zero so cost arithmetic never mixes in float literals.
ZERO = Decimal("0")

# Flat-mode fallback prices (per 1M tokens) used when pricing_mode == "flat".
DEFAULT_API_RATES = Rates(input=5.0, cached_input=0.5, output=30.0)
DEFAULT_CREDIT_RATES = Rates(input=125.0, cached_input=12.5, output=750.0)

# Shared long-context rule: past the threshold, input is billed at 2x and
# output at 1.5x (see PRICING_SOURCES for the upstream references).
LONG_CONTEXT_1050K = LongContextRule(
    threshold=LONG_CONTEXT_INPUT_THRESHOLD, input_mult=2.0, output_mult=1.5
)
28
+
29
+
30
@dataclass(frozen=True)
class ModelCard:
    """One Codex model's pricing. Missing rates are intentionally unpriced."""

    # Canonical (normalized) model name, e.g. "gpt-5.5".
    name: str
    # Dollars per 1M tokens on the API meter; None means no known API price.
    api_rates: Rates | None
    # Credits per 1M tokens on the subscription meter; None means unpriced.
    credit_rates: Rates | None
    # Credit multiplier applied when the service tier resolves to "fast".
    fast_multiplier: float = 1.0
    # Optional surcharge rule for requests past the long-context threshold.
    long_context: LongContextRule | None = None
39
+
40
+
41
# Embedded rate card, checked against the sources listed in PRICING_SOURCES.
# A None rates field deliberately marks that meter as unpriced for the model.
MODEL_CARDS: tuple[ModelCard, ...] = (
    ModelCard(
        name="gpt-5.5",
        api_rates=Rates(5.0, 0.5, 30.0),
        credit_rates=Rates(125.0, 12.5, 750.0),
        fast_multiplier=2.5,
        long_context=LONG_CONTEXT_1050K,
    ),
    ModelCard(
        name="gpt-5.4",
        api_rates=Rates(2.5, 0.25, 15.0),
        credit_rates=Rates(62.5, 6.25, 375.0),
        fast_multiplier=2.0,
        long_context=LONG_CONTEXT_1050K,
    ),
    ModelCard(
        name="gpt-5.4-mini",
        api_rates=Rates(0.75, 0.075, 4.5),
        credit_rates=Rates(18.75, 1.875, 113.0),
    ),
    ModelCard(
        name="gpt-5.3-codex",
        api_rates=Rates(1.75, 0.175, 14.0),
        credit_rates=Rates(43.75, 4.375, 350.0),
    ),
    ModelCard(
        name="gpt-5.2",
        api_rates=Rates(1.75, 0.175, 14.0),
        credit_rates=Rates(43.75, 4.375, 350.0),
    ),
    ModelCard(
        name="gpt-5.1-codex-max",
        # API-only pricing: no credit price is published for this model.
        api_rates=Rates(1.25, 0.125, 10.0),
        credit_rates=None,
    ),
)

# Fast lookup from canonical model name to its card.
MODELS_BY_NAME: dict[str, ModelCard] = {card.name: card for card in MODEL_CARDS}
79
+
80
# Provenance for the embedded rate card: each entry records the public page
# the numbers were taken from and the date they were last checked.
PRICING_SOURCES = [
    PricingSource(
        name="OpenAI API pricing",
        url="https://developers.openai.com/api/docs/pricing",
        checked="2026-05-13",
    ),
    PricingSource(
        name="GPT-5.5 model pricing and long-context rule",
        url="https://developers.openai.com/api/docs/models/gpt-5.5",
        checked="2026-05-13",
    ),
    PricingSource(
        name="GPT-5.4 model pricing and long-context rule",
        url="https://developers.openai.com/api/docs/models/gpt-5.4",
        checked="2026-05-13",
    ),
    PricingSource(
        name="Codex rate card",
        url="https://help.openai.com/en/articles/20001106-codex-rate-card",
        checked="2026-05-13",
    ),
    PricingSource(
        name="Codex fast mode multipliers",
        url="https://developers.openai.com/codex/speed",
        checked="2026-05-13",
    ),
    PricingSource(
        name="GPT-5.1-Codex-Max model pricing",
        url="https://developers.openai.com/api/docs/models/gpt-5.1-codex-max",
        checked="2026-05-13",
    ),
]
112
+
113
+
114
def normalize_model(model: str | None) -> str:
    """Map a raw model string (possibly dated or suffixed) to a canonical name."""
    candidate = (model or "").strip().lower()
    if not candidate:
        return ""
    # Alias families that have both dotted and dashed spellings; checked before
    # the generic card lookup. Order matters: "-spark" precedes its prefix.
    alias_map = {
        "gpt-5.4-mini": ("gpt-5.4-mini", "gpt-5-4-mini"),
        "gpt-5.3-codex-spark": ("gpt-5.3-codex-spark", "gpt-5-3-codex-spark"),
        "gpt-5.3-codex": ("gpt-5.3-codex", "gpt-5-3-codex"),
        "gpt-5.1-codex-max": ("gpt-5.1-codex-max", "gpt-5-1-codex-max"),
    }
    for canonical, spellings in alias_map.items():
        exact = candidate in spellings
        dated = any(candidate.startswith(spelling + "-") for spelling in spellings)
        if exact or dated:
            return canonical
    # Fall back to known cards, longest names first so more specific variants
    # (e.g. "-mini") win over their prefixes.
    for known in sorted(MODELS_BY_NAME, key=len, reverse=True):
        if candidate == known or candidate.startswith(known + "-"):
            return known
    # Unknown model: return it normalized so callers can still report it.
    return candidate
131
+
132
+
133
def normalize_service_tier(value: str | None) -> str:
    """Collapse a raw service-tier string to "fast", "standard", or ""."""
    tier = (value or "").strip().lower()
    if tier in ("fast", "priority"):
        return "fast"
    if tier in ("standard", "default", "regular"):
        return "standard"
    # Unknown or empty tier: signal "no tier information".
    return ""
140
+
141
+
142
def _parse_overrides(raw: object, section: str) -> dict[str, Rates]:
    """Parse one section ("api" or "credits") of a local rates-override file.

    Returns a mapping of normalized model name -> Rates. A non-dict top level
    yields no overrides (best-effort); malformed entries raise ValueError so
    RateCard.load surfaces a single, consistent error type to callers.
    """
    if not isinstance(raw, dict):
        return {}
    values = raw.get(section, {})
    if not isinstance(values, dict):
        raise ValueError(f"rates file section {section!r} must be an object")
    parsed: dict[str, Rates] = {}
    for model, item in values.items():
        if not isinstance(item, dict):
            raise ValueError(f"rates for {model!r} must be an object")
        # Previously a missing required key escaped as a bare KeyError with an
        # opaque message; report it as a ValueError like every other
        # malformation in this parser.
        missing = [key for key in ("input", "cached_input", "output") if key not in item]
        if missing:
            raise ValueError(
                f"rates for {model!r} missing required key(s): {', '.join(missing)}"
            )
        # "reasoning_output" is optional; None means "use the default".
        reasoning_raw = item.get("reasoning_output")
        parsed[normalize_model(model)] = Rates(
            input=decimal_value(item["input"]),
            cached_input=decimal_value(item["cached_input"]),
            output=decimal_value(item["output"]),
            reasoning_output=decimal_value(reasoning_raw) if reasoning_raw is not None else None,
        )
    return parsed
160
+
161
+
162
@dataclass(frozen=True)
class RateCard:
    """Per-run rate resolver. Loads any local overrides exactly once."""

    # Per-model Rates overriding the embedded API dollar prices.
    api_overrides: dict[str, Rates]
    # Per-model Rates overriding the embedded credit prices.
    credit_overrides: dict[str, Rates]
    # "flat" prices everything with the DEFAULT_* rates; any other value
    # (typically "model") uses the per-model cards.
    pricing_mode: str

    @classmethod
    def load(cls, path: Path | None, pricing_mode: str = "model") -> RateCard:
        """Build a RateCard, reading JSON overrides from *path* when given.

        Raises ValueError when the file is unreadable or not valid JSON.
        """
        if path is None:
            return cls(api_overrides={}, credit_overrides={}, pricing_mode=pricing_mode)
        try:
            raw = json.loads(path.expanduser().read_text())
        except (OSError, json.JSONDecodeError) as exc:
            raise ValueError(f"Could not read rates file {path}: {exc}") from exc
        return cls(
            api_overrides=_parse_overrides(raw, "api"),
            credit_overrides=_parse_overrides(raw, "credits"),
            pricing_mode=pricing_mode,
        )

    def cost_for(
        self, usage: Usage, model: str, service_tier: str
    ) -> tuple[CostTotals, bool, bool]:
        """Price one usage event.

        Returns (totals, long_context_applied, model_unknown); model_unknown is
        True only when there is no card AND both meters ended up unpriced.
        """
        normalized = normalize_model(model)
        flat = self.pricing_mode == "flat"
        card = MODELS_BY_NAME.get(normalized)
        # Long-context surcharges never apply in flat mode.
        rule = card.long_context if (card and not flat) else None
        long_context = rule is not None and usage.input_tokens > rule.threshold
        input_mult = decimal_value(rule.input_mult if long_context and rule else 1)
        output_mult = decimal_value(rule.output_mult if long_context and rule else 1)
        billable_usage, ambiguous_reasoning = _billable_usage(usage)
        api_rates, api_unpriced, api_local = self._resolve_api_rates(normalized, card, flat)
        credit_rates, credit_unpriced, credit_local = self._resolve_credit_rates(
            normalized, card, flat
        )
        standard_credits = _estimate(billable_usage, credit_rates, input_mult, output_mult)
        adjusted_credits = standard_credits
        # Flat-mode numbers are always estimates by definition.
        estimated = flat
        if service_tier == "fast" and card is not None and credit_rates is not None:
            # Known card on the fast tier: apply its credit multiplier.
            adjusted_credits = standard_credits * decimal_value(card.fast_multiplier)
        elif service_tier == "fast" and credit_rates is not None:
            # Fast tier without a card: no multiplier is known, flag as estimate.
            estimated = True
        return (
            CostTotals(
                api_dollars=_estimate(billable_usage, api_rates, input_mult, output_mult),
                standard_credits=standard_credits,
                adjusted_credits=adjusted_credits,
                api_unpriced_events=int(api_unpriced),
                credit_unpriced_events=int(credit_unpriced),
                estimated_events=int(estimated),
                ambiguous_reasoning_events=int(ambiguous_reasoning),
                local_override_events=int(api_local or credit_local),
            ),
            long_context,
            card is None and api_unpriced and credit_unpriced,
        )

    def cache_savings_for(self, usage: Usage, model: str, service_tier: str) -> CostTotals:
        """Estimate what caching saved: cost(uncached) - cost(actual), floored at 0."""
        if not usage.cached_input_tokens:
            return CostTotals()
        # Re-price the same event as if no input had been cached.
        uncached_usage = replace(usage, cached_input_tokens=0)
        uncached_cost, _, _ = self.cost_for(uncached_usage, model, service_tier)
        actual_cost, _, _ = self.cost_for(usage, model, service_tier)
        return CostTotals(
            api_dollars=max(ZERO, uncached_cost.api_dollars - actual_cost.api_dollars),
            standard_credits=max(
                ZERO, uncached_cost.standard_credits - actual_cost.standard_credits
            ),
            adjusted_credits=max(
                ZERO, uncached_cost.adjusted_credits - actual_cost.adjusted_credits
            ),
            # Event flags are max()ed so a flag raised on either leg survives.
            api_unpriced_events=max(
                uncached_cost.api_unpriced_events, actual_cost.api_unpriced_events
            ),
            credit_unpriced_events=max(
                uncached_cost.credit_unpriced_events, actual_cost.credit_unpriced_events
            ),
            estimated_events=max(uncached_cost.estimated_events, actual_cost.estimated_events),
            ambiguous_reasoning_events=max(
                uncached_cost.ambiguous_reasoning_events,
                actual_cost.ambiguous_reasoning_events,
            ),
            local_override_events=max(
                uncached_cost.local_override_events, actual_cost.local_override_events
            ),
        )

    def _resolve_api_rates(
        self, normalized: str, card: ModelCard | None, flat: bool
    ) -> tuple[Rates | None, bool, bool]:
        """Return (rates, unpriced, local_override) for the API dollar meter.

        Precedence: flat default > local override > embedded card > unpriced.
        """
        if flat:
            return DEFAULT_API_RATES, False, False
        if normalized in self.api_overrides:
            return self.api_overrides[normalized], False, True
        if card and card.api_rates is not None:
            return card.api_rates, False, False
        return None, True, False

    def _resolve_credit_rates(
        self, normalized: str, card: ModelCard | None, flat: bool
    ) -> tuple[Rates | None, bool, bool]:
        """Return (rates, unpriced, local_override) for the credit meter.

        Same precedence as _resolve_api_rates, over the credit tables.
        """
        if flat:
            return DEFAULT_CREDIT_RATES, False, False
        if normalized in self.credit_overrides:
            return self.credit_overrides[normalized], False, True
        if card and card.credit_rates is not None:
            return card.credit_rates, False, False
        return None, True, False
272
+
273
+
274
+ def _billable_usage(usage: Usage) -> tuple[Usage, bool]:
275
+ reasoning = usage.reasoning_output_tokens
276
+ if not reasoning:
277
+ return usage, False
278
+ total_with_reasoning_in_output = usage.input_tokens + usage.output_tokens
279
+ total_with_reasoning_separate = usage.input_tokens + usage.output_tokens + reasoning
280
+ if usage.total_tokens == total_with_reasoning_in_output:
281
+ return replace(usage, reasoning_output_tokens=0), False
282
+ if usage.total_tokens == total_with_reasoning_separate:
283
+ return usage, False
284
+ return replace(usage, reasoning_output_tokens=0), True
285
+
286
+
287
def _estimate(
    usage: Usage, rates: Rates | None, input_mult: Decimal, output_mult: Decimal
) -> Decimal:
    """Price *usage* against per-1M-token *rates*; ZERO when rates are missing."""
    if rates is None:
        return ZERO
    # Long-context multipliers scale the input side and the output side.
    input_part = decimal_value(usage.uncached_input_tokens) * rates.input * input_mult
    cached_part = decimal_value(usage.cached_input_tokens) * rates.cached_input * input_mult
    output_part = decimal_value(usage.output_tokens) * rates.output * output_mult
    reasoning_part = (
        decimal_value(usage.reasoning_output_tokens)
        * rates.effective_reasoning_output
        * output_mult
    )
    total = input_part + cached_part + output_part + reasoning_part
    # Prices are quoted per 1M tokens.
    return total / Decimal("1000000")
300
+
301
+
302
def estimate_event_cost(
    usage: Usage,
    model: str,
    service_tier: str,
    pricing_mode: str,
    rates_file: Path | None = None,
) -> tuple[CostTotals, bool, bool]:
    """Single-event pricing. Builds a fresh RateCard — prefer caching one per run."""
    rate_card = RateCard.load(rates_file, pricing_mode)
    return rate_card.cost_for(usage, model, service_tier)
@@ -0,0 +1,116 @@
1
+ """Prometheus exporter. Opt-in via the `[prom]` extra.
2
+
3
+ Why a separate module? `prometheus_client` is an optional dependency. Importing
4
+ this module triggers the dependency check; the rest of codex-meter stays import-clean.
5
+ """
6
+
7
+ from __future__ import annotations
8
+
9
+ import http.server
10
+ from collections.abc import Callable
11
+ from dataclasses import dataclass, field
12
+
13
+ try:
14
+ from prometheus_client import CollectorRegistry, Gauge, generate_latest
15
+ except ImportError as exc: # pragma: no cover - import guard tested via integration only
16
+ raise ImportError(
17
+ "prometheus-client is not installed. Install with: pip install 'codex-meter[prom]'"
18
+ ) from exc
19
+
20
+
21
# Prometheus text exposition format 0.0.4 content type for HTTP responses.
PROM_CONTENT_TYPE = "text/plain; version=0.0.4; charset=utf-8"


@dataclass(frozen=True)
class MetricsSnapshot:
    """Point-in-time metric values rendered as one /metrics payload."""

    # Adjusted credits consumed in the current rolling window.
    credits_used: float
    # Burn rate, in credits per hour.
    burn_per_hour: float
    # Rate-limit window usage percentages (0..100).
    primary_window_percent: float
    secondary_window_percent: float
    # Token-count events observed in the current window.
    events_total: int
    # Events whose input exceeded the long-context threshold.
    long_context_events_total: int
    # (model, tier, kind) -> token count; kind is input|cached|output|reasoning.
    tokens_total: dict[tuple[str, str, str], int] = field(default_factory=dict)
33
+
34
+
35
def build_metrics_text(snapshot: MetricsSnapshot) -> bytes:
    """Render a Prometheus text-format payload from a snapshot.

    A fresh CollectorRegistry per call keeps the payload self-contained.
    Registration order is preserved, since generate_latest emits metrics in
    the order they were registered.
    """
    registry = CollectorRegistry()

    def scalar(metric_name: str, help_text: str, value: float) -> None:
        # Register-and-set helper for unlabeled gauges.
        Gauge(metric_name, help_text, registry=registry).set(value)

    scalar(
        "codex_meter_credits_used",
        "Adjusted credits in the current rolling window.",
        snapshot.credits_used,
    )
    scalar(
        "codex_meter_burn_per_hour",
        "Burn rate (credits per hour) for the active window.",
        snapshot.burn_per_hour,
    )

    window_gauge = Gauge(
        "codex_meter_window_used_percent",
        "Rate-limit window used percent (0..100).",
        ["window"],
        registry=registry,
    )
    window_gauge.labels(window="primary").set(snapshot.primary_window_percent)
    window_gauge.labels(window="secondary").set(snapshot.secondary_window_percent)

    token_gauge = Gauge(
        "codex_meter_tokens_total",
        "Token counts by model, tier, and kind (input|cached|output|reasoning).",
        ["model", "tier", "kind"],
        registry=registry,
    )
    for (model, tier, kind), count in snapshot.tokens_total.items():
        token_gauge.labels(model=model, tier=tier, kind=kind).set(count)

    scalar(
        "codex_meter_events_total",
        "Token-count events observed in the current window.",
        snapshot.events_total,
    )
    scalar(
        "codex_meter_long_context_events_total",
        "Long-context events (>=threshold input tokens) observed in the current window.",
        snapshot.long_context_events_total,
    )

    return generate_latest(registry)
85
+
86
+
87
def make_handler(snapshot_fn: Callable[[], MetricsSnapshot]):
    """Build a BaseHTTPRequestHandler subclass that exposes /metrics.

    The snapshot callable is re-invoked on every GET, so each scrape sees
    fresh values.
    """

    class Handler(http.server.BaseHTTPRequestHandler):
        def do_GET(self):  # noqa: N802 — HTTPServer naming convention
            if self.path == "/metrics":
                payload = build_metrics_text(snapshot_fn())
                self.send_response(200)
                self.send_header("Content-Type", PROM_CONTENT_TYPE)
                self.send_header("Content-Length", str(len(payload)))
                self.end_headers()
                self.wfile.write(payload)
            else:
                self.send_error(404, "Only /metrics is exported")

        def log_message(self, fmt: str, *args: object) -> None:
            # Suppress the default per-request stderr logging.
            return

    return Handler
106
+
107
+
108
def serve_forever(host: str, port: int, snapshot_fn: Callable[[], MetricsSnapshot]) -> None:
    """Bind and serve /metrics until interrupted. Default bind is 127.0.0.1."""
    httpd = http.server.ThreadingHTTPServer((host, port), make_handler(snapshot_fn))
    try:
        httpd.serve_forever()
    except KeyboardInterrupt:
        # Ctrl-C is a normal shutdown path, not an error.
        pass
    finally:
        # Always release the listening socket.
        httpd.server_close()
codex_meter/py.typed ADDED
File without changes