npm - nexo-brain - Versions diffs - 7.32.0 → 7.34.0 - Mend

nexo-brain 7.32.0 → 7.34.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31) hide show

package/.claude-plugin/plugin.json +1 -1
package/README.md +1 -1
package/package.json +1 -1
package/src/consolidation_prep.py +380 -0
package/src/db/__init__.py +5 -1
package/src/db/_episodic.py +32 -0
package/src/db/_memory_v2.py +276 -0
package/src/db/_protocol.py +35 -0
package/src/db/_schema.py +207 -0
package/src/hooks/auto_capture.py +60 -24
package/src/learning_resolver.py +42 -0
package/src/local_context/api.py +237 -33
package/src/local_context/db.py +3 -2
package/src/local_context/usage_events.py +2 -0
package/src/memory_retrieval.py +96 -7
package/src/message_batch_preview.py +290 -0
package/src/plugins/protocol.py +218 -27
package/src/ppr.py +473 -0
package/src/pre_answer_router.py +316 -3
package/src/pre_answer_runtime.py +156 -1
package/src/resolution_cache.py +1119 -0
package/src/scripts/deep-sleep/apply_findings.py +86 -9
package/src/scripts/deep-sleep/rewrite.py +625 -0
package/src/scripts/nexo-deep-sleep.sh +10 -0
package/src/scripts/nexo-followup-runner.py +110 -8
package/src/scripts/nexo-morning-agent.py +43 -2
package/src/scripts/nexo-postmortem-consolidator.py +44 -1
package/src/self_error_detector.py +414 -0
package/src/semantic_layers.py +30 -3
package/templates/core-prompts/morning-agent.md +3 -0
package/templates/core-prompts/postmortem-consolidator.md +29 -2

package/src/learning_resolver.py CHANGED Viewed

@@ -173,6 +173,46 @@ def applies_overlap(left: str, right: str) -> bool:
     return False
+def normalized_key(title: str, applies_to: str = "") -> str:
+    """Stable dedup key for a learning: normalized title + sorted applies scope.
+    Public thin wrapper so callers (e.g. the nightly consolidation brief builder)
+    depend only on the resolver's public surface for dedup math. Two learnings
+    that differ only in casing/whitespace of the title and ordering of applies_to
+    tokens collapse to the same key.
+    Returns ``"<title_key>|<tok1>,<tok2>,..."`` when at least one non-empty scope
+    token remains after normalization, otherwise just ``"<title_key>"``.
+    """
+    title_key = _normalize_text(title)
+    # The set comprehension de-duplicates tokens, subtracting {""} drops tokens
+    # that normalize to the empty string, and sorting makes the key independent
+    # of the order in which applies_to lists its tokens.
+    scope_tokens = sorted(
+        {_normalize_applies_token(item) for item in _split_applies_to(applies_to)} - {""}
+    )
+    if scope_tokens:
+        return f"{title_key}|{','.join(scope_tokens)}"
+    # No usable scope: the key is the normalized title alone (no trailing "|").
+    return title_key
+def candidate_similarity(text_a: str, text_b: str) -> float:
+    """Similarity between two free-text snippets using the resolver's own math.
+    Wraps hybrid_similarity_score with the SAME thresholds used in _similarity
+    (the per-candidate resolution path) so consolidation_prep and the resolver
+    stay in lockstep. Returns 0.0 when either side is empty.
+    Falsy inputs (e.g. None) are coerced to "" and whitespace-only text counts as
+    empty, so hybrid_similarity_score is only called with two non-blank strings.
+    The result is always converted to a plain float.
+    """
+    # `x or ""` maps None/falsy to "", str() tolerates non-string inputs.
+    left = str(text_a or "").strip()
+    right = str(text_b or "").strip()
+    if not left or not right:
+        return 0.0
+    return float(
+        hybrid_similarity_score(
+            left,
+            right,
+            keyword_extractor=extract_keywords,
+            # Per the docstring these must stay identical to the values used in
+            # _similarity; change both places together.
+            strong_semantic_threshold=0.82,
+            moderate_semantic_threshold=0.74,
+            moderate_keyword_floor=0.08,
+        )
+    )
 def _table_columns(conn: sqlite3.Connection, table: str) -> set[str]:
     try:
         return {str(row["name"]) for row in conn.execute(f"PRAGMA table_info({table})").fetchall()}
@@ -413,7 +453,9 @@ __all__ = [
     "CANONICAL_ACTIONS",
     "applies_overlap",
     "authority_rank",
+    "candidate_similarity",
     "looks_contradictory",
     "normalize_authority",
+    "normalized_key",
     "resolve_learning_candidate",
 ]

package/src/local_context/api.py CHANGED Viewed

@@ -50,6 +50,12 @@ INITIAL_INDEX_STARTED_AT_KEY = "initial_index_started_at"
 PERFORMANCE_PROFILE_KEY = "performance_profile"
 DEFAULT_PERFORMANCE_PROFILE = os.environ.get("NEXO_LOCAL_INDEX_PERFORMANCE_PROFILE", "medium").strip().lower() or "medium"
 VALID_CONTEXT_MODES = {"compact", "full"}
+# FTS5 keyword recall over local_chunks. Additive, guarded, reversible.
+# Backfill batch size; 0 disables the incremental backfill entirely.
+# An unset or empty NEXO_LOCAL_FTS_BACKFILL_BATCH falls back to 500.
+# NOTE(review): a non-numeric value makes int() raise ValueError at import time.
+FTS_BACKFILL_BATCH = int(os.environ.get("NEXO_LOCAL_FTS_BACKFILL_BATCH", "500") or "500")
+# State key holding the highest local_chunks rowid already mirrored into FTS.
+FTS_MIGRATION_CURSOR_KEY = "fts_migration_cursor"
+# State key set to "1" once a backfill tick finds no rows past the cursor.
+FTS_MIGRATION_DONE_KEY = "fts_migration_done"
+# State key holding the COUNT(*) snapshot taken on the first backfill tick.
+FTS_BACKFILL_TOTAL_KEY = "fts_backfill_total"
 EMBEDDING_REFRESH_JOB = "embedding_refresh"
 ENTITY_FACTS_JOB = "entity_facts"
 BACKGROUND_INDEX_JOB_TYPES = {ENTITY_FACTS_JOB}
@@ -3541,6 +3547,14 @@ def run_once(
         }
     scan_result = scan_once(limit=effective_scan_limit)
     job_result = process_jobs(limit=effective_process_limit)
+    # Incremental FTS backfill: bounded one-batch-per-tick, after the disk-budget
+    # gate (above) and after process_jobs. Best-effort — never let it break the
+    # cron tick. Skips itself when disabled (batch=0) or already done.
+    if FTS_BACKFILL_BATCH > 0:
+        try:
+            _backfill_fts_rows(conn, batch_limit=FTS_BACKFILL_BATCH)
+        except Exception:
+            pass
     conn_after = _conn()
     initial_after = _initial_scan_status(conn_after, list_roots(readonly=False))
     blocking_active_after = _active_job_count(conn_after, blocking_only=True)
@@ -4109,6 +4123,32 @@ def _status_from_conn(conn, *, readonly: bool = False) -> dict:
         "permissions": [],
         "models": model_status()["models"],
         "support_log_available": True,
+        "fts_recall": _fts_status(conn),
+    }
+def _fts_status(conn) -> dict:
+    """Operator-facing FTS5 backfill progress (so progress can be watched)."""
+    try:
+        done = _get_state_conn(conn, FTS_MIGRATION_DONE_KEY, "0") == "1"
+    except Exception:
+        done = False
+    try:
+        cursor = int(_get_state_conn(conn, FTS_MIGRATION_CURSOR_KEY, "0") or "0")
+    except Exception:
+        cursor = 0
+    try:
+        total = int(_get_state_conn(conn, FTS_BACKFILL_TOTAL_KEY, "0") or "0")
+    except Exception:
+        total = 0
+    return {
+        "enabled": _fts_enabled_env(),
+        "available": _fts_available(conn),
+        "done": done,
+        "cursor": cursor,
+        "total": total,
+        "read_path": "fts" if _fts_ready(conn) else "like",
+        "backfill_batch": FTS_BACKFILL_BATCH,
     }
@@ -4433,6 +4473,136 @@ def _context_prefilter_limit(default: int = 1200) -> int:
     return max(100, min(value, 5000))
+def _fts_enabled_env() -> bool:
+    """Feature flag for the FTS5 read path (default on; set 0/false to roll back).
+    Reads NEXO_LOCAL_CONTEXT_FTS_ENABLED, trimmed and lower-cased. Only the
+    values "0", "false", "no" and "off" disable the flag; anything else,
+    including an unset or empty variable, counts as enabled.
+    """
+    value = os.environ.get("NEXO_LOCAL_CONTEXT_FTS_ENABLED", "1").strip().lower()
+    return value not in {"0", "false", "no", "off"}
+def _fts_available(conn) -> bool:
+    """True if the local_chunks_fts FTS5 vtab exists and MATCH works.
+    Hosts without FTS5 support fall back to a plain shadow table that does NOT
+    support MATCH, so the cheap probe runs a trivial MATCH and catches
+    OperationalError. The probe (a sqlite_master lookup + MATCH LIMIT 0) is fast
+    enough to run inline without caching, which avoids stale per-connection
+    cache bugs across reconnects.
+    Never raises: any exception from either statement yields False.
+    """
+    try:
+        # Step 1: is there any table/view with that name at all?
+        row = conn.execute(
+            "SELECT 1 FROM sqlite_master WHERE type IN ('table','view') AND name='local_chunks_fts' LIMIT 1"
+        ).fetchone()
+        if not row:
+            return False
+        # Trivial MATCH proves this is a real FTS5 vtab (shadow fallback raises).
+        # LIMIT 0 returns no rows; only successful execution matters here.
+        conn.execute(
+            "SELECT rowid FROM local_chunks_fts WHERE local_chunks_fts MATCH ? LIMIT 0",
+            ("nexo_fts_probe",),
+        ).fetchall()
+        return True
+    except sqlite3.OperationalError:
+        return False
+    # Both handlers return False; the generic one covers every other failure.
+    except Exception:
+        return False
+def _fts_ready(conn) -> bool:
+    """The FTS read path is authoritative only when: backfill done AND the
+    feature flag is on AND FTS5 is actually available on this host.
+    The env flag and the state lookup are checked before the MATCH probe, so
+    the probe only runs when the first two conditions already hold.
+    NOTE(review): the _get_state_conn call below is not wrapped in try/except,
+    so any exception it raises propagates to the caller.
+    """
+    if not _fts_enabled_env():
+        return False
+    if _get_state_conn(conn, FTS_MIGRATION_DONE_KEY, "0") != "1":
+        return False
+    return _fts_available(conn)
+def _fts_match_expr(terms: list[str]) -> str:
+    """Build a safe FTS5 MATCH expression from query terms.
+    Each term is double-quoted (FTS5 phrase syntax) with embedded double quotes
+    doubled, neutralizing FTS operators/special chars; terms are OR-joined.
+    Returns '' when there is nothing safe to match.
+    Example: ["foo", 'a"b', "  "] -> '"foo" OR "a""b"' (the blank term is
+    skipped; None entries are skipped the same way).
+    """
+    quoted = []
+    for term in terms:
+        # `term or ""` maps None/falsy to "", then surrounding whitespace is dropped.
+        cleaned = str(term or "").strip()
+        if not cleaned:
+            continue
+        quoted.append('"' + cleaned.replace('"', '""') + '"')
+    # Joining an empty list yields '', which callers treat as "nothing to match".
+    return " OR ".join(quoted)
+def _backfill_fts_rows(conn, *, batch_limit: int | None = None) -> dict:
+    """Incrementally mirror legacy local_chunks rows into local_chunks_fts.
+    Idempotent + resumable: a cursor (max processed rowid) is persisted in
+    local_index_state per batch and committed, so a crash resumes from the last
+    committed rowid. Each row is written as DELETE-then-INSERT keyed by rowid,
+    which makes re-runs safe.
+    When no rows remain past the cursor the done flag is set. Returns a small
+    status dict. NOTE: new chunks written after schema migration already get FTS
+    rows via the local_chunks_fts triggers, so this only handles pre-existing
+    rows (the legacy 19GB DB).
+    Args:
+      conn: SQLite connection whose rows support name-based access (row["rid"]).
+      batch_limit: max rows to mirror in this call; None uses FTS_BACKFILL_BATCH,
+        and a value <= 0 skips the backfill.
+    Returns one of:
+      {"ok": True, "skipped": "disabled" | "fts_unavailable" | "already_done", "done": bool}
+      {"ok": True, "done": True, "processed": 0, "cursor": <int>}    (nothing left)
+      {"ok": True, "done": False, "processed": <n>, "cursor": <int>} (batch written)
+    """
+    if batch_limit is None:
+        batch_limit = FTS_BACKFILL_BATCH
+    batch_limit = int(batch_limit)
+    if batch_limit <= 0:
+        return {"ok": True, "skipped": "disabled", "done": _get_state_conn(conn, FTS_MIGRATION_DONE_KEY, "0") == "1"}
+    if not _fts_available(conn):
+        return {"ok": True, "skipped": "fts_unavailable", "done": False}
+    if _get_state_conn(conn, FTS_MIGRATION_DONE_KEY, "0") == "1":
+        return {"ok": True, "skipped": "already_done", "done": True}
+    # One batch of work; executed through _with_sqlite_busy_retry at the bottom
+    # (presumably retried on a busy/locked database -- confirm in that helper).
+    def _run() -> dict:
+        try:
+            cursor = int(_get_state_conn(conn, FTS_MIGRATION_CURSOR_KEY, "0") or "0")
+        except Exception:
+            # Unreadable/unparsable cursor: restart from rowid 0. Safe because
+            # each row is deleted from the FTS table before being re-inserted.
+            cursor = 0
+        # Snapshot the total once (first backfill tick) so the operator status
+        # surface can show progress without a COUNT(*) on the 19GB table per tick.
+        if _get_state_conn(conn, FTS_BACKFILL_TOTAL_KEY, "") == "":
+            try:
+                total_row = conn.execute("SELECT COUNT(*) AS total FROM local_chunks").fetchone()
+                _set_state_conn(conn, FTS_BACKFILL_TOTAL_KEY, str(int(total_row["total"] or 0)))
+            except Exception:
+                # The total is informational only; never block the backfill on it.
+                pass
+        # Next batch in rowid order. Chunks whose asset row is missing (LEFT JOIN
+        # miss) get the defaults 'normal' / 'active'.
+        rows = conn.execute(
+            """
+            SELECT c.rowid AS rid, c.text AS text,
+                   COALESCE(a.privacy_class, 'normal') AS privacy_class,
+                   COALESCE(a.status, 'active') AS asset_status
+            FROM local_chunks c
+            LEFT JOIN local_assets a ON a.asset_id = c.asset_id
+            WHERE c.rowid > ?
+            ORDER BY c.rowid ASC
+            LIMIT ?
+            """,
+            (cursor, batch_limit),
+        ).fetchall()
+        if not rows:
+            # Nothing past the cursor: mark the migration finished and persist it.
+            _set_state_conn(conn, FTS_MIGRATION_DONE_KEY, "1")
+            conn.commit()
+            return {"ok": True, "done": True, "processed": 0, "cursor": cursor}
+        max_rid = cursor
+        for row in rows:
+            rid = int(row["rid"])
+            # Remove any existing FTS row for this rowid first so a re-run (or a
+            # row already written by the triggers) does not end up duplicated.
+            conn.execute("DELETE FROM local_chunks_fts WHERE rowid = ?", (rid,))
+            conn.execute(
+                """
+                INSERT INTO local_chunks_fts(rowid, text, privacy_class, asset_status)
+                VALUES (?, ?, ?, ?)
+                """,
+                (rid, str(row["text"] or ""), str(row["privacy_class"] or "normal"), str(row["asset_status"] or "active")),
+            )
+            if rid > max_rid:
+                max_rid = rid
+        # Cursor update and the batch's FTS rows are committed together.
+        _set_state_conn(conn, FTS_MIGRATION_CURSOR_KEY, str(max_rid))
+        conn.commit()
+        return {"ok": True, "done": False, "processed": len(rows), "cursor": max_rid}
+    return _with_sqlite_busy_retry(_run)
 def _context_candidate_rows(
     conn,
     entity_asset_ids: list[str],
@@ -4444,39 +4614,73 @@ def _context_candidate_rows(
     prefilter_limit = min(int(base_limit or 5000), _context_prefilter_limit())
     prefilter_rows = []
     if terms:
-        term_clauses = []
-        params: list[str] = []
-        for term in terms:
-            term_clauses.append("(lower(a.path) LIKE ? OR lower(COALESCE(v.summary, '')) LIKE ? OR lower(c.text) LIKE ?)")
-            like = f"%{term}%"
-            params.extend([like, like, like])
-        prefilter_rows = conn.execute(
-            f"""
-            SELECT c.chunk_id, c.asset_id, c.text, a.path, a.file_type, a.privacy_class, v.summary,
-                   e.vector_json, e.model_id, e.model_revision, e.dimension
-            FROM local_chunks c
-            JOIN local_assets a ON a.asset_id = c.asset_id
-            LEFT JOIN local_asset_versions v ON v.version_id = c.version_id
-            LEFT JOIN local_embeddings e ON e.chunk_id = c.chunk_id
-            WHERE a.status='active'
-              AND a.privacy_class='normal'
-              AND ({" OR ".join(term_clauses)})
-            ORDER BY
-              CASE
-                WHEN {" OR ".join("lower(a.path) LIKE ?" for _ in terms)} THEN 0
-                WHEN {" OR ".join("lower(COALESCE(v.summary, '')) LIKE ?" for _ in terms)} THEN 1
-                ELSE 2
-              END,
-              c.created_at DESC
-            LIMIT ?
-            """,
-            [
-                *params,
-                *(f"%{term}%" for term in terms),
-                *(f"%{term}%" for term in terms),
-                prefilter_limit,
-            ],
-        ).fetchall()
+        used_fts = False
+        # DUAL-READ: only take the FTS path once the backfill is done AND the
+        # flag is on AND FTS5 is available. Until then (or on rollback) the
+        # EXACT legacy LIKE path runs, so retrieval is unaffected mid-migration.
+        if _fts_ready(conn):
+            match_expr = _fts_match_expr(terms)
+            if match_expr:
+                try:
+                    prefilter_rows = conn.execute(
+                        """
+                        SELECT c.chunk_id, c.asset_id, c.text, a.path, a.file_type, a.privacy_class, v.summary,
+                               e.vector_json, e.model_id, e.model_revision, e.dimension
+                        FROM local_chunks_fts f
+                        JOIN local_chunks c ON c.rowid = f.rowid
+                        JOIN local_assets a ON a.asset_id = c.asset_id
+                        LEFT JOIN local_asset_versions v ON v.version_id = c.version_id
+                        LEFT JOIN local_embeddings e ON e.chunk_id = c.chunk_id
+                        WHERE local_chunks_fts MATCH ?
+                          AND f.privacy_class='normal'
+                          AND f.asset_status='active'
+                          AND a.status='active'
+                          AND a.privacy_class='normal'
+                        ORDER BY bm25(local_chunks_fts), c.created_at DESC
+                        LIMIT ?
+                        """,
+                        (match_expr, prefilter_limit),
+                    ).fetchall()
+                    used_fts = True
+                except sqlite3.OperationalError:
+                    # Malformed FTS expression (odd user input) -> fall back to
+                    # the legacy LIKE path below instead of erroring the answer.
+                    prefilter_rows = []
+                    used_fts = False
+        if not used_fts:
+            term_clauses = []
+            params: list[str] = []
+            for term in terms:
+                term_clauses.append("(lower(a.path) LIKE ? OR lower(COALESCE(v.summary, '')) LIKE ? OR lower(c.text) LIKE ?)")
+                like = f"%{term}%"
+                params.extend([like, like, like])
+            prefilter_rows = conn.execute(
+                f"""
+                SELECT c.chunk_id, c.asset_id, c.text, a.path, a.file_type, a.privacy_class, v.summary,
+                       e.vector_json, e.model_id, e.model_revision, e.dimension
+                FROM local_chunks c
+                JOIN local_assets a ON a.asset_id = c.asset_id
+                LEFT JOIN local_asset_versions v ON v.version_id = c.version_id
+                LEFT JOIN local_embeddings e ON e.chunk_id = c.chunk_id
+                WHERE a.status='active'
+                  AND a.privacy_class='normal'
+                  AND ({" OR ".join(term_clauses)})
+                ORDER BY
+                  CASE
+                    WHEN {" OR ".join("lower(a.path) LIKE ?" for _ in terms)} THEN 0
+                    WHEN {" OR ".join("lower(COALESCE(v.summary, '')) LIKE ?" for _ in terms)} THEN 1
+                    ELSE 2
+                  END,
+                  c.created_at DESC
+                LIMIT ?
+                """,
+                [
+                    *params,
+                    *(f"%{term}%" for term in terms),
+                    *(f"%{term}%" for term in terms),
+                    prefilter_limit,
+                ],
+            ).fetchall()
     fallback_limit = prefilter_limit if not terms else max(120, min(500, prefilter_limit // 3))
     base_rows = conn.execute(

package/src/local_context/db.py CHANGED Viewed

@@ -8,7 +8,7 @@ from typing import Iterable
 from urllib.parse import quote
 import paths
-from db._schema import _m63_local_context_layer, _m64_local_context_live_dirs
+from db._schema import _m63_local_context_layer, _m64_local_context_live_dirs, _m84_local_chunks_fts
 LOCAL_CONTEXT_DB_NAME = "local-context.db"
 MIGRATION_STATE_KEY = "local_context_db_migrated_from_main"
@@ -118,7 +118,8 @@ def _ensure_schema(conn: sqlite3.Connection) -> None:
     _m64_local_context_live_dirs(conn)
     _ensure_entity_dossier_schema(conn)
     _ensure_local_context_v2_schema(conn)
-    conn.execute("PRAGMA user_version=65")
+    _m84_local_chunks_fts(conn)
+    conn.execute("PRAGMA user_version=84")
     conn.commit()

package/src/local_context/usage_events.py CHANGED Viewed

@@ -352,6 +352,7 @@ def record_router_usage(
     elapsed_ms: int | None = None,
     deadline_ms: int | None = None,
     used_before_response: bool = True,
+    cache_hit: bool = False,
     db_path: str | os.PathLike[str] | None = None,
 ) -> dict[str, Any]:
     evidence_refs = router_payload.get("evidence_refs") or []
@@ -374,6 +375,7 @@ def record_router_usage(
         "escalated_from": router_payload.get("escalated_from") or budget_policy.get("escalated_from") or "",
         "escalated_to": router_payload.get("escalated_to") or budget_policy.get("escalated_to") or "",
         "route_cache_key": budget_policy.get("route_cache_key") or "",
+        "cache_hit": bool(cache_hit or router_payload.get("cache_hit")),
         "max_sources": budget_policy.get("max_sources") or 0,
         "max_source_timeout_ms": budget_policy.get("max_source_timeout_ms") or 0,
         "allowed_sources": budget_policy.get("allowed_sources") or [],

package/src/memory_retrieval.py CHANGED Viewed

@@ -9,12 +9,24 @@ from typing import Any
 from db import (
     build_pre_action_context,
+    get_memory_observations_by_uids,
     list_memory_events,
     list_memory_observations,
     process_memory_observation_queue,
     search_memory_observations_fts,
+    vector_scan_observations,
 )
+# Weight for the semantic (vector) signal when fused with the lexical/FTS score.
+# A strong paraphrase match (high cosine) can carry an observation that the
+# token-overlap score missed entirely, while still ranking below an exact
+# lexical hit on the same query.
+_VECTOR_FUSION_WEIGHT = 0.85
+# Minimum cosine for a semantic-only candidate to survive the relaxed filter.
+# Below this, a vector "match" is noise and must not resurrect an observation
+# that the lexical path already rejected.
+_VECTOR_MIN_SCORE = 0.30
 def _tokens(text: str) -> set[str]:
     return {
@@ -37,6 +49,41 @@ def _score(query: str, text: str, base: float = 0.0) -> float:
     return min(1.0, base + len(overlap) / max(1, len(query_tokens)))
+def _model_is_warm() -> bool:
+    """True only when embedding the query will NOT trigger a cold model load.
+    Decision order:
+      1. cognitive._core cannot be imported -> False.
+      2. cog._model_download_disabled() is truthy -> True (no model is loaded in
+         that mode; _maybe_query_embedding calls it the offline fallback).
+      3. cog._model_download_disabled() raises -> False.
+      4. Otherwise True only if the module attribute ``_model`` is not None.
+    """
+    try:
+        # Imported lazily so a missing/broken cognitive package degrades to False.
+        import cognitive._core as cog
+    except Exception:
+        return False
+    try:
+        if cog._model_download_disabled():
+            return True
+    except Exception:
+        return False
+    # getattr with a default: a module without `_model` is treated as not warm.
+    return getattr(cog, "_model", None) is not None
+def _maybe_query_embedding(query: str):
+    """Embed the query ONCE for semantic fusion, or return None.
+    CRITICAL latency guard: this never loads a cold model. It returns None
+    (degrading to the FTS/token path) unless the deterministic offline fallback
+    is active or the real model is already warm in-process. Any failure also
+    yields None.
+    Returns whatever ``cog.embed`` produces for the stripped query, or None when
+    the query is blank, _model_is_warm() is False, or the import/embed raises.
+    """
+    clean = (query or "").strip()
+    if not clean:
+        return None
+    # Gate BEFORE touching cog.embed so a cold model is never loaded here.
+    if not _model_is_warm():
+        return None
+    try:
+        import cognitive._core as cog
+        return cog.embed(clean)
+    except Exception:
+        # Best-effort: callers treat None as "no semantic signal available".
+        return None
 def _project_hint_values(project_hint: str = "") -> set[str]:
     clean = (project_hint or "").strip()
     if not clean:
@@ -225,6 +272,30 @@ def memory_search(
     ):
         uid = item.get("observation_uid") or f"id:{item.get('id')}"
         observations_by_uid.setdefault(uid, item)
+    # Semantic fusion: embed the query ONCE (only when a model is already warm —
+    # never trigger a cold model load on this latency path) and run a bounded
+    # vector scan over precomputed observation embeddings. Paraphrases that the
+    # lexical/FTS path missed are pulled in here.
+    vector_scores: dict[str, float] = {}
+    if clean_query:
+        query_vector = _maybe_query_embedding(clean_query)
+        if query_vector is not None:
+            for hit in vector_scan_observations(
+                query_vector,
+                limit=max_items * 3,
+                start_ts=start,
+                end_ts=end,
+                min_score=_VECTOR_MIN_SCORE,
+            ):
+                uid = hit.get("observation_uid")
+                if uid:
+                    vector_scores[uid] = float(hit.get("vector_score") or 0.0)
+            # Materialise semantic-only observations the lexical scan did not see.
+            missing_uids = [uid for uid in vector_scores if uid not in observations_by_uid]
+            if missing_uids:
+                for uid, item in get_memory_observations_by_uids(missing_uids).items():
+                    observations_by_uid.setdefault(uid, item)
     observations = list(observations_by_uid.values())
     events = list_memory_events(
         query=clean_query,
@@ -234,12 +305,23 @@ def memory_search(
         end_ts=end,
     )
-    candidates = [
-        _observation_to_candidate(item, clean_query)
-        for item in observations
-        if _within_range(item.get("created_at"), start, end)
-        and _project_matches(item.get("project_key") or "", project_hint)
-    ]
+    candidates = []
+    for item in observations:
+        if not _within_range(item.get("created_at"), start, end):
+            continue
+        if not _project_matches(item.get("project_key") or "", project_hint):
+            continue
+        candidate = _observation_to_candidate(item, clean_query)
+        uid = item.get("observation_uid") or f"id:{item.get('id')}"
+        vector_score = vector_scores.get(uid, 0.0)
+        if vector_score > 0:
+            # Fuse: keep the higher of the lexical score and the weighted vector
+            # signal so a strong paraphrase survives while exact lexical hits
+            # still outrank weak semantic ones.
+            fused = max(float(candidate.get("score") or 0.0), _VECTOR_FUSION_WEIGHT * vector_score)
+            candidate["score"] = round(fused, 4)
+            candidate["vector_score"] = round(vector_score, 4)
+        candidates.append(candidate)
     candidates.extend(
         _event_to_candidate(item, clean_query)
         for item in events
@@ -248,7 +330,14 @@ def memory_search(
     )
     if clean_query:
-        candidates = [item for item in candidates if item.get("score", 0) > 0]
+        # Relaxed filter: a candidate survives if it has a positive lexical score
+        # OR a qualifying semantic (vector) match. Previously the hard score>0
+        # filter dropped semantic-only paraphrase hits before they could rank.
+        candidates = [
+            item
+            for item in candidates
+            if item.get("score", 0) > 0 or item.get("vector_score", 0) > 0
+        ]
     candidates.sort(key=lambda item: (item.get("score", 0), item.get("created_at") or 0), reverse=True)
     candidates = candidates[:max_items]