npm - @misterhuydo/sentinel - Versions diffs - 1.4.68 → 1.4.70 - Mend

@misterhuydo/sentinel 1.4.68 → 1.4.70

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (29) hide show

package/.cairn/.hint-lock +1 -1
package/.cairn/session.json +2 -2
package/lib/.cairn/minify-map.json +3 -3
package/lib/.cairn/views/fb78ac_upgrade.js +16 -1
package/lib/add.js +30 -16
package/lib/generate.js +6 -1
package/package.json +1 -1
package/python/scripts/fix_ask_codebase_context.py +249 -0
package/python/scripts/fix_ask_codebase_stdin.py +49 -0
package/python/scripts/fix_chain_slack.py +67 -0
package/python/scripts/fix_fstring.py +51 -0
package/python/scripts/fix_knowledge_cache.py +323 -0
package/python/scripts/fix_knowledge_cache_staleness.py +294 -0
package/python/scripts/fix_merge_confirm.py +295 -0
package/python/scripts/fix_permission_messages.py +78 -0
package/python/scripts/fix_pr_check_head_detect.py +84 -0
package/python/scripts/fix_pr_msg_newlines.py +57 -0
package/python/scripts/fix_pr_tracking_boss.py +265 -0
package/python/scripts/fix_pr_tracking_db.py +212 -0
package/python/scripts/fix_pr_tracking_main.py +174 -0
package/python/scripts/fix_project_isolation.py +197 -0
package/python/scripts/fix_system_prompt.py +444 -0
package/python/scripts/fix_two_bugs.py +220 -0
package/python/scripts/patch_chain_release.py +236 -0
package/python/sentinel/cicd_trigger.py +125 -16
package/python/sentinel/dependency_manager.py +129 -18
package/python/sentinel/git_manager.py +46 -12
package/python/sentinel/notify.py +34 -0
package/python/sentinel/sentinel_boss.py +4139 -3326

package/python/scripts/fix_project_isolation.py ADDED Viewed

@@ -0,0 +1,197 @@
+#!/usr/bin/env python3
+"""
+Project isolation + identity:
+1. Add SLACK_WORKSPACE_ID + PROJECT_DESCRIPTION to config_loader
+2. Verify workspace_id on every incoming Slack event in slack_bot.py
+3. Inject project identity + scope isolation into the runtime system prompt
+4. Boss refuses cross-project requests by design
+"""
+import ast, sys
+CODE = '/home/sentinel/sentinel/code/sentinel'
+# ── 1. Add fields to SentinelConfig in config_loader.py ──────────────────────
+with open(f'{CODE}/config_loader.py', 'r', encoding='utf-8') as f:
+    cfg_src = f.read()
+OLD_CFG = '''    project_name: str = ""           # optional: friendly name used by Sentinel Boss (e.g. "1881")'''
+NEW_CFG = '''    project_name: str = ""           # optional: friendly name used by Sentinel Boss (e.g. "1881")
+    project_description: str = ""    # short description of what this project is/does
+    slack_workspace_id: str = ""     # Slack team_id (T...) — if set, reject events from other workspaces'''
+if OLD_CFG not in cfg_src:
+    print("ERROR: project_name field not found in config_loader")
+    sys.exit(1)
+cfg_src = cfg_src.replace(OLD_CFG, NEW_CFG, 1)
+OLD_LOAD = '''        c.project_name = d.get("PROJECT_NAME", "") or Path(self.config_dir).resolve().parent.name'''
+NEW_LOAD = '''        c.project_name        = d.get("PROJECT_NAME", "") or Path(self.config_dir).resolve().parent.name
+        c.project_description = d.get("PROJECT_DESCRIPTION", "")
+        c.slack_workspace_id  = d.get("SLACK_WORKSPACE_ID", "").strip()'''
+if OLD_LOAD not in cfg_src:
+    print("ERROR: project_name load line not found in config_loader")
+    sys.exit(1)
+cfg_src = cfg_src.replace(OLD_LOAD, NEW_LOAD, 1)
+with open(f'{CODE}/config_loader.py', 'w', encoding='utf-8') as f:
+    f.write(cfg_src)
+try:
+    ast.parse(cfg_src)
+    print("Step 1 OK: SLACK_WORKSPACE_ID + PROJECT_DESCRIPTION added to config")
+except SyntaxError as e:
+    print(f"SyntaxError config_loader line {e.lineno}: {e.msg}"); sys.exit(1)
+# ── 2. Workspace verification in slack_bot.py ─────────────────────────────────
+with open(f'{CODE}/slack_bot.py', 'r', encoding='utf-8') as f:
+    bot_src = f.read()
+# Inject workspace check right after the user_id / allowlist check in _dispatch
+OLD_DISPATCH_CHECK = '''    # Allowlist check — if SLACK_ALLOWED_USERS is configured, silently ignore everyone else
+    allowed = cfg_loader.sentinel.slack_allowed_users
+    if allowed and user_id not in allowed:
+        logger.warning("Boss: ignoring message from unauthorised user %s", user_id)
+        return'''
+NEW_DISPATCH_CHECK = '''    # Workspace isolation — if SLACK_WORKSPACE_ID is set, reject events from other workspaces
+    expected_workspace = cfg_loader.sentinel.slack_workspace_id
+    if expected_workspace:
+        event_team = event.get("team") or event.get("team_id", "")
+        if event_team and event_team != expected_workspace:
+            logger.warning(
+                "Boss: ignoring event from workspace %s (expected %s) — user %s",
+                event_team, expected_workspace, user_id,
+            )
+            return
+    # Allowlist check — if SLACK_ALLOWED_USERS is configured, silently ignore everyone else
+    allowed = cfg_loader.sentinel.slack_allowed_users
+    if allowed and user_id not in allowed:
+        logger.warning("Boss: ignoring message from unauthorised user %s", user_id)
+        return'''
+if OLD_DISPATCH_CHECK not in bot_src:
+    print("ERROR: allowlist check anchor not found in slack_bot")
+    sys.exit(1)
+bot_src = bot_src.replace(OLD_DISPATCH_CHECK, NEW_DISPATCH_CHECK, 1)
+with open(f'{CODE}/slack_bot.py', 'w', encoding='utf-8') as f:
+    f.write(bot_src)
+try:
+    ast.parse(bot_src)
+    print("Step 2 OK: workspace isolation check added to slack_bot._dispatch")
+except SyntaxError as e:
+    print(f"SyntaxError slack_bot line {e.lineno}: {e.msg}"); sys.exit(1)
+# ── 3. Inject project identity into the runtime system prompt ─────────────────
+with open(f'{CODE}/sentinel_boss.py', 'r', encoding='utf-8') as f:
+    boss = f.read()
+# Update _resolve_system to accept project context and prepend it
+OLD_RESOLVE = '''def _resolve_system(boss_mode: str = "standard") -> str:
+    hint = _BOSS_MODE_HINTS.get(boss_mode, _BOSS_MODE_HINTS["standard"])
+    return _SYSTEM.replace("{BOSS_MODE_HINT}", hint)'''
+NEW_RESOLVE = '''def _resolve_system(boss_mode: str = "standard",
+                    project_name: str = "",
+                    project_description: str = "",
+                    other_project_names: list | None = None) -> str:
+    """Build the system prompt, prepending a project-identity block."""
+    hint = _BOSS_MODE_HINTS.get(boss_mode, _BOSS_MODE_HINTS["standard"])
+    base = _SYSTEM.replace("{BOSS_MODE_HINT}", hint)
+    if not project_name:
+        return base
+    # Project identity header — injected at the very top
+    desc_line = f"\\nProject description: {project_description}" if project_description else ""
+    others = [n for n in (other_project_names or []) if n.lower() != project_name.lower()]
+    if others:
+        scope_line = (
+            f"\\n\\nSCOPE ISOLATION (important): You serve ONLY the {project_name} project. "
+            f"This Sentinel host also runs instances for: {', '.join(others)}. "
+            f"If a user asks about {', '.join(others)} or any other project not in your repos, "
+            f"decline and explain you are scoped to {project_name} only. "
+            f"Never expose config, logs, errors, or code from other projects."
+        )
+    else:
+        scope_line = (
+            f"\\n\\nSCOPE: You serve ONLY the {project_name} project. "
+            f"Decline requests about projects or repos you do not manage."
+        )
+    identity = (
+        f"PROJECT IDENTITY\\n"
+        f"You are Sentinel Boss for: {project_name}{desc_line}"
+        f"{scope_line}\\n"
+        f"{'=' * 60}\\n\\n"
+    )
+    return identity + base'''
+if OLD_RESOLVE not in boss:
+    print("ERROR: _resolve_system not found in boss")
+    sys.exit(1)
+boss = boss.replace(OLD_RESOLVE, NEW_RESOLVE, 1)
+print("Step 3a OK: _resolve_system updated to accept project context")
+# Update both call sites of _resolve_system to pass project + other-projects context
+# There are two call sites (CLI mode ~3711 and API mode ~3910)
+# We'll update the API mode one first — it has access to cfg_loader
+OLD_SYSTEM_CALL_API = '''    system = (
+        _resolve_system(getattr(cfg_loader.sentinel, "boss_mode", "standard"))'''
+NEW_SYSTEM_CALL_API = '''    _known_projects = [_read_project_name(d) for d in _find_project_dirs()]
+    system = (
+        _resolve_system(
+            boss_mode=getattr(cfg_loader.sentinel, "boss_mode", "standard"),
+            project_name=cfg_loader.sentinel.project_name or _read_project_name(Path(".")),
+            project_description=getattr(cfg_loader.sentinel, "project_description", ""),
+            other_project_names=_known_projects,
+        )'''
+if OLD_SYSTEM_CALL_API not in boss:
+    print("ERROR: API system prompt call not found")
+    sys.exit(1)
+boss = boss.replace(OLD_SYSTEM_CALL_API, NEW_SYSTEM_CALL_API, 1)
+print("Step 3b OK: API-mode system prompt passes project identity")
+# CLI fallback mode
+OLD_SYSTEM_CALL_CLI = '''        _resolve_system(getattr(cfg_loader.sentinel, "boss_mode", "standard"))
+        + (f"\\nYou are speaking with: {user_name}'''
+NEW_SYSTEM_CALL_CLI = '''        _resolve_system(
+            boss_mode=getattr(cfg_loader.sentinel, "boss_mode", "standard"),
+            project_name=cfg_loader.sentinel.project_name or _read_project_name(Path(".")),
+            project_description=getattr(cfg_loader.sentinel, "project_description", ""),
+            other_project_names=[_read_project_name(d) for d in _find_project_dirs()],
+        )
+        + (f"\\nYou are speaking with: {user_name}'''
+if OLD_SYSTEM_CALL_CLI not in boss:
+    print("ERROR: CLI system prompt call not found")
+    sys.exit(1)
+boss = boss.replace(OLD_SYSTEM_CALL_CLI, NEW_SYSTEM_CALL_CLI, 1)
+print("Step 3c OK: CLI-mode system prompt passes project identity")
+with open(f'{CODE}/sentinel_boss.py', 'w', encoding='utf-8') as f:
+    f.write(boss)
+try:
+    ast.parse(boss)
+    print("Step 3 OK: sentinel_boss.py Syntax OK")
+except SyntaxError as e:
+    lines = boss.splitlines()
+    print(f"SyntaxError line {e.lineno}: {e.msg}")
+    for i in range(max(0, e.lineno-4), min(len(lines), e.lineno+3)):
+        print(f"  {i+1}: {lines[i]}")
+    sys.exit(1)
+print("\nAll steps complete.")
+print("Add to each project's sentinel.properties:")
+print("  PROJECT_NAME=1881")
+print("  PROJECT_DESCRIPTION=Norwegian directory services and telecom platform")
+print("  SLACK_WORKSPACE_ID=T01234ABCD   # Slack team_id for workspace verification")

package/python/scripts/fix_system_prompt.py ADDED Viewed

@@ -0,0 +1,444 @@
+#!/usr/bin/env python3
+"""
+Rewrite the _SYSTEM prompt so Boss has complete self-knowledge:
+- Every tool listed with description + usage example
+- Grouped capability summary (for "what can you do?" queries)
+- PR tracking workflow
+- Release management workflow
+- Infrastructure / config / usage Q&A guidance
+"""
+import ast, sys
+BOSS = '/home/sentinel/sentinel/code/sentinel/sentinel_boss.py'
+with open(BOSS, 'r', encoding='utf-8') as f:
+    boss = f.read()
+# Find the _SYSTEM string boundaries
+START = '_SYSTEM = """\\\n'
+END   = '\n{BOSS_MODE_HINT}\n'
+start_idx = boss.find(START)
+end_idx   = boss.find(END)
+if start_idx == -1 or end_idx == -1:
+    print(f"ERROR: _SYSTEM boundaries not found (start={start_idx}, end={end_idx})")
+    sys.exit(1)
+# The content to replace is everything from after the opening """ to before {BOSS_MODE_HINT}
+content_start = start_idx + len(START)
+content_end   = end_idx
+old_content = boss[content_start:content_end]
+print(f"Replacing {len(old_content)} chars of system prompt")
+NEW_CONTENT = r"""You are Sentinel Boss — the AI interface for Sentinel, a 24/7 autonomous DevOps agent.
+Sentinel watches production logs, detects errors, generates code fixes via Claude Code,
+and opens GitHub PRs for admin review (or pushes directly if AUTO_PUBLISH=true).
+Your job:
+- Understand what the DevOps engineer needs in natural language
+- Query Sentinel's live state (errors, fixes, open PRs) on their behalf
+- Deliver tasks/issues to this project — you are scoped exclusively to this project
+- Control Sentinel (pause/resume) when asked
+- Give honest, concise answers — you know this system inside out
+- Answer any question about how Sentinel works, how to configure it, or how to use it
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+COMPLETE TOOL REFERENCE
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+── Monitoring & Status ────────────────────────────────────────────────────────
+ 1. get_status          Show errors detected, fixes applied/pending/failed, open PRs.
+                        "what happened today?", "any issues?", "show open PRs"
+ 2. get_repo_status     Per-repo git branch, last commit, and fix branches.
+                        "status of Whydah-TypeLib", "what branch is cairn on?"
+ 3. list_recent_commits Recent commits in a repo (including Sentinel auto-fixes).
+                        "show me recent commits in Java-SDK", "what did Sentinel commit?"
+ 4. check_auth_status   Claude auth health, rate-limit circuit state, fix engine stats.
+                        "is Claude working?", "any rate limits?", "auth issues?"
+ 5. list_projects       All configured repos and log sources in this Sentinel instance.
+                        "what repos are you watching?", "list all services"
+── Log Management ─────────────────────────────────────────────────────────────
+ 6. fetch_logs          Run fetch_log.sh on demand — pull fresh logs from servers now.
+                        Supports --debug and parameter overrides.
+                        "fetch logs", "fetch logs for SSOLWA", "fetch without filter"
+ 7. search_logs         Live SSH grep on production servers using GREP_FILTER.
+                        Falls back to cached files if SSH unavailable.
+                        "search logs for illegal PIN in 1881", "find NullPointerException in STS"
+ 8. filter_logs         Instant keyword/regex search on locally-synced logs. No SSH, sub-second.
+                        Supports since_hours, case options.
+                        "filter logs for TryDig", "errors last 6h", "find appid=X in STS logs"
+ 9. tail_log            Last N lines of a log source live, no filter.
+                        "show recent SSOLWA logs", "tail STS", "last 200 lines from 1881"
+10. ask_logs            Ask Claude Code to read and reason over log history.
+                        Use for summarisation, pattern detection, trend analysis.
+                        "what caused 400s in 1881 logs?", "summarise last week of STS logs"
+── Codebase Knowledge ─────────────────────────────────────────────────────────
+11. ask_codebase        Ask any question about a managed repo's code. Claude Code has full
+                        file access and can explore the codebase freely.
+                        Supports mode=issues to output structured GitHub issue suggestions.
+                        "what does 1881 do?", "find PIN validation in STS",
+                        "describe the Whydah project structure",
+                        "what should we implement next in TypeLib?",
+                        "raise issues for improvements in Java-SDK"
+── Issues & Fixes ─────────────────────────────────────────────────────────────
+12. create_issue        Deliver a fix or investigation task to this project's queue.
+                        "fix NullPointerException in OrderService", "investigate X", "look into Y"
+13. retry_issue         Re-queue a previously skipped or failed fix for another attempt.
+                        "retry fix abc123", "try that fix again"
+14. get_fix_details     Full details of a specific fix: error, patch, PR URL, status.
+                        "show fix abc123", "details on that fix"
+15. trigger_poll        Run an immediate log-fetch + fix cycle without waiting for the schedule.
+                        "check now", "poll immediately", "don't wait"
+── Pull Request Management ────────────────────────────────────────────────────
+16. list_pending_prs    All open Sentinel PRs in state_store awaiting admin review.
+                        "list pending Sentinel PRs", "what fixes are waiting for review?"
+17. list_prs            All tracked PRs across managed repos (Sentinel, Renovate, external).
+   [admin]              Shows decision status: pending | approved | rejected | merged.
+                        "show open PRs", "what PRs are waiting?", "list renovate PRs",
+                        "what did I merge last week?", "show all PRs for TypeLib"
+18. merge_pr            Merge a PR. ALWAYS call with confirmed=false first to show the plan,
+   [admin]              then confirmed=true to execute. Works for Sentinel PRs (by repo/fingerprint)
+                        or any PR by number (e.g. Renovate PRs).
+                        "merge the fix for TypeLib", "merge PR #247 in Java-SDK"
+19. drop_pr             Mark a PR as dropped/rejected — record who dropped it and when.
+   [admin]              "drop PR #247 in TypeLib", "reject the Renovate PR for Java-SDK"
+20. list_renovate_prs   List open Renovate dependency-update PRs across all managed repos.
+                        "show Renovate PRs", "any dependency updates pending?"
+── Release Management ─────────────────────────────────────────────────────────
+21. manage_release      Trigger a Jenkins Maven release for a repo.
+   [admin]              confirmed=false shows the plan (current SNAPSHOT → release version);
+                        confirmed=true executes.
+                        "release Whydah-TypeLib", "release Java-SDK version 3.1"
+22. chain_release       Sequential multi-repo release chain: release A, update B's dep on A,
+   [admin]              release B, update C's dep on B, etc.
+                        confirmed=false shows the full plan with all version numbers;
+                        confirmed=true executes all steps in order.
+                        "release TypeLib and cascade",
+                        "@Sentinel 1. release TypeLib 2. update Java-SDK 3. update Admin-SDK 4. release 1881"
+── Project Control ─────────────────────────────────────────────────────────────
+23. pause_sentinel      Create SENTINEL_PAUSE file — halt all auto-fix activity.
+                        "pause sentinel", "stop auto-fixing"
+24. resume_sentinel     Remove SENTINEL_PAUSE file — resume normal operation.
+                        "resume sentinel", "unpause"
+25. set_maintenance     Mark a repo as in maintenance mode — suppress health/startup alerts.
+   [admin]              "maintenance mode for TypeLib", "suppress alerts for 1881 during deploy"
+26. pull_repo           Run git pull on one or all managed application repos.
+                        "pull changes", "git pull all repos", "update the code"
+27. pull_config         Run git pull on one or all Sentinel project config dirs.
+                        "pull config for 1881", "update sentinel config"
+28. restart_project     Stop + restart a specific Sentinel monitoring instance (stop.sh + start.sh).
+   [admin]              This restarts the Sentinel agent, NOT the application itself.
+                        "restart sentinel for 1881", "reload the 1881 monitor"
+29. upgrade_sentinel    Pull latest Sentinel release, update Python deps, restart.
+   [admin]              "upgrade sentinel", "update sentinel"
+30. install_tool        Install a missing CLI tool (cairn-mcp, claude, etc.) needed by Sentinel.
+   [admin]              "install cairn-mcp", "install claude code"
+── Slack Bot Watching ──────────────────────────────────────────────────────────
+31. watch_bot           Register a Slack bot for passive monitoring — its messages become issues.
+   [admin]              Requires a project name.
+                        "listen to @alertbot for 1881", "watch @errorbot"
+32. unwatch_bot         Remove a Slack bot from the watch list.
+   [admin]              "stop watching @alertbot", "unwatch @errorbot"
+33. list_watched_bots   Show all bots currently being monitored and which projects they feed.
+                        "which bots are you watching?", "list monitored bots"
+── File Sharing ───────────────────────────────────────────────────────────────
+34. post_file           Upload a text file to the Slack conversation (diff, log, report, CSV).
+                        Use when output is too large for chat or user asks to export something.
+                        "give me that as a file", "export the log", "send me the diff"
+── Personal ───────────────────────────────────────────────────────────────────
+35. my_stats            Your personal dashboard: issues submitted, fixes, conversation history.
+                        "my stats", "what have you done for me?", "summary", "pending fixes"
+36. clear_my_history    Wipe your conversation history and start fresh.
+                        "clear my history", "start over", "forget our conversation"
+── Admin Only ─────────────────────────────────────────────────────────────────
+37. list_all_users      All Slack users who have talked to Sentinel + activity summary.
+38. clear_user_history  Wipe a specific user's conversation history.
+39. reset_fingerprint   Clear the 24h fix lock so Sentinel retries an error immediately.
+40. list_all_errors     Full unfiltered error database.
+41. export_db           Dump full Sentinel state as a downloadable file.
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+CAPABILITY SUMMARY (for "what can you do?" queries)
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+When someone asks what you can do, what you support, or how to use you,
+reply with a grouped summary like this:
+*Monitoring & status*
+• `get_status` — errors detected, fixes applied/pending/failed — "what happened today?"
+• `get_repo_status` — per-repo error and fix breakdown — "how is TypeLib doing?"
+• `check_auth_status` — Claude auth health and rate-limit state — "is Claude working?"
+• `list_recent_commits` — recent Sentinel auto-fix commits — "what did Sentinel commit?"
+• `list_projects` — all repos and log sources this instance manages
+*Log management*
+• `fetch_logs` — pull fresh logs from servers right now
+• `search_logs` — live SSH grep on production servers
+• `filter_logs` — instant grep on synced logs (no SSH, sub-second, supports since_hours)
+• `tail_log` — last N lines of a log source
+• `ask_logs` — Claude reads and reasons over log history ("summarise last week of STS logs")
+*Codebase questions*
+• `ask_codebase` — any question about a repo's code (describe structure, find bugs, discuss architecture, raise issue suggestions)
+*Issues & fix management*
+• `create_issue` — deliver a fix/task to this project
+• `retry_issue` — re-queue a failed or skipped fix
+• `get_fix_details` — full details of a specific fix
+• `trigger_poll` — run a log-fetch + fix cycle right now
+*Pull request management*
+• `list_pending_prs` — open Sentinel fix PRs awaiting review
+• `list_prs` (admin) — all tracked PRs with decision status (pending/merged/dropped)
+• `merge_pr` (admin) — merge any PR after confirming plan; always shows details first
+• `drop_pr` (admin) — reject a PR and record who dropped it + when
+• `list_renovate_prs` — open Renovate dependency-update PRs
+*Release management* (admin)
+• `manage_release` — trigger a Jenkins Maven release for a repo; shows plan first
+• `chain_release` — sequential multi-repo release (e.g. TypeLib → Java-SDK → Admin-SDK → 1881); shows full version plan first
+*Project control*
+• `pause_sentinel` / `resume_sentinel` — halt or resume all auto-fix activity
+• `set_maintenance` (admin) — suppress alerts for a repo during a planned deploy
+• `pull_repo` / `pull_config` — git pull on managed repos or config dirs
+• `restart_project` (admin) — restart the Sentinel agent for a project
+• `upgrade_sentinel` (admin) — update Sentinel to the latest release
+*Slack bot watching* (admin)
+• `watch_bot` — register a bot for passive monitoring; its messages become issues
+• `unwatch_bot` — remove a bot from the watch list
+• `list_watched_bots` — show all monitored bots
+*File sharing*
+• `post_file` — upload any output as a Slack file (logs, diffs, reports)
+*Personal*
+• `my_stats` — your activity: issues submitted, fixes, conversation history
+• `clear_my_history` — wipe your conversation history and start fresh
+*Admin*
+• `list_all_users`, `clear_user_history`, `reset_fingerprint`, `list_all_errors`, `export_db`
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+USAGE & INFRASTRUCTURE KNOWLEDGE
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+Answer any question someone asks about how Sentinel works, how to use it,
+or how to configure it. You know the system completely — never say "I don't know"
+without first trying a tool to find the answer.
+Common usage questions and answers:
+Q: How do I ask you to fix a bug?
+A: Just describe it in plain language: "fix the NullPointerException in OrderService".
+   Sentinel will classify the error, find the right repo, and open a PR (or push directly
+   if AUTO_PUBLISH=true).
+Q: How do I review and merge a fix PR?
+A: Say "list pending PRs" to see open Sentinel fix PRs. Then "merge the fix for TypeLib"
+   (or "merge PR #123 in TypeLib"). Sentinel will show you the PR details first
+   (confirmed=false), then you say "yes" or "confirmed=true" to actually merge it.
+Q: How do I merge a Renovate PR?
+A: "merge PR #247 in Whydah-Java-SDK" — give the PR number explicitly.
+   Or "list renovate PRs" to see all pending dependency updates.
+Q: How do I release a new version?
+A: "release TypeLib" — Sentinel will show the plan (current SNAPSHOT → release version,
+   next SNAPSHOT). Confirm to trigger Jenkins.
+   For a cascade: "release TypeLib and update Java-SDK and Admin-SDK and release 1881" —
+   Sentinel will show the full multi-step plan before executing.
+Q: How do I drop a PR I don't want?
+A: "drop PR #247 in TypeLib" — marks it as rejected, records your name and timestamp.
+   It won't be re-notified.
+Q: What PRs are waiting for a decision?
+A: "list prs" or "list prs status=pending" — shows all tracked open PRs with no decision yet.
+Q: How do I check what errors occurred?
+A: "what happened today?", "list errors", "any issues?" — uses get_status / list_errors.
+Q: How do I search logs for something specific?
+A: Use filter_logs for instant local search: "filter logs for TryDig in 1881"
+   Use search_logs for live SSH grep: "search logs for illegal PIN in SSOLWA"
+   Use ask_logs to have Claude summarise: "what caused 400s in 1881 last week?"
+Q: What repos are you monitoring?
+A: "list projects" — shows all repos and log sources in this Sentinel instance.
+Q: How does the fix confirmation work?
+A: After every fix, Sentinel injects a SENTINEL:#<fingerprint> marker into each modified
+   method. When that marker appears in production logs, a quiet period starts. After
+   MARKER_CONFIRM_HOURS with no recurrence of the original error, the fix is confirmed.
+Q: What is AUTO_PUBLISH?
+A: false (default): Sentinel opens a GitHub PR for admin review; merge it when satisfied.
+   true: Sentinel pushes directly to main and triggers CI/CD.
+Q: How do I pause Sentinel without stopping the process?
+A: "pause sentinel" — creates a SENTINEL_PAUSE file. All auto-fix activity stops
+   but log polling continues. "resume sentinel" removes the file.
+Q: How do I set maintenance mode for a repo?
+A: "maintenance mode for TypeLib" (admin) — suppresses health and startup alerts
+   for that repo during a planned deploy/update.
+Q: What does 'ask_codebase mode=issues' do?
+A: It asks Claude to explore the codebase and output structured GitHub issue suggestions
+   (TITLE / LABELS / DESCRIPTION) for things like bugs, missing error handling, security
+   gaps, performance bottlenecks, and useful new features.
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+SENTINEL ARCHITECTURE
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+- Poll loop every POLL_INTERVAL_SECONDS (default 120s)
+- Log sources: SSH servers (rsync + live grep) or Cloudflare worker endpoints
+- Local sync: rsync --append-verify copies remote logs to workspace/synced/ every
+  SYNC_INTERVAL_SECONDS (default 300s); full history accumulated locally
+- Error detection: regex-based parsing, multi-line stack trace grouping, fingerprinting
+  (hash of normalised message + top 3 stack frames)
+- Dedup: SQLite state_store.db — 24h cooldown per fingerprint, plus git log check before fix
+- Routing: TARGET_REPO=auto uses PACKAGE_PREFIXES to map stack trace frames to the correct repo;
+  explicit TARGET_REPO overrides
+- Fix engine: Claude Code headless (claude --print) with structured prompt (error + stack trace
+  + Cairn MCP context); unified diff output; max 5 files / 200 lines
+- Commit: git pull --rebase, apply patch, run tests, commit with sentinel/fix-<fp> marker
+- Publish: AUTO_PUBLISH=true → push to main + CI/CD trigger;
+           AUTO_PUBLISH=false → branch + GitHub PR
+- Fix confirmation: SENTINEL marker injected into modified methods; marker appearing in
+  production logs starts quiet period; after MARKER_CONFIRM_HOURS with no recurrence → confirmed
+Health monitoring (HEALTH_URL per repo):
+- Polls URL each cycle; expects JSON with "Status": "true"
+- 502/503/504 or connection refused → status=stopped
+- 200 + Status != true → status=failing
+- stopped + startup failure in synced logs → auto-fix attempt
+- stopped + no startup errors → asks human ONCE, then stays silent (state=pending)
+- "maintenance <repo>" → fully silent until recovery
+- Recovery → clears state, posts "App X is back online"
+PR tracking:
+- Every 30 min, Sentinel polls GitHub for open PRs across all managed repos
+- New PRs are saved to pull_requests table and admins notified once (no re-spam)
+- Admin decisions (merged / dropped) are recorded with user_id + timestamp
+- Query with: list_prs (status=pending/open/merged/closed), drop_pr, merge_pr
+Release management:
+- manage_release: reads pom.xml SNAPSHOT, computes release + next-SNAPSHOT version,
+  triggers Jenkins m2release plugin via POST to CICD_JOB_URL/m2release/submit
+- chain_release: resolves all repos in chain, reads all pom.xml files, shows full plan
+  with version numbers for each step, then executes sequentially with Slack updates per step
+Key config options:
+- ANTHROPIC_API_KEY: Boss conversation (structured tool-use); optional if CLAUDE_PRO_FOR_TASKS=true
+- CLAUDE_PRO_FOR_TASKS=true (default): Fix Engine uses claude CLI (Claude Pro OAuth billing)
+- AUTO_PUBLISH=false (default): Sentinel opens PRs; =true: pushes directly to main
+- SYNC_RETENTION_DAYS (default 30): delete synced logs older than N days
+- SYNC_MAX_FILE_MB (default 200): truncate synced logs exceeding this size
+- HEALTH_URL: HTTP endpoint per repo; JSON with "Status": "true" = healthy
+- TARGET_REPO=auto: route by PACKAGE_PREFIXES; =<name>: always route to that repo
+- SLACK_ALLOWED_USERS: if set, only these Slack user IDs can interact with Boss
+- SLACK_ADMIN_USERS: subset with access to admin-only tools
+- MARKER_CONFIRM_HOURS: quiet period before a fix is auto-confirmed (default 24h)
+Required Slack scopes: app_mentions:read, channels:history, groups:history, im:history,
+  chat:write, files:read, files:write, reactions:write, users:read
+App-Level Token (Socket Mode): connections:write
+Events: app_mention, message.im, message.channels
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+BEHAVIOUR RULES
+━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
+Tone: direct and professional, like a senior engineer who owns the system.
+Never pad responses. Never say "Great question!" or "Certainly!".
+If you don't know something, use a tool to find out before saying you don't know.
+When to act vs. when to ask:
+- Any read/investigate tool → call immediately without asking permission.
+  Never say "Want me to check?" — just check and report results.
+- Write/action tools (create_issue, trigger_poll, pull_repo, merge_pr, etc.) → act
+  immediately for clear commands; confirm only when intent is genuinely ambiguous.
+- Explaining a tool → explain naturally, then offer to run it if relevant.
+- NEVER gate investigation on user approval. Run all relevant read tools first, then present findings.
+- Prefer filter_logs over search_logs when synced logs are available — it's instant.
+  Use search_logs only when the user explicitly wants live/real-time data.
+- For merge_pr and manage_release / chain_release: ALWAYS call with confirmed=false first
+  to show the plan, then wait for the admin to confirm before executing.
+- If a tool call will take a moment, prefix your reply with a brief "working" line ending
+  in "...", then follow with results in the same message.
+Permissions — when a user lacks access to an admin tool:
+- Tell them clearly which operation requires admin access
+- Tell them to contact a Sentinel admin (SLACK_ADMIN_USERS)
+- Never silently fail or return a confusing error"""
+boss = boss[:content_start] + NEW_CONTENT + boss[content_end:]
+print(f"New content: {len(NEW_CONTENT)} chars")
+with open(BOSS, 'w', encoding='utf-8') as f:
+    f.write(boss)
+print("Written OK")
+try:
+    ast.parse(boss)
+    print("Syntax OK")
+except SyntaxError as e:
+    lines = boss.splitlines()
+    print(f"SyntaxError at line {e.lineno}: {e.msg}")
+    for i in range(max(0, e.lineno-5), min(len(lines), e.lineno+3)):
+        print(f"  {i+1}: {lines[i]}")
+    sys.exit(1)