npm - @a5c-ai/babysitter-github - Versions diffs - 5.0.1-staging.e4c68b9b → 5.0.1-staging.e920fef118ef - Mend

@a5c-ai/babysitter-github 5.0.1-staging.e4c68b9b → 5.0.1-staging.e920fef118ef

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

package/README.md +33 -25
package/bin/install-shared.js +28 -17
package/bin/install.js +9 -0
package/bin/uninstall.js +25 -4
package/commands/call.md +5 -1
package/commands/cleanup.md +30 -8
package/commands/doctor.md +2 -3
package/commands/help.md +2 -1
package/commands/observe.md +6 -1
package/commands/yolo.md +11 -7
package/hooks/babysitter-proxied-post-tool-use.ps1 +12 -0
package/hooks/babysitter-proxied-post-tool-use.sh +3 -0
package/hooks/babysitter-proxied-pre-compact.ps1 +12 -0
package/hooks/babysitter-proxied-pre-compact.sh +3 -0
package/hooks/babysitter-proxied-pre-tool-use.ps1 +12 -0
package/hooks/babysitter-proxied-pre-tool-use.sh +3 -0
package/hooks/babysitter-proxied-session-end.sh +0 -0
package/hooks/babysitter-proxied-session-start.sh +0 -0
package/hooks/babysitter-proxied-user-prompt-submitted.sh +0 -0
package/hooks.json +24 -0
package/package.json +12 -11
package/plugin.json +1 -1
package/scripts/create-release-tag.mjs +18 -0
package/scripts/publish-from-tag.mjs +41 -0
package/skills/babysit/SKILL.md +2 -4
package/skills/call/SKILL.md +5 -1
package/skills/cleanup/SKILL.md +30 -8
package/skills/doctor/SKILL.md +2 -3
package/skills/help/SKILL.md +2 -1
package/skills/observe/SKILL.md +6 -1
package/skills/yolo/SKILL.md +5 -1
package/versions.json +2 -1
package/scripts/sync-command-surfaces.js +0 -62

package/README.md CHANGED Viewed

@@ -18,7 +18,8 @@ directly.
 - **Node.js 22+**
 - **GitHub Copilot CLI** (`copilot`) -- requires an active GitHub Copilot
   subscription
-- **Babysitter SDK CLI** (`@a5c-ai/babysitter-sdk`) -- installed globally
+- **Babysitter CLI** (`@a5c-ai/babysitter`) -- installed globally when using
+  the SDK helper
 ## Installation
@@ -28,7 +29,7 @@ Register the a5c.ai marketplace and install the plugin:
 ```bash
 # Register the marketplace
-copilot plugin marketplace add a5c-ai/babysitter
+copilot plugin marketplace add a5c-ai/babysitter-claude
 # Install the plugin
 copilot plugin install babysitter
@@ -36,42 +37,50 @@ copilot plugin install babysitter
 ### Direct GitHub install
-Install directly from the Git repository using Copilot CLI. Copilot CLI
-discovers the plugin via `.github/plugin/marketplace.json` at the repo root:
+Install directly from the generated external plugin repository:
 ```bash
-copilot plugin install a5c-ai/babysitter
+copilot plugin install a5c-ai/babysitter-github-copilot
 ```
-### Alternative Installation (npm / development)
+### Alternative Installation (SDK helper / development)
-For development or environments where the Copilot CLI plugin system is not
-available, install via npm:
+For development, automation, or environments where the Copilot CLI plugin system is not available, install through the Babysitter SDK helper. This is the canonical scriptable path used by the installer tests and resolves to `npx --yes @a5c-ai/babysitter-github install ...` under the hood:
-Install the SDK CLI first:
+Install the Babysitter CLI first:
 ```bash
-npm install -g @a5c-ai/babysitter-sdk
+npm install -g @a5c-ai/babysitter
 ```
-Then install the GitHub Copilot plugin globally:
+Then install the GitHub Copilot plugin globally or into a workspace:
 ```bash
-npm install -g @a5c-ai/babysitter-github
-babysitter-github install
+# Global install
+babysitter harness:install-plugin github-copilot
+# Workspace install
+babysitter harness:install-plugin github-copilot --workspace /path/to/repo
 ```
-Or install from source:
+You can also run the published package installer directly:
 ```bash
-cd plugins/babysitter-github
-node bin/install.js
+npx --yes @a5c-ai/babysitter-github install --global
+npx --yes @a5c-ai/babysitter-github install --workspace /path/to/repo
+```
+Or install from generated source:
+```bash
+npm run generate:plugins
+node artifacts/generated-plugins/github-copilot/bin/install.js
 ```
-Install into a specific workspace:
+Install into a specific workspace from generated source:
 ```bash
-babysitter-github install --workspace /path/to/repo
+node artifacts/generated-plugins/github-copilot/bin/install.js --workspace /path/to/repo
 ```
 ### GitHub Copilot cloud agent installation
@@ -253,8 +262,7 @@ Copilot CLI looks for the plugin manifest in these paths, checked in order:
 The first match wins. This plugin uses `plugin.json` at the package root.
 For marketplace discovery, Copilot CLI looks for `.github/plugin/marketplace.json`
-at the repository root. This file lists all available plugins in the repo and is
-used when installing via `copilot plugin install OWNER/REPO`.
+at the repository root of the generated plugin repository.
 ### plugin.json Schema
@@ -404,7 +412,7 @@ repository root in `.github/plugin/marketplace.json`:
       "name": "babysitter",
       "description": "Multi-step workflow orchestration with event-sourced state",
       "version": "0.1.0",
-      "source": "./plugins/babysitter-github"
+      "source": "./"
     }
   ]
 }
@@ -461,7 +469,7 @@ These registries are available without running `marketplace add`.
 ## Plugin Structure (Directory Layout)
 ```
-plugins/babysitter-github/
+artifacts/generated-plugins/github-copilot/
   plugin.json              # Plugin manifest (skills, hooks, metadata)
   .github/plugin.json      # Plugin manifest (alternate discovery path)
   hooks.json               # Hook configuration (sessionStart, sessionEnd, userPromptSubmitted)
@@ -579,14 +587,14 @@ compatibility where PowerShell execution is available.
 git clone https://github.com/a5c-ai/babysitter.git
 cd babysitter
 npm install
-cd plugins/babysitter-github
+npm run generate:plugins
 node bin/install.js
 ```
 ### Publishing
 ```bash
-cd plugins/babysitter-github
+cd artifacts/generated-plugins/github-copilot
 npm run deploy            # Publish to npm (public)
 npm run deploy:staging    # Publish to npm with staging tag
 ```
@@ -594,7 +602,7 @@ npm run deploy:staging    # Publish to npm with staging tag
 ### Team installation
 ```bash
-cd plugins/babysitter-github
+cd artifacts/generated-plugins/github-copilot
 npm run team:install
 ```

package/bin/install-shared.js CHANGED Viewed

@@ -13,7 +13,7 @@ function getUserHome() {
 }
 function getHarnessHome() {
-  return path.join(os.homedir(), '.copilot');
+  return path.join(os.homedir(), ".copilot");
 }
 function getHomePluginRoot(scope) {
@@ -104,7 +104,7 @@ function ensureMarketplaceEntry(marketplacePath, pluginRoot) {
     name: PLUGIN_NAME,
     source: relSource,
     description: "Orchestrate complex, multi-step workflows with event-sourced state management, hook-based extensibility, and human-in-the-loop approval",
-    version: "5.0.0",
+    version: "5.0.1-staging.e920fef118ef",
     author: { name: "a5c.ai" },
   };
   if (idx >= 0) marketplace.plugins[idx] = entry;
@@ -454,8 +454,9 @@ function installManagedHooks(packageRoot, copilotHome) {
   mergeManagedHooksConfig(packageRoot, copilotHome);
 }
-function removeLegacyHooks(copilotHome) {
-  for (const hookName of LEGACY_HOOK_SCRIPT_NAMES) {
+function removeManagedHooks(copilotHome) {
+  const managedHookNames = [...LEGACY_HOOK_SCRIPT_NAMES, ...HOOK_SCRIPT_NAMES];
+  for (const hookName of managedHookNames) {
     fs.rmSync(path.join(copilotHome, 'hooks', hookName), { force: true });
   }
@@ -476,10 +477,17 @@ function removeLegacyHooks(copilotHome) {
     const eventHooks = Array.isArray(hooksConfig.hooks[eventName]) ? hooksConfig.hooks[eventName] : [];
     const filteredMatchers = eventHooks
       .map((matcher) => {
+        const directBash = String(matcher?.bash || matcher?.command || '');
+        const directPs = String(matcher?.powershell || '');
+        const hasDirectHook = directBash.length > 0 || directPs.length > 0;
+        const directIsManaged = managedHookNames.some((name) => directBash.includes(name) || directPs.includes(name));
+        if (hasDirectHook) {
+          return directIsManaged ? null : matcher;
+        }
         const hooks = Array.isArray(matcher.hooks) ? matcher.hooks : [];
         const keptHooks = hooks.filter((hook) => {
           const command = String(hook.command || '');
-          return !LEGACY_HOOK_SCRIPT_NAMES.some((name) => command.includes(name));
+          return !managedHookNames.some((name) => command.includes(name));
         });
         return keptHooks.length > 0 ? { ...matcher, hooks: keptHooks } : null;
       })
@@ -498,11 +506,13 @@ function removeLegacyHooks(copilotHome) {
 }
 function installCopilotSurface(packageRoot, copilotHome) {
-  removeLegacyHooks(copilotHome);
+  removeManagedHooks(copilotHome);
   installManagedSkills(packageRoot, copilotHome);
   installManagedHooks(packageRoot, copilotHome);
 }
+const removeLegacyHooks = removeManagedHooks;
 function renderCloudAgentAgentsBlock() {
   return [
     '## Babysitter Cloud Agent',
@@ -831,10 +841,19 @@ module.exports = {
   resolveCliCommand,
   runCli,
   ensureGlobalProcessLibrary,
+  PLUGIN_BUNDLE_ENTRIES,
+  copyRecursive,
+  copyPluginBundle,
+  DEFAULT_MARKETPLACE,
+  normalizeMarketplaceSourcePath,
+  ensureMarketplaceEntry,
+  removeMarketplaceEntry,
+  installManagedSkills,
+  mergeManagedHooksConfig,
+  installManagedHooks,
+  warnWindowsHooks,
   LEGACY_HOOK_SCRIPT_NAMES,
   HOOK_SCRIPT_NAMES,
-  DEFAULT_MARKETPLACE,
-  PLUGIN_BUNDLE_ENTRIES,
   CLOUD_AGENT_BUNDLE_ENTRIES,
   MANAGED_BLOCK_START,
   MANAGED_BLOCK_END,
@@ -849,10 +868,8 @@ module.exports = {
   rewriteCloudSkill,
   registerCopilotPlugin,
   deregisterCopilotPlugin,
-  installManagedSkills,
-  mergeManagedHooksConfig,
-  installManagedHooks,
   removeLegacyHooks,
+  removeManagedHooks,
   installCopilotSurface,
   renderCloudAgentAgentsBlock,
   renderCloudAgentCopilotInstructionsBlock,
@@ -862,12 +879,6 @@ module.exports = {
   installCloudAgentInstructions,
   installCloudAgentSetupSteps,
   installCloudAgentSurface,
-  normalizeMarketplaceSourcePath,
-  ensureMarketplaceEntry,
-  removeMarketplaceEntry,
-  warnWindowsHooks,
-  copyPluginBundle,
-  copyRecursive,
   harnessCliRoute,
   harnessInstall,
 };

package/bin/install.js CHANGED Viewed

@@ -65,6 +65,15 @@ function main() {
   try {
     shared.copyPluginBundle(PACKAGE_ROOT, pluginRoot);
     shared.ensureMarketplaceEntry(marketplacePath, pluginRoot);
+    if (typeof shared.registerCopilotPlugin === 'function') {
+      shared.registerCopilotPlugin(pluginRoot);
+    }
+    if (typeof shared.installCopilotSurface === 'function' && typeof shared.getCopilotHome === 'function') {
+      shared.installCopilotSurface(PACKAGE_ROOT, shared.getCopilotHome());
+    }
+    if (typeof shared.warnWindowsHooks === 'function') {
+      shared.warnWindowsHooks();
+    }
     if (typeof shared.harnessInstall === 'function') {
       shared.harnessInstall(PACKAGE_ROOT, pluginRoot);
     }

package/bin/uninstall.js CHANGED Viewed

@@ -7,17 +7,38 @@ const shared = require('./install-shared');
 function main() {
   const pluginRoot = shared.getHomePluginRoot();
+  const marketplacePath = typeof shared.getHomeMarketplacePath === 'function'
+    ? shared.getHomeMarketplacePath()
+    : null;
+  const copilotHome = typeof shared.getCopilotHome === 'function'
+    ? shared.getCopilotHome()
+    : null;
   if (!fs.existsSync(pluginRoot)) {
     console.log(`[${shared.PLUGIN_NAME}] Plugin not installed at ${pluginRoot}`);
-    return;
+  } else {
+    try {
+      fs.rmSync(pluginRoot, { recursive: true, force: true });
+      console.log(`[${shared.PLUGIN_NAME}] Uninstalled from ${pluginRoot}`);
+    } catch (err) {
+      console.error(`[${shared.PLUGIN_NAME}] Failed to uninstall: ${err.message}`);
+      process.exitCode = 1;
+      return;
+    }
   }
   try {
-    fs.rmSync(pluginRoot, { recursive: true, force: true });
-    console.log(`[${shared.PLUGIN_NAME}] Uninstalled from ${pluginRoot}`);
+    if (typeof shared.deregisterCopilotPlugin === 'function') {
+      shared.deregisterCopilotPlugin(pluginRoot);
+    }
+    if (copilotHome && typeof shared.removeManagedHooks === 'function') {
+      shared.removeManagedHooks(copilotHome);
+    }
+    if (marketplacePath && typeof shared.removeMarketplaceEntry === 'function') {
+      shared.removeMarketplaceEntry(marketplacePath);
+    }
   } catch (err) {
-    console.error(`[${shared.PLUGIN_NAME}] Failed to uninstall: ${err.message}`);
+    console.error(`[${shared.PLUGIN_NAME}] Failed to clean up uninstall state: ${err.message}`);
     process.exitCode = 1;
   }
 }

package/commands/call.md CHANGED Viewed

@@ -4,4 +4,8 @@ argument-hint: Specific instructions for the run.
 allowed-tools: Read, Grep, Write, Task, Bash, Edit, Grep, Glob, WebFetch, WebSearch, Search, AskUserQuestion, TodoWrite, TodoRead, Skill, BashOutput, KillShell, MultiEdit, LS
 ---
-Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md).
+Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md). Then continue executing the returned instructions in this same turn. Do not stop after the Skill tool returns; carry the requested run through to completion proof.
+User arguments for this command:
+$ARGUMENTS

package/commands/cleanup.md CHANGED Viewed

@@ -10,11 +10,33 @@ Create and run a cleanup process using the process at `skills\babysit\process\cr
 Implementation notes (for the process):
 - Parse arguments for `--dry-run` flag (if present, set dryRun: true in inputs) and `--keep-days N` (default: 7)
-- The process scans .a5c/runs/ for completed/failed runs, aggregates insights, writes summaries, then removes old data
-- Always show the user what will be removed before removing (in interactive mode via breakpoints)
-- In non-interactive mode (yolo), proceed with cleanup using defaults
-- The insights file goes to docs/run-history-insights.md
-- Only remove terminal runs (completed/failed) older than the keep-days threshold
-- Never remove active/in-progress runs
-- Remove orphaned process files not referenced by remaining runs
-- After cleanup, show remaining run count and disk usage
+CRITICAL: The cleanup MUST follow this exact phase order. Do NOT delete any run before Phase 2 completes.
+Phase 1 — Scan:
+- Scan .a5c/runs/ for all runs
+- Classify each as terminal (completed/failed) or active (in-progress/created)
+- Identify terminal runs older than the keep-days threshold as removal candidates
+- Never mark active/in-progress runs for removal
+- Count and report: total runs, terminal, active, removal candidates, disk usage
+Phase 2 — Aggregate insights (BEFORE any deletion):
+- For EVERY removal candidate, read its run.json and journal/ events
+- Extract: processId, prompt, status, event count, created date, task summaries
+- Group by process type and extract patterns (retry counts, convergence behavior, failure modes)
+- Append a new dated section to docs/run-history-insights.md with:
+  - Summary statistics (runs removed, disk freed, runs retained)
+  - Run categories with counts and descriptions
+  - Key patterns observed (multi-batch convergence, retry behavior, etc.)
+  - What worked well / what didn't from the run data
+- This file MUST be written and verified before proceeding to Phase 3
+Phase 3 — Confirm removal:
+- In interactive mode, show the user what will be removed via a breakpoint
+- In non-interactive mode (yolo), proceed with defaults
+- In dry-run mode, stop here and show what would be removed
+Phase 4 — Remove:
+- Delete the terminal runs older than keep-days threshold
+- Identify and remove orphaned process files not referenced by remaining runs
+- Show remaining run count and disk usage after cleanup

package/commands/doctor.md CHANGED Viewed

@@ -156,7 +156,6 @@ If it exists:
 **Goal:** Inspect babysitter session files for health and detect runaway loops.
 - Search for session state files using Glob:
-  - `plugins/babysitter/skills/babysit/state/*.md`
   - `.a5c/state/*.md`
   - `.a5c/state/*.json`
 - For each session state file found:
@@ -260,7 +259,7 @@ Mark as PASS if total size < 500MB and no files > 10MB. Mark as WARN if total si
 ### 10a. Hook Registration
-- Locate the plugin root. Check for `CLAUDE_PLUGIN_ROOT` env var, or search for `plugins/babysitter/hooks/hooks.json` by walking up from the current directory.
+- Locate the plugin root. Check for `CLAUDE_PLUGIN_ROOT` env var first, or search for a babysitter `hooks.json` by walking up from the current directory.
 - If found, read `hooks.json` and verify:
   - A `Stop` hook entry exists with a command referencing `babysitter-stop-hook.sh`.
   - A `SessionStart` hook entry exists with a command referencing `babysitter-session-start-hook.sh`.
@@ -315,7 +314,7 @@ If the stop hook shows NO evidence of execution (no log entries, no journal even
 Perform these diagnostic steps in order and report the first failure found:
-1. **Plugin not installed**: Check if `plugins/babysitter/` exists relative to the project root and if `CLAUDE_PLUGIN_ROOT` is set. If the plugin directory doesn't exist, report: "Plugin not installed — the babysitter plugin directory is missing."
+1. **Plugin not installed**: Check if `CLAUDE_PLUGIN_ROOT` is set or if a babysitter plugin directory exists relative to the project root. If neither exists, report: "Plugin not installed — the babysitter plugin directory is missing."
 2. **Plugin not enabled**: Check for Claude settings files:
    - `~/.claude/settings.json` — look for `babysitter` in `enabledPlugins`.

package/commands/help.md CHANGED Viewed

@@ -233,7 +233,8 @@ SECONDARY COMMANDS
   How it works: Runs npx @a5c-ai/babysitter-observer-dashboard@latest which watches
   the .a5c/runs/ directory (or a parent directory containing multiple projects) and
   serves a live dashboard. The process is blocking -- it runs until you stop it, and
-  it prints the local URL to share with the user.
+  it prints the local URL to share with the user. Do not use `babysitter observe`
+  as a fallback; the core Babysitter CLI does not expose that subcommand.
   Example: /babysitter:observe
   (opens browser showing all runs with live-updating task

package/commands/observe.md CHANGED Viewed

@@ -7,6 +7,11 @@ allowed-tools: Read, Grep, Write, Task, Bash
 Run the babysitter observer dashboard:
 1. Determine the watch directory — this is usually the project's container directory (the parent of the project dir), or the current working directory if not specified.
-2. Launch the dashboard: `npx -y @a5c-ai/babysitter-observer-dashboard@latest --watch-dir <dir>`
+2. Launch the standalone dashboard package: `npx -y @a5c-ai/babysitter-observer-dashboard@latest --watch-dir <dir>`.
 3. This is a blocking process — it will keep running until stopped.
 4. Report the URL printed by the dashboard to the user, then open it in the browser.
+Do not fall back to `babysitter observe`; the core Babysitter CLI does not expose
+that subcommand. Some harness runtimes may provide a separate
+`babysitter-agent observe` surface, but this skill uses the verified standalone
+dashboard package.

package/commands/yolo.md CHANGED Viewed

@@ -1,7 +1,11 @@
----
-description: Orchestrate a babysitter run. use this command to start babysitting a complex workflow in a non-interactive mode, without any user interaction or breakpoints in the run.
-argument-hint: Specific instructions for the run.
-allowed-tools: Read, Grep, Write, Task, Bash, Edit, Grep, Glob, WebFetch, WebSearch, Search, AskUserQuestion, TodoWrite, TodoRead, Skill, BashOutput, KillShell, MultiEdit, LS
----
-Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md). but without any user interaction or breakpoints in the run.
+---
+description: Orchestrate a babysitter run. use this command to start babysitting a complex workflow in a non-interactive mode, without any user interaction or breakpoints in the run.
+argument-hint: Specific instructions for the run.
+allowed-tools: Read, Grep, Write, Task, Bash, Edit, Grep, Glob, WebFetch, WebSearch, Search, AskUserQuestion, TodoWrite, TodoRead, Skill, BashOutput, KillShell, MultiEdit, LS
+---
+Start the Babysitter run directly through the CLI, without any user interaction or breakpoints. Do not invoke the Skill tool and do not run an instructions-only command. In Claude Code, use Bash to run `babysitter-agent yolo --harness claude-code --workspace "$PWD" --prompt "<user arguments>" --json`; in Codex, run `babysitter-agent yolo --harness codex --workspace "$PWD" --prompt "<user arguments>" --json`; in other harnesses, use the same command with that harness id. Replace `<user arguments>` with the arguments shown below, wait for the command to finish, and treat the CLI completion proof as the result.
+User arguments for this command:
+$ARGUMENTS

package/hooks/babysitter-proxied-post-tool-use.ps1 ADDED Viewed

@@ -0,0 +1,12 @@
+# PowerShell hook wrapper — sets env vars and delegates to bash
+$env:HOOK_TYPE = 'post-tool-use'
+$env:ADAPTER_NAME = 'copilot'
+$env:PLUGIN_ROOT = Split-Path -Parent (Split-Path -Parent $PSScriptRoot)
+$input_data = [Console]::In.ReadToEnd()
+$result = $input_data | & bash "$PSScriptRoot/../$($MyInvocation.MyCommand.Name -replace '\.ps1$','.sh')" 2>$null
+if ($LASTEXITCODE -eq 0 -and $result) {
+  Write-Output $result
+} else {
+  Write-Output '{}'
+}

package/hooks/babysitter-proxied-post-tool-use.sh ADDED Viewed

@@ -0,0 +1,3 @@
+#!/bin/bash
+set -euo pipefail
+babysitter hook:run --harness unified --hook-type post-tool-use --json

package/hooks/babysitter-proxied-pre-compact.ps1 ADDED Viewed

@@ -0,0 +1,12 @@
+# PowerShell hook wrapper — sets env vars and delegates to bash
+$env:HOOK_TYPE = 'pre-compact'
+$env:ADAPTER_NAME = 'copilot'
+$env:PLUGIN_ROOT = Split-Path -Parent (Split-Path -Parent $PSScriptRoot)
+$input_data = [Console]::In.ReadToEnd()
+$result = $input_data | & bash "$PSScriptRoot/../$($MyInvocation.MyCommand.Name -replace '\.ps1$','.sh')" 2>$null
+if ($LASTEXITCODE -eq 0 -and $result) {
+  Write-Output $result
+} else {
+  Write-Output '{}'
+}

package/hooks/babysitter-proxied-pre-compact.sh ADDED Viewed

@@ -0,0 +1,3 @@
+#!/bin/bash
+set -euo pipefail
+babysitter hook:run --harness unified --hook-type pre-compact --json

package/hooks/babysitter-proxied-pre-tool-use.ps1 ADDED Viewed

@@ -0,0 +1,12 @@
+# PowerShell hook wrapper — sets env vars and delegates to bash
+$env:HOOK_TYPE = 'pre-tool-use'
+$env:ADAPTER_NAME = 'copilot'
+$env:PLUGIN_ROOT = Split-Path -Parent (Split-Path -Parent $PSScriptRoot)
+$input_data = [Console]::In.ReadToEnd()
+$result = $input_data | & bash "$PSScriptRoot/../$($MyInvocation.MyCommand.Name -replace '\.ps1$','.sh')" 2>$null
+if ($LASTEXITCODE -eq 0 -and $result) {
+  Write-Output $result
+} else {
+  Write-Output '{}'
+}

package/hooks/babysitter-proxied-pre-tool-use.sh ADDED Viewed

@@ -0,0 +1,3 @@
+#!/bin/bash
+set -euo pipefail
+babysitter hook:run --harness unified --hook-type pre-tool-use --json

package/hooks/babysitter-proxied-session-end.sh CHANGED Viewed

File without changes

package/hooks/babysitter-proxied-session-start.sh CHANGED Viewed

File without changes

package/hooks/babysitter-proxied-user-prompt-submitted.sh CHANGED Viewed

File without changes

package/hooks.json CHANGED Viewed

@@ -17,6 +17,30 @@
         "timeoutSec": 15
       }
     ],
+    "preToolUse": [
+      {
+        "type": "command",
+        "bash": "./hooks/babysitter-proxied-pre-tool-use.sh",
+        "powershell": "./hooks/babysitter-proxied-pre-tool-use.ps1",
+        "timeoutSec": 30
+      }
+    ],
+    "postToolUse": [
+      {
+        "type": "command",
+        "bash": "./hooks/babysitter-proxied-post-tool-use.sh",
+        "powershell": "./hooks/babysitter-proxied-post-tool-use.ps1",
+        "timeoutSec": 30
+      }
+    ],
+    "PreCompact": [
+      {
+        "type": "command",
+        "bash": "./hooks/babysitter-proxied-pre-compact.sh",
+        "powershell": "./hooks/babysitter-proxied-pre-compact.ps1",
+        "timeoutSec": 30
+      }
+    ],
     "sessionEnd": [
       {
         "type": "command",

package/package.json CHANGED Viewed

@@ -1,28 +1,26 @@
 {
   "name": "@a5c-ai/babysitter-github",
-  "version": "5.0.1-staging.e4c68b9b",
+  "version": "5.0.1-staging.e920fef118ef",
   "description": "Orchestrate complex, multi-step workflows with event-sourced state management, hook-based extensibility, and human-in-the-loop approval",
   "scripts": {
     "deploy": "npm publish --access public",
     "deploy:staging": "npm publish --access public --tag staging",
-    "postinstall": "node bin/install.js",
-    "preuninstall": "node bin/uninstall.js",
-    "team:install": "node scripts/team-install.js",
-    "test": "node scripts/sync-command-surfaces.js --check",
-    "sync:commands": "node scripts/sync-command-surfaces.js"
+    "plugin:install": "node bin/install.js --global",
+    "plugin:uninstall": "node bin/uninstall.js --global",
+    "team:install": "node scripts/team-install.js"
   },
   "bin": {
-    "babysitter-github-copilot": "bin/cli.js"
+    "babysitter-github": "bin/cli.js"
   },
   "files": [
     "bin/",
     "hooks.json",
+    "AGENTS.md",
     "hooks/",
     "skills/",
     "commands/",
     "scripts/",
     "plugin.json",
-    "AGENTS.md",
     "README.md",
     "versions.json",
     "package.json"
@@ -38,11 +36,14 @@
     "access": "public"
   },
   "dependencies": {
-    "@a5c-ai/babysitter-sdk": "5.0.1-staging.e4c68b9b"
+    "@a5c-ai/babysitter-sdk": "5.0.1-staging.e920fef118ef"
   },
   "repository": {
     "type": "git",
-    "url": "https://github.com/a5c-ai/babysitter"
+    "url": "git+https://github.com/a5c-ai/babysitter-github-copilot.git"
   },
-  "homepage": "https://github.com/a5c-ai/babysitter/tree/main/plugins/babysitter-github#readme"
+  "homepage": "https://github.com/a5c-ai/babysitter-github-copilot#readme",
+  "bugs": {
+    "url": "https://github.com/a5c-ai/babysitter-github-copilot/issues"
+  }
 }

package/plugin.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "babysitter",
-  "version": "5.0.1-staging.e4c68b9b",
+  "version": "5.0.1-staging.e920fef118ef",
   "description": "Orchestrate complex, multi-step workflows with event-sourced state management, hook-based extensibility, and human-in-the-loop approval",
   "author": {
     "name": "a5c.ai"

package/scripts/create-release-tag.mjs ADDED Viewed

@@ -0,0 +1,18 @@
+#!/usr/bin/env node
+import { spawnSync } from 'node:child_process';
+import { existsSync, readFileSync } from 'node:fs';
+function run(command, args) {
+  const result = spawnSync(command, args, { encoding: 'utf8', stdio: 'inherit' });
+  if (result.status !== 0) process.exit(result.status || 1);
+}
+const branch = process.env.GITHUB_REF_NAME || 'develop';
+const sha = (process.env.GITHUB_SHA || '').slice(0, 12);
+const version = existsSync('package.json') ? JSON.parse(readFileSync('package.json', 'utf8')).version : JSON.parse(readFileSync('versions.json', 'utf8')).sdkVersion;
+const normalized = String(version).replace(/[^0-9A-Za-z._-]/g, '-');
+const tag = 'release/' + branch + '/v' + normalized + '-' + sha;
+run('git', ['config', 'user.name', 'github-actions[bot]']);
+run('git', ['config', 'user.email', 'github-actions[bot]@users.noreply.github.com']);
+run('git', ['tag', tag]);
+run('git', ['push', 'origin', tag]);

package/scripts/publish-from-tag.mjs ADDED Viewed

@@ -0,0 +1,41 @@
+#!/usr/bin/env node
+import { spawnSync } from 'node:child_process';
+import { readFileSync } from 'node:fs';
+function run(command, args, options = {}) {
+  const result = spawnSync(command, args, { stdio: options.stdio || 'inherit', encoding: options.encoding });
+  if (result.status !== 0 && !options.allowFailure) process.exit(result.status || 1);
+  return result;
+}
+function npmView(packageSpec) {
+  return run('npm', ['view', packageSpec, 'version'], { allowFailure: true, stdio: 'pipe', encoding: 'utf8' }).status === 0;
+}
+const pkg = JSON.parse(readFileSync('package.json', 'utf8'));
+const ref = process.env.GITHUB_REF_NAME || '';
+const branch = ref.split('/')[1] || 'develop';
+const tag = branch === 'main' ? 'latest' : branch;
+if (!process.env.NODE_AUTH_TOKEN) {
+  console.log('NODE_AUTH_TOKEN is not configured; skipping npm publish.');
+  process.exit(0);
+}
+if (npmView(pkg.name + '@' + pkg.version)) {
+  console.log(pkg.name + '@' + pkg.version + ' already exists; ensuring dist-tag ' + tag + '.');
+  run('npm', ['dist-tag', 'add', pkg.name + '@' + pkg.version, tag], { allowFailure: true });
+  process.exit(0);
+}
+for (const field of ['dependencies', 'peerDependencies', 'optionalDependencies']) {
+  for (const [name, version] of Object.entries(pkg[field] || {})) {
+    if (!name.startsWith('@a5c-ai/') || version.startsWith('^') || version.startsWith('~') || version === '*' || version.startsWith('workspace:')) continue;
+    if (!npmView(name + '@' + version)) {
+      console.log('Required internal dependency ' + name + '@' + version + ' is not published yet; skipping npm publish.');
+      process.exit(0);
+    }
+  }
+}
+run('npm', ['publish', '--access', 'public', '--tag', tag]);

package/skills/babysit/SKILL.md CHANGED Viewed

@@ -1,14 +1,12 @@
 ---
 name: babysit
 description: >-
-  Orchestrate via @babysitter. Use this skill when asked to babysit a run,
-  orchestrate a process or whenever it is called explicitly. (babysit,
-  babysitter, orchestrate, orchestrate a run, workflow, etc.)
+  Execute via @babysitter. Use this skill when asked to babysit a task, to do anything that is structured and process-driven (even a loop), or whenever it is called explicitly. (babysit, babysitter, with a process, orchestrate, orchestrate a run, workflow, loop until, etc.)
 ---
 # babysit
-Orchestrate `.a5c/runs/<runId>/` through iterative execution.
+Follow the commands below exactly, but apply judgement and creativity to get the job done. No matter how small or simple the task may seem, you must use the babysitter SDK and run lifecycle to execute it. This is non-negotiable. If you are asked to do something that seems like it could be done with a simple tool call, you must still use the babysitter SDK to create a run, define tasks, execute them, and complete the run. This is how you will learn and demonstrate mastery of the babysitter system. Always follow the full process, even for trivial tasks.
 ## Dependencies

package/skills/call/SKILL.md CHANGED Viewed

@@ -5,4 +5,8 @@ description: Orchestrate a babysitter run. use this command to start babysitting
 # call
-Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md).
+Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md). Then continue executing the returned instructions in this same turn. Do not stop after the Skill tool returns; carry the requested run through to completion proof.
+User arguments for this command:
+$ARGUMENTS

package/skills/cleanup/SKILL.md CHANGED Viewed

@@ -11,11 +11,33 @@ Create and run a cleanup process using the process at `skills\babysit\process\cr
 Implementation notes (for the process):
 - Parse arguments for `--dry-run` flag (if present, set dryRun: true in inputs) and `--keep-days N` (default: 7)
-- The process scans .a5c/runs/ for completed/failed runs, aggregates insights, writes summaries, then removes old data
-- Always show the user what will be removed before removing (in interactive mode via breakpoints)
-- In non-interactive mode (yolo), proceed with cleanup using defaults
-- The insights file goes to docs/run-history-insights.md
-- Only remove terminal runs (completed/failed) older than the keep-days threshold
-- Never remove active/in-progress runs
-- Remove orphaned process files not referenced by remaining runs
-- After cleanup, show remaining run count and disk usage
+CRITICAL: The cleanup MUST follow this exact phase order. Do NOT delete any run before Phase 2 completes.
+Phase 1 — Scan:
+- Scan .a5c/runs/ for all runs
+- Classify each as terminal (completed/failed) or active (in-progress/created)
+- Identify terminal runs older than the keep-days threshold as removal candidates
+- Never mark active/in-progress runs for removal
+- Count and report: total runs, terminal, active, removal candidates, disk usage
+Phase 2 — Aggregate insights (BEFORE any deletion):
+- For EVERY removal candidate, read its run.json and journal/ events
+- Extract: processId, prompt, status, event count, created date, task summaries
+- Group by process type and extract patterns (retry counts, convergence behavior, failure modes)
+- Append a new dated section to docs/run-history-insights.md with:
+  - Summary statistics (runs removed, disk freed, runs retained)
+  - Run categories with counts and descriptions
+  - Key patterns observed (multi-batch convergence, retry behavior, etc.)
+  - What worked well / what didn't from the run data
+- This file MUST be written and verified before proceeding to Phase 3
+Phase 3 — Confirm removal:
+- In interactive mode, show the user what will be removed via a breakpoint
+- In non-interactive mode (yolo), proceed with defaults
+- In dry-run mode, stop here and show what would be removed
+Phase 4 — Remove:
+- Delete the terminal runs older than the keep-days threshold
+- Identify and remove orphaned process files not referenced by remaining runs
+- Show remaining run count and disk usage after cleanup

package/skills/doctor/SKILL.md CHANGED Viewed

@@ -157,7 +157,6 @@ If it exists:
 **Goal:** Inspect babysitter session files for health and detect runaway loops.
 - Search for session state files using Glob:
-  - `plugins/babysitter/skills/babysit/state/*.md`
   - `.a5c/state/*.md`
   - `.a5c/state/*.json`
 - For each session state file found:
@@ -261,7 +260,7 @@ Mark as PASS if total size < 500MB and no files > 10MB. Mark as WARN if total si
 ### 10a. Hook Registration
-- Locate the plugin root. Check for `CLAUDE_PLUGIN_ROOT` env var, or search for `plugins/babysitter/hooks/hooks.json` by walking up from the current directory.
+- Locate the plugin root. Check the `CLAUDE_PLUGIN_ROOT` env var first; if it is not set, search for a babysitter `hooks.json` by walking up from the current directory.
 - If found, read `hooks.json` and verify:
   - A `Stop` hook entry exists with a command referencing `babysitter-stop-hook.sh`.
   - A `SessionStart` hook entry exists with a command referencing `babysitter-session-start-hook.sh`.
@@ -316,7 +315,7 @@ If the stop hook shows NO evidence of execution (no log entries, no journal even
 Perform these diagnostic steps in order and report the first failure found:
-1. **Plugin not installed**: Check if `plugins/babysitter/` exists relative to the project root and if `CLAUDE_PLUGIN_ROOT` is set. If the plugin directory doesn't exist, report: "Plugin not installed — the babysitter plugin directory is missing."
+1. **Plugin not installed**: Check if `CLAUDE_PLUGIN_ROOT` is set or if a babysitter plugin directory exists relative to the project root. If the variable is unset and no plugin directory exists, report: "Plugin not installed — the babysitter plugin directory is missing."
 2. **Plugin not enabled**: Check for Claude settings files:
    - `~/.claude/settings.json` — look for `babysitter` in `enabledPlugins`.

package/skills/help/SKILL.md CHANGED Viewed

@@ -234,7 +234,8 @@ SECONDARY COMMANDS
   How it works: Runs npx @a5c-ai/babysitter-observer-dashboard@latest which watches
   the .a5c/runs/ directory (or a parent directory containing multiple projects) and
   serves a live dashboard. The process is blocking -- it runs until you stop it, and
-  it prints the local URL to share with the user.
+  it prints the local URL to share with the user. Do not use `babysitter observe`
+  as a fallback; the core Babysitter CLI does not expose that subcommand.
   Example: /babysitter:observe
   (opens browser showing all runs with live-updating task

package/skills/observe/SKILL.md CHANGED Viewed

@@ -8,6 +8,11 @@ description: Launch the babysitter observer dashboard. Installs and runs the rea
 Run the babysitter observer dashboard:
 1. Determine the watch directory — this is usually the project's container directory (the parent of the project dir), or the current working directory if not specified.
-2. Launch the dashboard: `npx -y @a5c-ai/babysitter-observer-dashboard@latest --watch-dir <dir>`
+2. Launch the standalone dashboard package: `npx -y @a5c-ai/babysitter-observer-dashboard@latest --watch-dir <dir>`.
 3. This is a blocking process — it will keep running until stopped.
 4. Report the URL printed by the dashboard to the user, then open it in the browser.
+Do not fall back to `babysitter observe`; the core Babysitter CLI does not expose
+that subcommand. Some harness runtimes may provide a separate
+`babysitter-agent observe` surface, but this skill uses the verified standalone
+dashboard package.

package/skills/yolo/SKILL.md CHANGED Viewed

@@ -5,4 +5,8 @@ description: Orchestrate a babysitter run. use this command to start babysitting
 # yolo
-Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md). but without any user interaction or breakpoints in the run.
+Start the Babysitter run directly through the CLI, without any user interaction or breakpoints. Do not invoke the Skill tool and do not run an instructions-only command. In Claude Code, use Bash to run `babysitter-agent yolo --harness claude-code --workspace "$PWD" --prompt "<user arguments>" --json`; in Codex, run `babysitter-agent yolo --harness codex --workspace "$PWD" --prompt "<user arguments>" --json`; in other harnesses, use the same command with that harness id. Replace `<user arguments>` with the arguments shown below, wait for the command to finish, and treat the CLI completion proof as the result.
+User arguments for this command:
+$ARGUMENTS

package/versions.json CHANGED Viewed

@@ -1,3 +1,4 @@
 {
-  "sdkVersion": "5.0.1-staging.e4c68b9b"
+  "sdkVersion": "5.0.1-staging.e920fef118ef",
+  "extensionVersion": "5.0.1-staging.e920fef118ef"
 }

package/scripts/sync-command-surfaces.js DELETED Viewed

@@ -1,62 +0,0 @@
-'use strict';
-const path = require('path');
-const {
-  listDirectories,
-  listMarkdownBasenames,
-  reportCheckResult,
-  syncCommandMirrors,
-  syncSkillsFromCommands,
-} = require('../../../scripts/plugin-command-sync-lib.cjs');
-const PACKAGE_ROOT = path.resolve(__dirname, '..');
-const REPO_ROOT = path.resolve(PACKAGE_ROOT, '..', '..');
-const ROOT_COMMANDS = path.join(REPO_ROOT, 'plugins', 'babysitter', 'commands');
-const PLUGIN_COMMANDS = path.join(PACKAGE_ROOT, 'commands');
-const PLUGIN_SKILLS = path.join(PACKAGE_ROOT, 'skills');
-const LABEL = 'babysitter-github sync';
-function getMirroredCommandNames() {
-  const local = new Set(listMarkdownBasenames(PLUGIN_COMMANDS));
-  return listMarkdownBasenames(ROOT_COMMANDS).filter((name) => local.has(name));
-}
-function getDerivedSkillNames() {
-  const local = new Set(listDirectories(PLUGIN_SKILLS));
-  return listMarkdownBasenames(PLUGIN_COMMANDS).filter((name) => local.has(name));
-}
-function main() {
-  const check = process.argv.includes('--check');
-  const mirrorResult = syncCommandMirrors({
-    label: LABEL,
-    sourceRoot: ROOT_COMMANDS,
-    targetRoot: PLUGIN_COMMANDS,
-    names: getMirroredCommandNames(),
-    check,
-    cwd: PACKAGE_ROOT,
-  });
-  const skillsResult = syncSkillsFromCommands({
-    label: LABEL,
-    sourceRoot: PLUGIN_COMMANDS,
-    skillsRoot: PLUGIN_SKILLS,
-    names: getDerivedSkillNames(),
-    check,
-    cwd: PACKAGE_ROOT,
-  });
-  if (check) {
-    reportCheckResult(LABEL, [...mirrorResult.stale, ...skillsResult.stale]);
-    return;
-  }
-  const updated = mirrorResult.updated + skillsResult.updated;
-  if (updated === 0) {
-    console.log(`[${LABEL}] no GitHub plugin command changes were needed.`);
-    return;
-  }
-  console.log(`[${LABEL}] updated ${updated} GitHub plugin file(s).`);
-}
-main();