@a5c-ai/babysitter-github 5.0.1-staging.e4c68b9b → 5.0.1-staging.e920fef118ef

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/README.md CHANGED
@@ -18,7 +18,8 @@ directly.
18
18
  - **Node.js 22+**
19
19
  - **GitHub Copilot CLI** (`copilot`) -- requires an active GitHub Copilot
20
20
  subscription
21
- - **Babysitter SDK CLI** (`@a5c-ai/babysitter-sdk`) -- installed globally
21
+ - **Babysitter CLI** (`@a5c-ai/babysitter`) -- installed globally when using
22
+ the SDK helper
22
23
 
23
24
  ## Installation
24
25
 
@@ -28,7 +29,7 @@ Register the a5c.ai marketplace and install the plugin:
28
29
 
29
30
  ```bash
30
31
  # Register the marketplace
31
- copilot plugin marketplace add a5c-ai/babysitter
32
+ copilot plugin marketplace add a5c-ai/babysitter-claude
32
33
 
33
34
  # Install the plugin
34
35
  copilot plugin install babysitter
@@ -36,42 +37,50 @@ copilot plugin install babysitter
36
37
 
37
38
  ### Direct GitHub install
38
39
 
39
- Install directly from the Git repository using Copilot CLI. Copilot CLI
40
- discovers the plugin via `.github/plugin/marketplace.json` at the repo root:
40
+ Install directly from the generated external plugin repository:
41
41
 
42
42
  ```bash
43
- copilot plugin install a5c-ai/babysitter
43
+ copilot plugin install a5c-ai/babysitter-github-copilot
44
44
  ```
45
45
 
46
- ### Alternative Installation (npm / development)
46
+ ### Alternative Installation (SDK helper / development)
47
47
 
48
- For development or environments where the Copilot CLI plugin system is not
49
- available, install via npm:
48
+ For development, automation, or environments where the Copilot CLI plugin system is not available, install through the Babysitter SDK helper. This is the canonical scriptable path used by the installer tests and resolves to `npx --yes @a5c-ai/babysitter-github install ...` under the hood:
50
49
 
51
- Install the SDK CLI first:
50
+ Install the Babysitter CLI first:
52
51
 
53
52
  ```bash
54
- npm install -g @a5c-ai/babysitter-sdk
53
+ npm install -g @a5c-ai/babysitter
55
54
  ```
56
55
 
57
- Then install the GitHub Copilot plugin globally:
56
+ Then install the GitHub Copilot plugin globally or into a workspace:
58
57
 
59
58
  ```bash
60
- npm install -g @a5c-ai/babysitter-github
61
- babysitter-github install
59
+ # Global install
60
+ babysitter harness:install-plugin github-copilot
61
+
62
+ # Workspace install
63
+ babysitter harness:install-plugin github-copilot --workspace /path/to/repo
62
64
  ```
63
65
 
64
- Or install from source:
66
+ You can also run the published package installer directly:
65
67
 
66
68
  ```bash
67
- cd plugins/babysitter-github
68
- node bin/install.js
69
+ npx --yes @a5c-ai/babysitter-github install --global
70
+ npx --yes @a5c-ai/babysitter-github install --workspace /path/to/repo
71
+ ```
72
+
73
+ Or install from generated source:
74
+
75
+ ```bash
76
+ npm run generate:plugins
77
+ node artifacts/generated-plugins/github-copilot/bin/install.js
69
78
  ```
70
79
 
71
- Install into a specific workspace:
80
+ Install into a specific workspace from generated source:
72
81
 
73
82
  ```bash
74
- babysitter-github install --workspace /path/to/repo
83
+ node artifacts/generated-plugins/github-copilot/bin/install.js --workspace /path/to/repo
75
84
  ```
76
85
 
77
86
  ### GitHub Copilot cloud agent installation
@@ -253,8 +262,7 @@ Copilot CLI looks for the plugin manifest in these paths, checked in order:
253
262
  The first match wins. This plugin uses `plugin.json` at the package root.
254
263
 
255
264
  For marketplace discovery, Copilot CLI looks for `.github/plugin/marketplace.json`
256
- at the repository root. This file lists all available plugins in the repo and is
257
- used when installing via `copilot plugin install OWNER/REPO`.
265
+ at the repository root of the generated plugin repository.
258
266
 
259
267
  ### plugin.json Schema
260
268
 
@@ -404,7 +412,7 @@ repository root in `.github/plugin/marketplace.json`:
404
412
  "name": "babysitter",
405
413
  "description": "Multi-step workflow orchestration with event-sourced state",
406
414
  "version": "0.1.0",
407
- "source": "./plugins/babysitter-github"
415
+ "source": "./"
408
416
  }
409
417
  ]
410
418
  }
@@ -461,7 +469,7 @@ These registries are available without running `marketplace add`.
461
469
  ## Plugin Structure (Directory Layout)
462
470
 
463
471
  ```
464
- plugins/babysitter-github/
472
+ artifacts/generated-plugins/github-copilot/
465
473
  plugin.json # Plugin manifest (skills, hooks, metadata)
466
474
  .github/plugin.json # Plugin manifest (alternate discovery path)
467
475
  hooks.json # Hook configuration (sessionStart, sessionEnd, userPromptSubmitted)
@@ -579,14 +587,14 @@ compatibility where PowerShell execution is available.
579
587
  git clone https://github.com/a5c-ai/babysitter.git
580
588
  cd babysitter
581
589
  npm install
582
- cd plugins/babysitter-github
590
+ npm run generate:plugins
583
591
  node bin/install.js
584
592
  ```
585
593
 
586
594
  ### Publishing
587
595
 
588
596
  ```bash
589
- cd plugins/babysitter-github
597
+ cd artifacts/generated-plugins/github-copilot
590
598
  npm run deploy # Publish to npm (public)
591
599
  npm run deploy:staging # Publish to npm with staging tag
592
600
  ```
@@ -594,7 +602,7 @@ npm run deploy:staging # Publish to npm with staging tag
594
602
  ### Team installation
595
603
 
596
604
  ```bash
597
- cd plugins/babysitter-github
605
+ cd artifacts/generated-plugins/github-copilot
598
606
  npm run team:install
599
607
  ```
600
608
 
@@ -13,7 +13,7 @@ function getUserHome() {
13
13
  }
14
14
 
15
15
  function getHarnessHome() {
16
- return path.join(os.homedir(), '.copilot');
16
+ return path.join(os.homedir(), ".copilot");
17
17
  }
18
18
 
19
19
  function getHomePluginRoot(scope) {
@@ -104,7 +104,7 @@ function ensureMarketplaceEntry(marketplacePath, pluginRoot) {
104
104
  name: PLUGIN_NAME,
105
105
  source: relSource,
106
106
  description: "Orchestrate complex, multi-step workflows with event-sourced state management, hook-based extensibility, and human-in-the-loop approval",
107
- version: "5.0.0",
107
+ version: "5.0.1-staging.e920fef118ef",
108
108
  author: { name: "a5c.ai" },
109
109
  };
110
110
  if (idx >= 0) marketplace.plugins[idx] = entry;
@@ -454,8 +454,9 @@ function installManagedHooks(packageRoot, copilotHome) {
454
454
  mergeManagedHooksConfig(packageRoot, copilotHome);
455
455
  }
456
456
 
457
- function removeLegacyHooks(copilotHome) {
458
- for (const hookName of LEGACY_HOOK_SCRIPT_NAMES) {
457
+ function removeManagedHooks(copilotHome) {
458
+ const managedHookNames = [...LEGACY_HOOK_SCRIPT_NAMES, ...HOOK_SCRIPT_NAMES];
459
+ for (const hookName of managedHookNames) {
459
460
  fs.rmSync(path.join(copilotHome, 'hooks', hookName), { force: true });
460
461
  }
461
462
 
@@ -476,10 +477,17 @@ function removeLegacyHooks(copilotHome) {
476
477
  const eventHooks = Array.isArray(hooksConfig.hooks[eventName]) ? hooksConfig.hooks[eventName] : [];
477
478
  const filteredMatchers = eventHooks
478
479
  .map((matcher) => {
480
+ const directBash = String(matcher?.bash || matcher?.command || '');
481
+ const directPs = String(matcher?.powershell || '');
482
+ const hasDirectHook = directBash.length > 0 || directPs.length > 0;
483
+ const directIsManaged = managedHookNames.some((name) => directBash.includes(name) || directPs.includes(name));
484
+ if (hasDirectHook) {
485
+ return directIsManaged ? null : matcher;
486
+ }
479
487
  const hooks = Array.isArray(matcher.hooks) ? matcher.hooks : [];
480
488
  const keptHooks = hooks.filter((hook) => {
481
489
  const command = String(hook.command || '');
482
- return !LEGACY_HOOK_SCRIPT_NAMES.some((name) => command.includes(name));
490
+ return !managedHookNames.some((name) => command.includes(name));
483
491
  });
484
492
  return keptHooks.length > 0 ? { ...matcher, hooks: keptHooks } : null;
485
493
  })
@@ -498,11 +506,13 @@ function removeLegacyHooks(copilotHome) {
498
506
  }
499
507
 
500
508
  function installCopilotSurface(packageRoot, copilotHome) {
501
- removeLegacyHooks(copilotHome);
509
+ removeManagedHooks(copilotHome);
502
510
  installManagedSkills(packageRoot, copilotHome);
503
511
  installManagedHooks(packageRoot, copilotHome);
504
512
  }
505
513
 
514
+ const removeLegacyHooks = removeManagedHooks;
515
+
506
516
  function renderCloudAgentAgentsBlock() {
507
517
  return [
508
518
  '## Babysitter Cloud Agent',
@@ -831,10 +841,19 @@ module.exports = {
831
841
  resolveCliCommand,
832
842
  runCli,
833
843
  ensureGlobalProcessLibrary,
844
+ PLUGIN_BUNDLE_ENTRIES,
845
+ copyRecursive,
846
+ copyPluginBundle,
847
+ DEFAULT_MARKETPLACE,
848
+ normalizeMarketplaceSourcePath,
849
+ ensureMarketplaceEntry,
850
+ removeMarketplaceEntry,
851
+ installManagedSkills,
852
+ mergeManagedHooksConfig,
853
+ installManagedHooks,
854
+ warnWindowsHooks,
834
855
  LEGACY_HOOK_SCRIPT_NAMES,
835
856
  HOOK_SCRIPT_NAMES,
836
- DEFAULT_MARKETPLACE,
837
- PLUGIN_BUNDLE_ENTRIES,
838
857
  CLOUD_AGENT_BUNDLE_ENTRIES,
839
858
  MANAGED_BLOCK_START,
840
859
  MANAGED_BLOCK_END,
@@ -849,10 +868,8 @@ module.exports = {
849
868
  rewriteCloudSkill,
850
869
  registerCopilotPlugin,
851
870
  deregisterCopilotPlugin,
852
- installManagedSkills,
853
- mergeManagedHooksConfig,
854
- installManagedHooks,
855
871
  removeLegacyHooks,
872
+ removeManagedHooks,
856
873
  installCopilotSurface,
857
874
  renderCloudAgentAgentsBlock,
858
875
  renderCloudAgentCopilotInstructionsBlock,
@@ -862,12 +879,6 @@ module.exports = {
862
879
  installCloudAgentInstructions,
863
880
  installCloudAgentSetupSteps,
864
881
  installCloudAgentSurface,
865
- normalizeMarketplaceSourcePath,
866
- ensureMarketplaceEntry,
867
- removeMarketplaceEntry,
868
- warnWindowsHooks,
869
- copyPluginBundle,
870
- copyRecursive,
871
882
  harnessCliRoute,
872
883
  harnessInstall,
873
884
  };
package/bin/install.js CHANGED
@@ -65,6 +65,15 @@ function main() {
65
65
  try {
66
66
  shared.copyPluginBundle(PACKAGE_ROOT, pluginRoot);
67
67
  shared.ensureMarketplaceEntry(marketplacePath, pluginRoot);
68
+ if (typeof shared.registerCopilotPlugin === 'function') {
69
+ shared.registerCopilotPlugin(pluginRoot);
70
+ }
71
+ if (typeof shared.installCopilotSurface === 'function' && typeof shared.getCopilotHome === 'function') {
72
+ shared.installCopilotSurface(PACKAGE_ROOT, shared.getCopilotHome());
73
+ }
74
+ if (typeof shared.warnWindowsHooks === 'function') {
75
+ shared.warnWindowsHooks();
76
+ }
68
77
  if (typeof shared.harnessInstall === 'function') {
69
78
  shared.harnessInstall(PACKAGE_ROOT, pluginRoot);
70
79
  }
package/bin/uninstall.js CHANGED
@@ -7,17 +7,38 @@ const shared = require('./install-shared');
7
7
 
8
8
  function main() {
9
9
  const pluginRoot = shared.getHomePluginRoot();
10
+ const marketplacePath = typeof shared.getHomeMarketplacePath === 'function'
11
+ ? shared.getHomeMarketplacePath()
12
+ : null;
13
+ const copilotHome = typeof shared.getCopilotHome === 'function'
14
+ ? shared.getCopilotHome()
15
+ : null;
10
16
 
11
17
  if (!fs.existsSync(pluginRoot)) {
12
18
  console.log(`[${shared.PLUGIN_NAME}] Plugin not installed at ${pluginRoot}`);
13
- return;
19
+ } else {
20
+ try {
21
+ fs.rmSync(pluginRoot, { recursive: true, force: true });
22
+ console.log(`[${shared.PLUGIN_NAME}] Uninstalled from ${pluginRoot}`);
23
+ } catch (err) {
24
+ console.error(`[${shared.PLUGIN_NAME}] Failed to uninstall: ${err.message}`);
25
+ process.exitCode = 1;
26
+ return;
27
+ }
14
28
  }
15
29
 
16
30
  try {
17
- fs.rmSync(pluginRoot, { recursive: true, force: true });
18
- console.log(`[${shared.PLUGIN_NAME}] Uninstalled from ${pluginRoot}`);
31
+ if (typeof shared.deregisterCopilotPlugin === 'function') {
32
+ shared.deregisterCopilotPlugin(pluginRoot);
33
+ }
34
+ if (copilotHome && typeof shared.removeManagedHooks === 'function') {
35
+ shared.removeManagedHooks(copilotHome);
36
+ }
37
+ if (marketplacePath && typeof shared.removeMarketplaceEntry === 'function') {
38
+ shared.removeMarketplaceEntry(marketplacePath);
39
+ }
19
40
  } catch (err) {
20
- console.error(`[${shared.PLUGIN_NAME}] Failed to uninstall: ${err.message}`);
41
+ console.error(`[${shared.PLUGIN_NAME}] Failed to clean up uninstall state: ${err.message}`);
21
42
  process.exitCode = 1;
22
43
  }
23
44
  }
package/commands/call.md CHANGED
@@ -4,4 +4,8 @@ argument-hint: Specific instructions for the run.
4
4
  allowed-tools: Read, Grep, Write, Task, Bash, Edit, Grep, Glob, WebFetch, WebSearch, Search, AskUserQuestion, TodoWrite, TodoRead, Skill, BashOutput, KillShell, MultiEdit, LS
5
5
  ---
6
6
 
7
- Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md).
7
+ Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md). Then continue executing the returned instructions in this same turn. Do not stop after the Skill tool returns; carry the requested run through to completion proof.
8
+
9
+ User arguments for this command:
10
+
11
+ $ARGUMENTS
@@ -10,11 +10,33 @@ Create and run a cleanup process using the process at `skills\babysit\process\cr
10
10
 
11
11
  Implementation notes (for the process):
12
12
  - Parse arguments for `--dry-run` flag (if present, set dryRun: true in inputs) and `--keep-days N` (default: 7)
13
- - The process scans .a5c/runs/ for completed/failed runs, aggregates insights, writes summaries, then removes old data
14
- - Always show the user what will be removed before removing (in interactive mode via breakpoints)
15
- - In non-interactive mode (yolo), proceed with cleanup using defaults
16
- - The insights file goes to docs/run-history-insights.md
17
- - Only remove terminal runs (completed/failed) older than the keep-days threshold
18
- - Never remove active/in-progress runs
19
- - Remove orphaned process files not referenced by remaining runs
20
- - After cleanup, show remaining run count and disk usage
13
+
14
+ CRITICAL: The cleanup MUST follow this exact phase order. Do NOT delete any run before Phase 2 completes.
15
+
16
+ Phase 1 — Scan:
17
+ - Scan .a5c/runs/ for all runs
18
+ - Classify each as terminal (completed/failed) or active (in-progress/created)
19
+ - Identify terminal runs older than the keep-days threshold as removal candidates
20
+ - Never mark active/in-progress runs for removal
21
+ - Count and report: total runs, terminal, active, removal candidates, disk usage
22
+
23
+ Phase 2 — Aggregate insights (BEFORE any deletion):
24
+ - For EVERY removal candidate, read its run.json and journal/ events
25
+ - Extract: processId, prompt, status, event count, created date, task summaries
26
+ - Group by process type and extract patterns (retry counts, convergence behavior, failure modes)
27
+ - Append a new dated section to docs/run-history-insights.md with:
28
+ - Summary statistics (runs removed, disk freed, runs retained)
29
+ - Run categories with counts and descriptions
30
+ - Key patterns observed (multi-batch convergence, retry behavior, etc.)
31
+ - What worked well / what didn't from the run data
32
+ - This file MUST be written and verified before proceeding to Phase 3
33
+
34
+ Phase 3 — Confirm removal:
35
+ - In interactive mode, show the user what will be removed via a breakpoint
36
+ - In non-interactive mode (yolo), proceed with defaults
37
+ - In dry-run mode, stop here and show what would be removed
38
+
39
+ Phase 4 — Remove:
40
+ - Delete the terminal runs older than keep-days threshold
41
+ - Identify and remove orphaned process files not referenced by remaining runs
42
+ - Show remaining run count and disk usage after cleanup
@@ -156,7 +156,6 @@ If it exists:
156
156
  **Goal:** Inspect babysitter session files for health and detect runaway loops.
157
157
 
158
158
  - Search for session state files using Glob:
159
- - `plugins/babysitter/skills/babysit/state/*.md`
160
159
  - `.a5c/state/*.md`
161
160
  - `.a5c/state/*.json`
162
161
  - For each session state file found:
@@ -260,7 +259,7 @@ Mark as PASS if total size < 500MB and no files > 10MB. Mark as WARN if total si
260
259
 
261
260
  ### 10a. Hook Registration
262
261
 
263
- - Locate the plugin root. Check for `CLAUDE_PLUGIN_ROOT` env var, or search for `plugins/babysitter/hooks/hooks.json` by walking up from the current directory.
262
+ - Locate the plugin root. Check for `CLAUDE_PLUGIN_ROOT` env var first, or search for a babysitter `hooks.json` by walking up from the current directory.
264
263
  - If found, read `hooks.json` and verify:
265
264
  - A `Stop` hook entry exists with a command referencing `babysitter-stop-hook.sh`.
266
265
  - A `SessionStart` hook entry exists with a command referencing `babysitter-session-start-hook.sh`.
@@ -315,7 +314,7 @@ If the stop hook shows NO evidence of execution (no log entries, no journal even
315
314
 
316
315
  Perform these diagnostic steps in order and report the first failure found:
317
316
 
318
- 1. **Plugin not installed**: Check if `plugins/babysitter/` exists relative to the project root and if `CLAUDE_PLUGIN_ROOT` is set. If the plugin directory doesn't exist, report: "Plugin not installed — the babysitter plugin directory is missing."
317
+ 1. **Plugin not installed**: Check if `CLAUDE_PLUGIN_ROOT` is set or if a babysitter plugin directory exists relative to the project root. If neither exists, report: "Plugin not installed — the babysitter plugin directory is missing."
319
318
 
320
319
  2. **Plugin not enabled**: Check for Claude settings files:
321
320
  - `~/.claude/settings.json` — look for `babysitter` in `enabledPlugins`.
package/commands/help.md CHANGED
@@ -233,7 +233,8 @@ SECONDARY COMMANDS
233
233
  How it works: Runs npx @a5c-ai/babysitter-observer-dashboard@latest which watches
234
234
  the .a5c/runs/ directory (or a parent directory containing multiple projects) and
235
235
  serves a live dashboard. The process is blocking -- it runs until you stop it, and
236
- it prints the local URL to share with the user.
236
+ it prints the local URL to share with the user. Do not use `babysitter observe`
237
+ as a fallback; the core Babysitter CLI does not expose that subcommand.
237
238
 
238
239
  Example: /babysitter:observe
239
240
  (opens browser showing all runs with live-updating task
@@ -7,6 +7,11 @@ allowed-tools: Read, Grep, Write, Task, Bash
7
7
  Run the babysitter observer dashboard:
8
8
 
9
9
  1. Determine the watch directory — this is usually the project's container directory (the parent of the project dir), or the current working directory if not specified.
10
- 2. Launch the dashboard: `npx -y @a5c-ai/babysitter-observer-dashboard@latest --watch-dir <dir>`
10
+ 2. Launch the standalone dashboard package: `npx -y @a5c-ai/babysitter-observer-dashboard@latest --watch-dir <dir>`.
11
11
  3. This is a blocking process — it will keep running until stopped.
12
12
  4. Report the URL printed by the dashboard to the user, then open it in the browser.
13
+
14
+ Do not fall back to `babysitter observe`; the core Babysitter CLI does not expose
15
+ that subcommand. Some harness runtimes may provide a separate
16
+ `babysitter-agent observe` surface, but this skill uses the verified standalone
17
+ dashboard package.
package/commands/yolo.md CHANGED
@@ -1,7 +1,11 @@
1
- ---
2
- description: Orchestrate a babysitter run. use this command to start babysitting a complex workflow in a non-interactive mode, without any user interaction or breakpoints in the run.
3
- argument-hint: Specific instructions for the run.
4
- allowed-tools: Read, Grep, Write, Task, Bash, Edit, Grep, Glob, WebFetch, WebSearch, Search, AskUserQuestion, TodoWrite, TodoRead, Skill, BashOutput, KillShell, MultiEdit, LS
5
- ---
6
-
7
- Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md). but without any user interaction or breakpoints in the run.
1
+ ---
2
+ description: Orchestrate a babysitter run. use this command to start babysitting a complex workflow in a non-interactive mode, without any user interaction or breakpoints in the run.
3
+ argument-hint: Specific instructions for the run.
4
+ allowed-tools: Read, Grep, Write, Task, Bash, Edit, Grep, Glob, WebFetch, WebSearch, Search, AskUserQuestion, TodoWrite, TodoRead, Skill, BashOutput, KillShell, MultiEdit, LS
5
+ ---
6
+
7
+ Start the Babysitter run directly through the CLI, without any user interaction or breakpoints. Do not invoke the Skill tool and do not run an instructions-only command. In Claude Code, use Bash to run `babysitter-agent yolo --harness claude-code --workspace "$PWD" --prompt "<user arguments>" --json`; in Codex, run `babysitter-agent yolo --harness codex --workspace "$PWD" --prompt "<user arguments>" --json`; in other harnesses, use the same command with that harness id. Replace `<user arguments>` with the arguments shown below, wait for the command to finish, and treat the CLI completion proof as the result.
8
+
9
+ User arguments for this command:
10
+
11
+ $ARGUMENTS
@@ -0,0 +1,12 @@
1
+ # PowerShell hook wrapper — sets env vars and delegates to bash
2
+ $env:HOOK_TYPE = 'post-tool-use'
3
+ $env:ADAPTER_NAME = 'copilot'
4
+ $env:PLUGIN_ROOT = Split-Path -Parent (Split-Path -Parent $PSScriptRoot)
5
+
6
+ $input_data = [Console]::In.ReadToEnd()
7
+ $result = $input_data | & bash "$PSScriptRoot/../$($MyInvocation.MyCommand.Name -replace '\.ps1$','.sh')" 2>$null
8
+ if ($LASTEXITCODE -eq 0 -and $result) {
9
+ Write-Output $result
10
+ } else {
11
+ Write-Output '{}'
12
+ }
@@ -0,0 +1,3 @@
1
+ #!/bin/bash
2
+ set -euo pipefail
3
+ babysitter hook:run --harness unified --hook-type post-tool-use --json
@@ -0,0 +1,12 @@
1
+ # PowerShell hook wrapper — sets env vars and delegates to bash
2
+ $env:HOOK_TYPE = 'pre-compact'
3
+ $env:ADAPTER_NAME = 'copilot'
4
+ $env:PLUGIN_ROOT = Split-Path -Parent (Split-Path -Parent $PSScriptRoot)
5
+
6
+ $input_data = [Console]::In.ReadToEnd()
7
+ $result = $input_data | & bash "$PSScriptRoot/../$($MyInvocation.MyCommand.Name -replace '\.ps1$','.sh')" 2>$null
8
+ if ($LASTEXITCODE -eq 0 -and $result) {
9
+ Write-Output $result
10
+ } else {
11
+ Write-Output '{}'
12
+ }
@@ -0,0 +1,3 @@
1
+ #!/bin/bash
2
+ set -euo pipefail
3
+ babysitter hook:run --harness unified --hook-type pre-compact --json
@@ -0,0 +1,12 @@
1
+ # PowerShell hook wrapper — sets env vars and delegates to bash
2
+ $env:HOOK_TYPE = 'pre-tool-use'
3
+ $env:ADAPTER_NAME = 'copilot'
4
+ $env:PLUGIN_ROOT = Split-Path -Parent (Split-Path -Parent $PSScriptRoot)
5
+
6
+ $input_data = [Console]::In.ReadToEnd()
7
+ $result = $input_data | & bash "$PSScriptRoot/../$($MyInvocation.MyCommand.Name -replace '\.ps1$','.sh')" 2>$null
8
+ if ($LASTEXITCODE -eq 0 -and $result) {
9
+ Write-Output $result
10
+ } else {
11
+ Write-Output '{}'
12
+ }
@@ -0,0 +1,3 @@
1
+ #!/bin/bash
2
+ set -euo pipefail
3
+ babysitter hook:run --harness unified --hook-type pre-tool-use --json
File without changes
File without changes
File without changes
package/hooks.json CHANGED
@@ -17,6 +17,30 @@
17
17
  "timeoutSec": 15
18
18
  }
19
19
  ],
20
+ "preToolUse": [
21
+ {
22
+ "type": "command",
23
+ "bash": "./hooks/babysitter-proxied-pre-tool-use.sh",
24
+ "powershell": "./hooks/babysitter-proxied-pre-tool-use.ps1",
25
+ "timeoutSec": 30
26
+ }
27
+ ],
28
+ "postToolUse": [
29
+ {
30
+ "type": "command",
31
+ "bash": "./hooks/babysitter-proxied-post-tool-use.sh",
32
+ "powershell": "./hooks/babysitter-proxied-post-tool-use.ps1",
33
+ "timeoutSec": 30
34
+ }
35
+ ],
36
+ "PreCompact": [
37
+ {
38
+ "type": "command",
39
+ "bash": "./hooks/babysitter-proxied-pre-compact.sh",
40
+ "powershell": "./hooks/babysitter-proxied-pre-compact.ps1",
41
+ "timeoutSec": 30
42
+ }
43
+ ],
20
44
  "sessionEnd": [
21
45
  {
22
46
  "type": "command",
package/package.json CHANGED
@@ -1,28 +1,26 @@
1
1
  {
2
2
  "name": "@a5c-ai/babysitter-github",
3
- "version": "5.0.1-staging.e4c68b9b",
3
+ "version": "5.0.1-staging.e920fef118ef",
4
4
  "description": "Orchestrate complex, multi-step workflows with event-sourced state management, hook-based extensibility, and human-in-the-loop approval",
5
5
  "scripts": {
6
6
  "deploy": "npm publish --access public",
7
7
  "deploy:staging": "npm publish --access public --tag staging",
8
- "postinstall": "node bin/install.js",
9
- "preuninstall": "node bin/uninstall.js",
10
- "team:install": "node scripts/team-install.js",
11
- "test": "node scripts/sync-command-surfaces.js --check",
12
- "sync:commands": "node scripts/sync-command-surfaces.js"
8
+ "plugin:install": "node bin/install.js --global",
9
+ "plugin:uninstall": "node bin/uninstall.js --global",
10
+ "team:install": "node scripts/team-install.js"
13
11
  },
14
12
  "bin": {
15
- "babysitter-github-copilot": "bin/cli.js"
13
+ "babysitter-github": "bin/cli.js"
16
14
  },
17
15
  "files": [
18
16
  "bin/",
19
17
  "hooks.json",
18
+ "AGENTS.md",
20
19
  "hooks/",
21
20
  "skills/",
22
21
  "commands/",
23
22
  "scripts/",
24
23
  "plugin.json",
25
- "AGENTS.md",
26
24
  "README.md",
27
25
  "versions.json",
28
26
  "package.json"
@@ -38,11 +36,14 @@
38
36
  "access": "public"
39
37
  },
40
38
  "dependencies": {
41
- "@a5c-ai/babysitter-sdk": "5.0.1-staging.e4c68b9b"
39
+ "@a5c-ai/babysitter-sdk": "5.0.1-staging.e920fef118ef"
42
40
  },
43
41
  "repository": {
44
42
  "type": "git",
45
- "url": "https://github.com/a5c-ai/babysitter"
43
+ "url": "git+https://github.com/a5c-ai/babysitter-github-copilot.git"
46
44
  },
47
- "homepage": "https://github.com/a5c-ai/babysitter/tree/main/plugins/babysitter-github#readme"
45
+ "homepage": "https://github.com/a5c-ai/babysitter-github-copilot#readme",
46
+ "bugs": {
47
+ "url": "https://github.com/a5c-ai/babysitter-github-copilot/issues"
48
+ }
48
49
  }
package/plugin.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "babysitter",
3
- "version": "5.0.1-staging.e4c68b9b",
3
+ "version": "5.0.1-staging.e920fef118ef",
4
4
  "description": "Orchestrate complex, multi-step workflows with event-sourced state management, hook-based extensibility, and human-in-the-loop approval",
5
5
  "author": {
6
6
  "name": "a5c.ai"
@@ -0,0 +1,18 @@
1
+ #!/usr/bin/env node
2
+ import { spawnSync } from 'node:child_process';
3
+ import { existsSync, readFileSync } from 'node:fs';
4
+
5
+ function run(command, args) {
6
+ const result = spawnSync(command, args, { encoding: 'utf8', stdio: 'inherit' });
7
+ if (result.status !== 0) process.exit(result.status || 1);
8
+ }
9
+
10
+ const branch = process.env.GITHUB_REF_NAME || 'develop';
11
+ const sha = (process.env.GITHUB_SHA || '').slice(0, 12);
12
+ const version = existsSync('package.json') ? JSON.parse(readFileSync('package.json', 'utf8')).version : JSON.parse(readFileSync('versions.json', 'utf8')).sdkVersion;
13
+ const normalized = String(version).replace(/[^0-9A-Za-z._-]/g, '-');
14
+ const tag = 'release/' + branch + '/v' + normalized + '-' + sha;
15
+ run('git', ['config', 'user.name', 'github-actions[bot]']);
16
+ run('git', ['config', 'user.email', 'github-actions[bot]@users.noreply.github.com']);
17
+ run('git', ['tag', tag]);
18
+ run('git', ['push', 'origin', tag]);
@@ -0,0 +1,41 @@
1
+ #!/usr/bin/env node
2
+ import { spawnSync } from 'node:child_process';
3
+ import { readFileSync } from 'node:fs';
4
+
5
+ function run(command, args, options = {}) {
6
+ const result = spawnSync(command, args, { stdio: options.stdio || 'inherit', encoding: options.encoding });
7
+ if (result.status !== 0 && !options.allowFailure) process.exit(result.status || 1);
8
+ return result;
9
+ }
10
+
11
+ function npmView(packageSpec) {
12
+ return run('npm', ['view', packageSpec, 'version'], { allowFailure: true, stdio: 'pipe', encoding: 'utf8' }).status === 0;
13
+ }
14
+
15
+ const pkg = JSON.parse(readFileSync('package.json', 'utf8'));
16
+ const ref = process.env.GITHUB_REF_NAME || '';
17
+ const branch = ref.split('/')[1] || 'develop';
18
+ const tag = branch === 'main' ? 'latest' : branch;
19
+
20
+ if (!process.env.NODE_AUTH_TOKEN) {
21
+ console.log('NODE_AUTH_TOKEN is not configured; skipping npm publish.');
22
+ process.exit(0);
23
+ }
24
+
25
+ if (npmView(pkg.name + '@' + pkg.version)) {
26
+ console.log(pkg.name + '@' + pkg.version + ' already exists; ensuring dist-tag ' + tag + '.');
27
+ run('npm', ['dist-tag', 'add', pkg.name + '@' + pkg.version, tag], { allowFailure: true });
28
+ process.exit(0);
29
+ }
30
+
31
+ for (const field of ['dependencies', 'peerDependencies', 'optionalDependencies']) {
32
+ for (const [name, version] of Object.entries(pkg[field] || {})) {
33
+ if (!name.startsWith('@a5c-ai/') || version.startsWith('^') || version.startsWith('~') || version === '*' || version.startsWith('workspace:')) continue;
34
+ if (!npmView(name + '@' + version)) {
35
+ console.log('Required internal dependency ' + name + '@' + version + ' is not published yet; skipping npm publish.');
36
+ process.exit(0);
37
+ }
38
+ }
39
+ }
40
+
41
+ run('npm', ['publish', '--access', 'public', '--tag', tag]);
@@ -1,14 +1,12 @@
1
1
  ---
2
2
  name: babysit
3
3
  description: >-
4
- Orchestrate via @babysitter. Use this skill when asked to babysit a run,
5
- orchestrate a process or whenever it is called explicitly. (babysit,
6
- babysitter, orchestrate, orchestrate a run, workflow, etc.)
4
+ Execute via @babysitter. Use this skill when asked to babysit a task, do anything that is structured process-driven (even a loop) or whenever it is called explicitly. (babysit, babysitter, with a process, orchestrate, orchestrate a run, workflow, loop until, etc.)
7
5
  ---
8
6
 
9
7
  # babysit
10
8
 
11
- Orchestrate `.a5c/runs/<runId>/` through iterative execution.
9
+ Follow the commands below exactly, but apply judgement and creativity to get the job done. No matter how small or simple the task may seem, you must use the babysitter SDK and run lifecycle to execute it. This is non-negotiable. If you are asked to do something that seems like it could be done with a simple tool call, you must still use the babysitter SDK to create a run, define tasks, execute them, and complete the run. This is how you will learn and demonstrate mastery of the babysitter system. Always follow the full process, even for trivial tasks.
12
10
 
13
11
  ## Dependencies
14
12
 
@@ -5,4 +5,8 @@ description: Orchestrate a babysitter run. use this command to start babysitting
5
5
 
6
6
  # call
7
7
 
8
- Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md).
8
+ Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md). Then continue executing the returned instructions in this same turn. Do not stop after the Skill tool returns; carry the requested run through to completion proof.
9
+
10
+ User arguments for this command:
11
+
12
+ $ARGUMENTS
@@ -11,11 +11,33 @@ Create and run a cleanup process using the process at `skills\babysit\process\cr
11
11
 
12
12
  Implementation notes (for the process):
13
13
  - Parse arguments for `--dry-run` flag (if present, set dryRun: true in inputs) and `--keep-days N` (default: 7)
14
- - The process scans .a5c/runs/ for completed/failed runs, aggregates insights, writes summaries, then removes old data
15
- - Always show the user what will be removed before removing (in interactive mode via breakpoints)
16
- - In non-interactive mode (yolo), proceed with cleanup using defaults
17
- - The insights file goes to docs/run-history-insights.md
18
- - Only remove terminal runs (completed/failed) older than the keep-days threshold
19
- - Never remove active/in-progress runs
20
- - Remove orphaned process files not referenced by remaining runs
21
- - After cleanup, show remaining run count and disk usage
14
+
15
+ CRITICAL: The cleanup MUST follow this exact phase order. Do NOT delete any run before Phase 2 completes.
16
+
17
+ Phase 1 — Scan:
18
+ - Scan .a5c/runs/ for all runs
19
+ - Classify each as terminal (completed/failed) or active (in-progress/created)
20
+ - Identify terminal runs older than the keep-days threshold as removal candidates
21
+ - Never mark active/in-progress runs for removal
22
+ - Count and report: total runs, terminal, active, removal candidates, disk usage
23
+
24
+ Phase 2 — Aggregate insights (BEFORE any deletion):
25
+ - For EVERY removal candidate, read its run.json and journal/ events
26
+ - Extract: processId, prompt, status, event count, created date, task summaries
27
+ - Group by process type and extract patterns (retry counts, convergence behavior, failure modes)
28
+ - Append a new dated section to docs/run-history-insights.md with:
29
+ - Summary statistics (runs removed, disk freed, runs retained)
30
+ - Run categories with counts and descriptions
31
+ - Key patterns observed (multi-batch convergence, retry behavior, etc.)
32
+ - What worked well / what didn't from the run data
33
+ - This file MUST be written and verified before proceeding to Phase 3
34
+
35
+ Phase 3 — Confirm removal:
36
+ - In interactive mode, show the user what will be removed via a breakpoint
37
+ - In non-interactive mode (yolo), proceed with defaults
38
+ - In dry-run mode, stop here and show what would be removed
39
+
40
+ Phase 4 — Remove:
41
+ - Delete the terminal runs older than keep-days threshold
42
+ - Identify and remove orphaned process files not referenced by remaining runs
43
+ - Show remaining run count and disk usage after cleanup
@@ -157,7 +157,6 @@ If it exists:
157
157
  **Goal:** Inspect babysitter session files for health and detect runaway loops.
158
158
 
159
159
  - Search for session state files using Glob:
160
- - `plugins/babysitter/skills/babysit/state/*.md`
161
160
  - `.a5c/state/*.md`
162
161
  - `.a5c/state/*.json`
163
162
  - For each session state file found:
@@ -261,7 +260,7 @@ Mark as PASS if total size < 500MB and no files > 10MB. Mark as WARN if total si
261
260
 
262
261
  ### 10a. Hook Registration
263
262
 
264
- - Locate the plugin root. Check for `CLAUDE_PLUGIN_ROOT` env var, or search for `plugins/babysitter/hooks/hooks.json` by walking up from the current directory.
263
+ - Locate the plugin root. Check the `CLAUDE_PLUGIN_ROOT` env var first; if it is not set, search for a babysitter `hooks.json` by walking up from the current directory.
265
264
  - If found, read `hooks.json` and verify:
266
265
  - A `Stop` hook entry exists with a command referencing `babysitter-stop-hook.sh`.
267
266
  - A `SessionStart` hook entry exists with a command referencing `babysitter-session-start-hook.sh`.
@@ -316,7 +315,7 @@ If the stop hook shows NO evidence of execution (no log entries, no journal even
316
315
 
317
316
  Perform these diagnostic steps in order and report the first failure found:
318
317
 
319
- 1. **Plugin not installed**: Check if `plugins/babysitter/` exists relative to the project root and if `CLAUDE_PLUGIN_ROOT` is set. If the plugin directory doesn't exist, report: "Plugin not installed — the babysitter plugin directory is missing."
318
+ 1. **Plugin not installed**: Check if `CLAUDE_PLUGIN_ROOT` is set or if a babysitter plugin directory exists relative to the project root. If neither is the case, report: "Plugin not installed — the babysitter plugin directory is missing."
320
319
 
321
320
  2. **Plugin not enabled**: Check for Claude settings files:
322
321
  - `~/.claude/settings.json` — look for `babysitter` in `enabledPlugins`.
@@ -234,7 +234,8 @@ SECONDARY COMMANDS
234
234
  How it works: Runs npx @a5c-ai/babysitter-observer-dashboard@latest which watches
235
235
  the .a5c/runs/ directory (or a parent directory containing multiple projects) and
236
236
  serves a live dashboard. The process is blocking -- it runs until you stop it, and
237
- it prints the local URL to share with the user.
237
+ it prints the local URL to share with the user. Do not use `babysitter observe`
238
+ as a fallback; the core Babysitter CLI does not expose that subcommand.
238
239
 
239
240
  Example: /babysitter:observe
240
241
  (opens browser showing all runs with live-updating task
@@ -8,6 +8,11 @@ description: Launch the babysitter observer dashboard. Installs and runs the rea
8
8
  Run the babysitter observer dashboard:
9
9
 
10
10
  1. Determine the watch directory — this is usually the project's container directory (the parent of the project dir), or the current working directory if not specified.
11
- 2. Launch the dashboard: `npx -y @a5c-ai/babysitter-observer-dashboard@latest --watch-dir <dir>`
11
+ 2. Launch the standalone dashboard package: `npx -y @a5c-ai/babysitter-observer-dashboard@latest --watch-dir <dir>`.
12
12
  3. This is a blocking process — it will keep running until stopped.
13
13
  4. Report the URL printed by the dashboard to the user, then open it in the browser.
14
+
15
+ Do not fall back to `babysitter observe`; the core Babysitter CLI does not expose
16
+ that subcommand. Some harness runtimes may provide a separate
17
+ `babysitter-agent observe` surface, but this skill uses the verified standalone
18
+ dashboard package.
@@ -5,4 +5,8 @@ description: Orchestrate a babysitter run. use this command to start babysitting
5
5
 
6
6
  # yolo
7
7
 
8
- Invoke the babysitter:babysit skill (using the Skill tool) and follow its instructions (SKILL.md). but without any user interaction or breakpoints in the run.
8
+ Start the Babysitter run directly through the CLI, without any user interaction or breakpoints. Do not invoke the Skill tool and do not run an instructions-only command. In Claude Code, use Bash to run `babysitter-agent yolo --harness claude-code --workspace "$PWD" --prompt "<user arguments>" --json`; in Codex, run `babysitter-agent yolo --harness codex --workspace "$PWD" --prompt "<user arguments>" --json`; in other harnesses, use the same command with that harness id. Replace `<user arguments>` with the arguments shown below, wait for the command to finish, and treat the CLI completion proof as the result.
9
+
10
+ User arguments for this command:
11
+
12
+ $ARGUMENTS
package/versions.json CHANGED
@@ -1,3 +1,4 @@
1
1
  {
2
- "sdkVersion": "5.0.1-staging.e4c68b9b"
2
+ "sdkVersion": "5.0.1-staging.e920fef118ef",
3
+ "extensionVersion": "5.0.1-staging.e920fef118ef"
3
4
  }
@@ -1,62 +0,0 @@
1
- 'use strict';
2
-
3
- const path = require('path');
4
- const {
5
- listDirectories,
6
- listMarkdownBasenames,
7
- reportCheckResult,
8
- syncCommandMirrors,
9
- syncSkillsFromCommands,
10
- } = require('../../../scripts/plugin-command-sync-lib.cjs');
11
-
12
- const PACKAGE_ROOT = path.resolve(__dirname, '..');
13
- const REPO_ROOT = path.resolve(PACKAGE_ROOT, '..', '..');
14
- const ROOT_COMMANDS = path.join(REPO_ROOT, 'plugins', 'babysitter', 'commands');
15
- const PLUGIN_COMMANDS = path.join(PACKAGE_ROOT, 'commands');
16
- const PLUGIN_SKILLS = path.join(PACKAGE_ROOT, 'skills');
17
- const LABEL = 'babysitter-github sync';
18
-
19
- function getMirroredCommandNames() {
20
- const local = new Set(listMarkdownBasenames(PLUGIN_COMMANDS));
21
- return listMarkdownBasenames(ROOT_COMMANDS).filter((name) => local.has(name));
22
- }
23
-
24
- function getDerivedSkillNames() {
25
- const local = new Set(listDirectories(PLUGIN_SKILLS));
26
- return listMarkdownBasenames(PLUGIN_COMMANDS).filter((name) => local.has(name));
27
- }
28
-
29
- function main() {
30
- const check = process.argv.includes('--check');
31
- const mirrorResult = syncCommandMirrors({
32
- label: LABEL,
33
- sourceRoot: ROOT_COMMANDS,
34
- targetRoot: PLUGIN_COMMANDS,
35
- names: getMirroredCommandNames(),
36
- check,
37
- cwd: PACKAGE_ROOT,
38
- });
39
- const skillsResult = syncSkillsFromCommands({
40
- label: LABEL,
41
- sourceRoot: PLUGIN_COMMANDS,
42
- skillsRoot: PLUGIN_SKILLS,
43
- names: getDerivedSkillNames(),
44
- check,
45
- cwd: PACKAGE_ROOT,
46
- });
47
-
48
- if (check) {
49
- reportCheckResult(LABEL, [...mirrorResult.stale, ...skillsResult.stale]);
50
- return;
51
- }
52
-
53
- const updated = mirrorResult.updated + skillsResult.updated;
54
- if (updated === 0) {
55
- console.log(`[${LABEL}] no GitHub plugin command changes were needed.`);
56
- return;
57
- }
58
-
59
- console.log(`[${LABEL}] updated ${updated} GitHub plugin file(s).`);
60
- }
61
-
62
- main();