npm - @xn-intenton-z2a/agentic-lib - Versions diffs - 7.2.5 → 7.2.7 - Mend

@xn-intenton-z2a/agentic-lib 7.2.5 → 7.2.7

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (34)

package/.github/workflows/agentic-lib-init.yml +56 -0
package/.github/workflows/agentic-lib-test.yml +7 -2
package/.github/workflows/agentic-lib-workflow.yml +50 -3
package/README.md +88 -17
package/agentic-lib.toml +7 -0
package/bin/agentic-lib.js +260 -496
package/package.json +2 -1
package/src/actions/agentic-step/config-loader.js +9 -0
package/src/actions/agentic-step/index.js +104 -7
package/src/actions/agentic-step/tasks/direct.js +435 -0
package/src/actions/agentic-step/tasks/supervise.js +107 -180
package/src/agents/agent-apply-fix.md +5 -2
package/src/agents/agent-director.md +58 -0
package/src/agents/agent-discovery.md +52 -0
package/src/agents/agent-issue-resolution.md +18 -0
package/src/agents/agent-iterate.md +45 -0
package/src/agents/agent-supervisor.md +22 -50
package/src/copilot/agents.js +39 -0
package/src/copilot/config.js +308 -0
package/src/copilot/context.js +318 -0
package/src/copilot/hybrid-session.js +330 -0
package/src/copilot/logger.js +43 -0
package/src/copilot/sdk.js +36 -0
package/src/copilot/session.js +372 -0
package/src/copilot/tasks/fix-code.js +73 -0
package/src/copilot/tasks/maintain-features.js +61 -0
package/src/copilot/tasks/maintain-library.js +66 -0
package/src/copilot/tasks/transform.js +120 -0
package/src/copilot/tools.js +141 -0
package/src/mcp/server.js +43 -25
package/src/seeds/zero-README.md +31 -0
package/src/seeds/zero-behaviour.test.js +12 -4
package/src/seeds/zero-package.json +1 -1
package/src/seeds/zero-playwright.config.js +1 -0

package/.github/workflows/agentic-lib-init.yml CHANGED Viewed

@@ -333,3 +333,59 @@ jobs:
               exit 1
             fi
           done
+      # W8: Create initial seed issues after purge so the pipeline has work to do.
+      # Runs only outside the agentic-lib repository itself, in purge mode, and when not a dry run.
+      - name: Create initial seed issues
+        if: github.repository != 'xn-intenton-z2a/agentic-lib' && env.INIT_MODE == 'purge' && needs.params.outputs.dry-run != 'true'
+        uses: actions/github-script@v8
+        with:
+          script: |
+            const fs = require('fs');
+            // The mission text is embedded in every seed issue; use a placeholder when the file is absent.
+            const missionContent = fs.existsSync('MISSION.md')
+              ? fs.readFileSync('MISSION.md', 'utf8')
+              : '(no MISSION.md found)';
+            // Ensure labels exist
+            for (const label of ['automated', 'ready']) {
+              try {
+                await github.rest.issues.createLabel({
+                  ...context.repo, name: label,
+                  color: label === 'automated' ? '0e8a16' : '1d76db',
+                  description: label === 'automated' ? 'Created by automation' : 'Ready for dev transform',
+                });
+              } catch (e) {
+                // HTTP 422 is the expected "label already exists" response and is ignored.
+                // Any other failure is reported as a warning instead of being hidden;
+                // label creation stays best-effort and does not abort the step.
+                if (e.status !== 422) {
+                  core.warning(`Could not create label "${label}": ${e.message}`);
+                }
+              }
+            }
+            // W8a: Initial unit tests issue
+            const unitTestBody = [
+              'Create a unit test file for each of the major features in the mission ',
+              'and put a TODO in a trivial empty passing test in each.',
+              '',
+              '## MISSION.md',
+              '',
+              missionContent,
+            ].join('\n');
+            const { data: issue1 } = await github.rest.issues.create({
+              ...context.repo,
+              title: 'Initial unit tests',
+              body: unitTestBody,
+              labels: ['automated', 'ready'],
+            });
+            core.info(`Created issue #${issue1.number}: Initial unit tests`);
+            // W8b: Initial web layout issue
+            const webLayoutBody = [
+              'Create the home page layout to showcase each of the major features in the mission ',
+              'and put a TODO in a trivial empty passing test in each.',
+              '',
+              '## MISSION.md',
+              '',
+              missionContent,
+            ].join('\n');
+            const { data: issue2 } = await github.rest.issues.create({
+              ...context.repo,
+              title: 'Initial web layout',
+              body: webLayoutBody,
+              labels: ['automated', 'ready'],
+            });
+            core.info(`Created issue #${issue2.number}: Initial web layout`);

package/.github/workflows/agentic-lib-test.yml CHANGED Viewed

@@ -90,8 +90,13 @@ jobs:
       - name: Install dependencies
         run: npm ci
-      - name: Run behaviour tests
-        run: npm run test:behaviour
+      - name: Run behaviour tests (with retry)  # one retry after a 2 s pause; a second failure fails the step
+        run: |
+          npm run test:behaviour || {
+            echo "::warning::Behaviour test attempt 1 failed — retrying"
+            sleep 2
+            npm run test:behaviour
+          }
         #env:
         #  HOME: /root

package/.github/workflows/agentic-lib-workflow.yml CHANGED Viewed

@@ -621,14 +621,55 @@ jobs:
           commit-message: "agentic-step: maintain features and library"
           push-ref: ${{ github.ref_name }}
-  # ─── Supervisor: LLM decides what to do (after maintain has features) ──
-  supervisor:
-    needs: [params, pr-cleanup, telemetry, maintain]
+  # ─── Director: LLM evaluates mission status (complete/failed/in-progress) ──
+  director:
+    needs: [params, telemetry, maintain]
     if: |
       !cancelled() &&
       (needs.params.outputs.mode == 'full' || needs.params.outputs.mode == 'dev-only') &&
       needs.params.result == 'success'
     runs-on: ubuntu-latest
+    outputs:  # read by the supervisor job's `if:`, which skips supervision on mission-complete / mission-failed
+      decision: ${{ steps.director.outputs.director-decision }}
+      analysis: ${{ steps.director.outputs.director-analysis }}
+    steps:
+      - uses: actions/checkout@v6
+      - uses: actions/setup-node@v6
+        with:
+          node-version: "24"
+      - name: Self-init (agentic-lib dev only)
+        if: hashFiles('scripts/self-init.sh') != '' && hashFiles('.github/agentic-lib/actions/agentic-step/package.json') == ''  # script present and action package.json not yet in place
+        run: bash scripts/self-init.sh
+      - name: Install agentic-step dependencies
+        working-directory: .github/agentic-lib/actions/agentic-step
+        run: npm ci
+      - name: Run director
+        id: director
+        if: github.repository != 'xn-intenton-z2a/agentic-lib'  # skipped in the library's own repository, leaving both job outputs empty
+        uses: ./.github/agentic-lib/actions/agentic-step
+        env:
+          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+          COPILOT_GITHUB_TOKEN: ${{ secrets.COPILOT_GITHUB_TOKEN }}
+        with:
+          task: "direct"  # the agentic-step task that evaluates mission status
+          config: ${{ needs.params.outputs.config-path }}
+          instructions: ".github/agentic-lib/agents/agent-director.md"
+          model: ${{ needs.params.outputs.model }}
+  # ─── Supervisor: LLM decides what to do (after director evaluates) ──
+  supervisor:
+    needs: [params, pr-cleanup, telemetry, maintain, director]
+    if: |
+      !cancelled() &&
+      (needs.params.outputs.mode == 'full' || needs.params.outputs.mode == 'dev-only') &&
+      needs.params.result == 'success' &&
+      needs.director.outputs.decision != 'mission-complete' &&
+      needs.director.outputs.decision != 'mission-failed'
+    runs-on: ubuntu-latest
     steps:
       - uses: actions/checkout@v6
@@ -1175,6 +1216,12 @@ jobs:
           set +e
           npm run --if-present test:behaviour 2>&1 | tail -30
+          # After a pipeline, $? is the status of `tail` (normally 0), not of npm, unless
+          # pipefail is enabled. PIPESTATUS[0] is npm's own exit status, so a failing test
+          # run is detected and the retry below can trigger. Assumes the step runs under
+          # bash (the default shell on GitHub-hosted Linux runners) - confirm against the
+          # step's `shell:` setting.
-          EXIT_CODE=$?
+          EXIT_CODE=${PIPESTATUS[0]}
+          if [ $EXIT_CODE -ne 0 ]; then
+            echo "::warning::Behaviour test attempt 1 failed — retrying"
+            sleep 2
+            npm run --if-present test:behaviour 2>&1 | tail -30
+            EXIT_CODE=${PIPESTATUS[0]}
+          fi
           set -e
           if [ $EXIT_CODE -ne 0 ]; then
             echo "tests-passed=false" >> $GITHUB_OUTPUT

package/README.md CHANGED Viewed

@@ -73,7 +73,7 @@ your-repo/
 │   │
 │   └── agentic-lib/                          # [INIT] Internal infrastructure (always overwritten)
 │       ├── actions/
-│       │   ├── agentic-step/                 #   The Copilot SDK action (9 task handlers)
+│       │   ├── agentic-step/                 #   The Copilot SDK action (10 task handlers)
 │       │   ├── commit-if-changed/            #   Composite: conditional git commit
 │       │   └── setup-npmrc/                  #   Composite: npm registry auth
 │       ├── agents/                           #   8 prompt files + config YAML
@@ -212,6 +212,7 @@ The core of the system is a single GitHub Action that handles all autonomous tas
 | Task | Purpose |
 |------|---------|
 | `supervise` | Gather repo context, choose and dispatch actions strategically |
+| `direct` | Evaluate mission status: complete, failed, or gap analysis |
 | `transform` | Transform the codebase toward the mission |
 | `resolve-issue` | Read an issue and generate code to resolve it |
 | `fix-code` | Fix failing tests or lint errors |
@@ -242,9 +243,8 @@ All task commands accept these flags:
 | `--dry-run` | off | Show the prompt without calling the Copilot SDK |
 | `--target <path>` | current directory | Target repository to transform |
 | `--model <name>` | `claude-sonnet-4` | Copilot SDK model |
-| `--cycles <N>` | from budget | Max iteration cycles (iterate only) |
-| `--steps <list>` | all three | Comma-separated steps per cycle (iterate only) |
 | `--mission <name>` | hamming-distance | Init with --purge before iterating (iterate only) |
+| `--timeout <ms>` | 600000 | Session timeout in milliseconds (iterate only) |
 ### Example: Full Walkthrough
@@ -299,25 +299,96 @@ npx @xn-intenton-z2a/agentic-lib transform --dry-run
 ### Iterator
-The `iterate` command runs multiple cycles of maintain → transform → fix with automatic stop conditions and budget tracking:
+The `iterate` command runs a single persistent Copilot SDK session that autonomously implements your mission — reading code, writing implementations and tests, running tests, and iterating until everything passes.
 ```bash
-# Init a mission and iterate with default budget
-npx @xn-intenton-z2a/agentic-lib iterate --mission fizz-buzz --model gpt-5-mini
+# Init a mission and iterate
+npx @xn-intenton-z2a/agentic-lib iterate --mission hamming-distance --model gpt-5-mini
-# Run 4 cycles on an existing workspace
-npx @xn-intenton-z2a/agentic-lib iterate --cycles 4
+# Iterate on an existing workspace
+npx @xn-intenton-z2a/agentic-lib iterate --target /path/to/workspace
-# Transform-only cycles (skip maintain)
-npx @xn-intenton-z2a/agentic-lib iterate --steps transform,fix-code --cycles 3
+# With an explicit 10-minute timeout (600000 ms, the default)
+npx @xn-intenton-z2a/agentic-lib iterate --mission fizz-buzz --timeout 600000
 ```
-**Stop conditions:**
-- Tests pass for 2 consecutive cycles
-- No files change for 2 consecutive cycles
-- Transformation budget exhausted (configurable via `transformation-budget` in `agentic-lib.toml`)
+The session uses SDK hooks for observability (tool call tracking, error recovery) and infinite sessions for context management. The agent drives its own read-write-test loop until the mission is complete or the timeout is reached.
-Each cycle logs `**agentic-lib transformation cost:** 1` to `intentïon.md` when source files change. The iterator reads these to track cumulative cost against the budget.
+**Available missions:** hamming-distance, fizz-buzz, roman-numerals, string-utils, cron-engine, dense-encoding, markdown-compiler, and more (see `src/seeds/missions/`).
+### Running Local Benchmarks
+You can benchmark mission completion locally without GitHub Actions. This is useful for comparing models, tuning profiles, and measuring iteration speed.
+**Prerequisites:**
+1. A `COPILOT_GITHUB_TOKEN` (fine-grained PAT with Copilot read permission)
+2. Node.js 24+
+**Setup:**
+```bash
+# Set your token
+export COPILOT_GITHUB_TOKEN=github_pat_...
+# Or source from .env
+source .env
+```
+**Run a benchmark:**
+```bash
+# Quick: hamming-distance with gpt-5-mini (simplest mission, ~1-2 min)
+npx @xn-intenton-z2a/agentic-lib iterate \
+  --mission hamming-distance --model gpt-5-mini --timeout 300000
+# Medium: roman-numerals with claude-sonnet-4
+npx @xn-intenton-z2a/agentic-lib iterate \
+  --mission roman-numerals --model claude-sonnet-4
+# Complex: string-utils with gpt-4.1 (10 functions, longer timeout)
+npx @xn-intenton-z2a/agentic-lib iterate \
+  --mission string-utils --model gpt-4.1 --timeout 600000
+```
+**From a local clone** (development):
+```bash
+# From the agentic-lib directory
+npx . iterate --mission hamming-distance --model gpt-5-mini --target /tmp/bench
+# Or link globally
+npm link
+agentic-lib iterate --mission hamming-distance --model gpt-5-mini --target /tmp/bench
+```
+**Output:**
+```
+=== agentic-lib iterate ===
+Target:  /tmp/bench
+Model:   gpt-5-mini
+[hybrid] Creating session (model=gpt-5-mini, workspace=/tmp/bench)
+[hybrid] Session: sess_abc123
+  [tool] read_file
+  [tool] read_file
+  [tool] write_file
+  [tool] run_tests
+  [tool] write_file
+  [tool] run_tests
+=== Results ===
+Success:       true
+Tests passed:  true
+Session time:  47s
+Total time:    52s
+Tool calls:    6
+Test runs:     2
+Files written: 2
+Tokens:        12400 (in=9200 out=3200)
+End reason:    complete
+```
 ### Environment
@@ -367,14 +438,14 @@ This repository is the source for the `@xn-intenton-z2a/agentic-lib` npm package
 src/
 ├── workflows/     8 GitHub Actions workflow templates
 ├── actions/       3 composite/SDK actions (agentic-step, commit-if-changed, setup-npmrc)
-├── agents/        8 agent prompt files + 1 config
+├── agents/        9 agent prompt files + 1 config
 ├── seeds/         7 seed files (test.yml + 6 project seed files for --purge reset)
 └── scripts/       7 utility scripts distributed to consumers
 ```
 ### Testing
-393 unit tests across 26 test files, plus system tests:
+431 unit tests across 27 test files, plus system tests:
 ```bash
 npm test                  # Run all tests (vitest)

package/agentic-lib.toml CHANGED Viewed

@@ -130,5 +130,12 @@ max-attempts-per-issue = 4                 # max transform attempts before aband
 features-limit = 8                     # max feature files in features/ directory
 library-limit = 64                     # max library entries in library/ directory
+[mission-complete]
+# Thresholds for deterministic mission-complete declaration.
+# All conditions must be met simultaneously.
+min-resolved-issues = 3            # minimum closed-as-RESOLVED issues since init
+require-dedicated-tests = true     # require test files that import from src/lib/
+max-source-todos = 0               # max TODO comments allowed in ./src (0 = none)
 [bot]
 log-file = "test/intentïon.md"                  #@dist "intentïon.md"