@windyroad/architect 0.18.0 → 0.18.1-preview.804

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -123,5 +123,5 @@
123
123
  }
124
124
  },
125
125
  "name": "wr-architect",
126
- "version": "0.18.0"
126
+ "version": "0.18.1"
127
127
  }
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "wr-architect",
3
- "version": "0.18.0",
3
+ "version": "0.18.1",
4
4
  "description": "Architecture decision enforcement for AI coding agents",
5
5
  "author": {
6
6
  "name": "Windy Road Technology",
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@windyroad/architect",
3
- "version": "0.18.0",
3
+ "version": "0.18.1-preview.804",
4
4
  "description": "Architecture decision enforcement for AI coding agents",
5
5
  "bin": {
6
6
  "windyroad-architect": "./bin/install.mjs"
@@ -27,6 +27,7 @@
27
27
  ".claude-plugin/",
28
28
  ".codex-plugin/",
29
29
  "lib/",
30
- "!skills/*/eval/"
30
+ "!skills/*/eval/",
31
+ "!agents/eval/"
31
32
  ]
32
33
  }
@@ -1,22 +0,0 @@
1
- {
2
- "type": "object",
3
- "additionalProperties": false,
4
- "required": [
5
- "pass",
6
- "score",
7
- "reason"
8
- ],
9
- "properties": {
10
- "pass": {
11
- "type": "boolean"
12
- },
13
- "score": {
14
- "type": "number",
15
- "minimum": 0,
16
- "maximum": 1
17
- },
18
- "reason": {
19
- "type": "string"
20
- }
21
- }
22
- }
@@ -1,39 +0,0 @@
1
- #!/usr/bin/env bash
2
- set -euo pipefail
3
-
4
- SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
5
- REPO_ROOT="$(cd "${SCRIPT_DIR}/../../../.." && pwd)"
6
- SCHEMA="${SCRIPT_DIR}/codex-rubric-output.schema.json"
7
- PROMPT="${*:-}"
8
-
9
- if [[ -z "$PROMPT" ]]; then
10
- echo "grade-codex-rubric.sh: rubric prompt argument is required" >&2
11
- exit 2
12
- fi
13
-
14
- raw="$(
15
- codex exec \
16
- --ephemeral \
17
- --cd "$REPO_ROOT" \
18
- -c 'approval_policy="never"' \
19
- --sandbox read-only \
20
- --output-schema "$SCHEMA" \
21
- "You are a strict grading assistant. Respond only with JSON matching the provided schema. Grade this promptfoo rubric literally.
22
-
23
- ${PROMPT}"
24
- )"
25
-
26
- printf '%s' "$raw" | awk '
27
- BEGIN { depth = 0; started = 0 }
28
- {
29
- line = $0
30
- for (i = 1; i <= length(line); i++) {
31
- c = substr(line, i, 1)
32
- if (c == "{") { depth++; started = 1 }
33
- if (started) { buf = buf c }
34
- if (c == "}") { depth--; if (depth == 0 && started) { print buf; exit } }
35
- }
36
- if (started) { buf = buf "\n" }
37
- }
38
- END { if (started && depth != 0) print buf }
39
- ' || printf '%s' "$raw"
@@ -1,56 +0,0 @@
1
- description: |
2
- Codex wr-architect agent verdict eval. Exercises the generated
3
- .codex/agents/wr-architect.toml path and the Codex plugin install surface.
4
-
5
- providers:
6
- - id: 'exec:bash ./run-codex-agent-eval.sh'
7
-
8
- defaultTest:
9
- options:
10
- provider:
11
- id: 'exec:bash ./grade-codex-rubric.sh'
12
-
13
- prompts:
14
- - '{{prompt}}'
15
-
16
- tests:
17
- - description: PASS for aligned pre-edit proposal
18
- vars:
19
- prompt: |
20
- PRE-EDIT review: proposed change updates comments only. No
21
- architecture-bearing files, dependencies, hooks, workflows, or ADRs
22
- change. Return the architect verdict.
23
- assert:
24
- - type: regex
25
- value: 'Architecture Review:\s*PASS|PASS'
26
-
27
- - description: ISSUES FOUND for undocumented dependency
28
- vars:
29
- prompt: |
30
- PRE-EDIT review: proposed change adds a new npm dependency named
31
- fast-queue to package.json for core task scheduling. No existing ADR
32
- covers this dependency choice. Return the architect verdict.
33
- assert:
34
- - type: regex
35
- value: 'ISSUES FOUND|Undocumented Decision|new decision'
36
-
37
- - description: NEEDS DIRECTION when viable options are unpinned
38
- vars:
39
- prompt: |
40
- PRE-EDIT review: proposed change must choose whether plugin
41
- distribution uses a remote marketplace only or also a repo-local
42
- marketplace, and the prompt does not pin a direction. Return the
43
- architect verdict.
44
- assert:
45
- - type: regex
46
- value: 'NEEDS DIRECTION'
47
-
48
- - description: Unratified Dependency flags unconfirmed ADR dependency
49
- vars:
50
- prompt: |
51
- PRE-EDIT review: proposed change explicitly implements ADR-074, but
52
- the ADR frontmatter lacks human-oversight: confirmed. Return the
53
- architect verdict and action.
54
- assert:
55
- - type: regex
56
- value: 'Unratified Dependency|ratify|review-decisions'
@@ -1,47 +0,0 @@
1
- #!/usr/bin/env bash
2
- # Codex promptfoo exec-provider driver for the generated wr-architect agent.
3
- set -euo pipefail
4
-
5
- SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
6
- REPO_ROOT="$(cd "${SCRIPT_DIR}/../../../.." && pwd)"
7
- MARKETPLACE_DIR="$REPO_ROOT"
8
- PROMPT="${*:-}"
9
-
10
- if [[ -z "$PROMPT" ]]; then
11
- echo "run-codex-agent-eval.sh: prompt argument is required" >&2
12
- exit 2
13
- fi
14
-
15
- SOURCE_CODEX_HOME="${CODEX_HOME:-${HOME}/.codex}"
16
- TMP_CODEX_HOME=""
17
-
18
- if [[ -n "${WR_CODEX_EVAL_CODEX_HOME:-}" ]]; then
19
- export CODEX_HOME="$WR_CODEX_EVAL_CODEX_HOME"
20
- mkdir -p "$CODEX_HOME"
21
- else
22
- TMP_CODEX_HOME="$(mktemp -d)"
23
- chmod 700 "$TMP_CODEX_HOME"
24
- export CODEX_HOME="$TMP_CODEX_HOME"
25
- if [[ -f "${SOURCE_CODEX_HOME}/auth.json" ]]; then
26
- cp "${SOURCE_CODEX_HOME}/auth.json" "$CODEX_HOME/auth.json"
27
- chmod 600 "$CODEX_HOME/auth.json"
28
- fi
29
- if [[ "${WR_CODEX_EVAL_COPY_CONFIG:-0}" == "1" && -f "${SOURCE_CODEX_HOME}/config.toml" ]]; then
30
- cp "${SOURCE_CODEX_HOME}/config.toml" "$CODEX_HOME/config.toml"
31
- chmod 600 "$CODEX_HOME/config.toml"
32
- fi
33
- trap 'rm -rf "$TMP_CODEX_HOME"' EXIT
34
- fi
35
-
36
- codex plugin marketplace add "$MARKETPLACE_DIR" >/dev/null
37
- codex plugin add wr-architect@windyroad-local >/dev/null
38
-
39
- exec codex exec \
40
- --ephemeral \
41
- --cd "$REPO_ROOT" \
42
- -c 'approval_policy="never"' \
43
- --sandbox read-only \
44
- --dangerously-bypass-hook-trust \
45
- "Spawn the custom collaborator agent named wr-architect:agent (auto-discovered by Codex from the installed wr-architect plugin's agents/agent.md). If this non-interactive harness cannot spawn the custom agent directly, read .codex/agents/wr-architect.toml and perform the same review inline.
46
-
47
- ${PROMPT}"