@windyroad/architect 0.18.0-preview.802 → 0.18.1-preview.804
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.claude-plugin/plugin.json +1 -1
- package/.codex-plugin/plugin.json +1 -1
- package/package.json +3 -2
- package/agents/eval/codex-rubric-output.schema.json +0 -22
- package/agents/eval/grade-codex-rubric.sh +0 -39
- package/agents/eval/promptfooconfig.codex.yaml +0 -56
- package/agents/eval/run-codex-agent-eval.sh +0 -47
package/package.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
|
1
1
|
{
|
|
2
2
|
"name": "@windyroad/architect",
|
|
3
|
-
"version": "0.18.
|
|
3
|
+
"version": "0.18.1-preview.804",
|
|
4
4
|
"description": "Architecture decision enforcement for AI coding agents",
|
|
5
5
|
"bin": {
|
|
6
6
|
"windyroad-architect": "./bin/install.mjs"
|
|
@@ -27,6 +27,7 @@
|
|
|
27
27
|
".claude-plugin/",
|
|
28
28
|
".codex-plugin/",
|
|
29
29
|
"lib/",
|
|
30
|
-
"!skills/*/eval/"
|
|
30
|
+
"!skills/*/eval/",
|
|
31
|
+
"!agents/eval/"
|
|
31
32
|
]
|
|
32
33
|
}
|
|
@@ -1,22 +0,0 @@
|
|
|
1
|
-
{
|
|
2
|
-
"type": "object",
|
|
3
|
-
"additionalProperties": false,
|
|
4
|
-
"required": [
|
|
5
|
-
"pass",
|
|
6
|
-
"score",
|
|
7
|
-
"reason"
|
|
8
|
-
],
|
|
9
|
-
"properties": {
|
|
10
|
-
"pass": {
|
|
11
|
-
"type": "boolean"
|
|
12
|
-
},
|
|
13
|
-
"score": {
|
|
14
|
-
"type": "number",
|
|
15
|
-
"minimum": 0,
|
|
16
|
-
"maximum": 1
|
|
17
|
-
},
|
|
18
|
-
"reason": {
|
|
19
|
-
"type": "string"
|
|
20
|
-
}
|
|
21
|
-
}
|
|
22
|
-
}
|
|
@@ -1,39 +0,0 @@
|
|
|
1
|
-
#!/usr/bin/env bash
|
|
2
|
-
set -euo pipefail
|
|
3
|
-
|
|
4
|
-
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
|
|
5
|
-
REPO_ROOT="$(cd "${SCRIPT_DIR}/../../../.." && pwd)"
|
|
6
|
-
SCHEMA="${SCRIPT_DIR}/codex-rubric-output.schema.json"
|
|
7
|
-
PROMPT="${*:-}"
|
|
8
|
-
|
|
9
|
-
if [[ -z "$PROMPT" ]]; then
|
|
10
|
-
echo "grade-codex-rubric.sh: rubric prompt argument is required" >&2
|
|
11
|
-
exit 2
|
|
12
|
-
fi
|
|
13
|
-
|
|
14
|
-
raw="$(
|
|
15
|
-
codex exec \
|
|
16
|
-
--ephemeral \
|
|
17
|
-
--cd "$REPO_ROOT" \
|
|
18
|
-
-c 'approval_policy="never"' \
|
|
19
|
-
--sandbox read-only \
|
|
20
|
-
--output-schema "$SCHEMA" \
|
|
21
|
-
"You are a strict grading assistant. Respond only with JSON matching the provided schema. Grade this promptfoo rubric literally.
|
|
22
|
-
|
|
23
|
-
${PROMPT}"
|
|
24
|
-
)"
|
|
25
|
-
|
|
26
|
-
printf '%s' "$raw" | awk '
|
|
27
|
-
BEGIN { depth = 0; started = 0 }
|
|
28
|
-
{
|
|
29
|
-
line = $0
|
|
30
|
-
for (i = 1; i <= length(line); i++) {
|
|
31
|
-
c = substr(line, i, 1)
|
|
32
|
-
if (c == "{") { depth++; started = 1 }
|
|
33
|
-
if (started) { buf = buf c }
|
|
34
|
-
if (c == "}") { depth--; if (depth == 0 && started) { print buf; exit } }
|
|
35
|
-
}
|
|
36
|
-
if (started) { buf = buf "\n" }
|
|
37
|
-
}
|
|
38
|
-
END { if (started && depth != 0) print buf }
|
|
39
|
-
' || printf '%s' "$raw"
|
|
@@ -1,56 +0,0 @@
|
|
|
1
|
-
description: |
|
|
2
|
-
Codex wr-architect agent verdict eval. Exercises the generated
|
|
3
|
-
.codex/agents/wr-architect.toml path and the Codex plugin install surface.
|
|
4
|
-
|
|
5
|
-
providers:
|
|
6
|
-
- id: 'exec:bash ./run-codex-agent-eval.sh'
|
|
7
|
-
|
|
8
|
-
defaultTest:
|
|
9
|
-
options:
|
|
10
|
-
provider:
|
|
11
|
-
id: 'exec:bash ./grade-codex-rubric.sh'
|
|
12
|
-
|
|
13
|
-
prompts:
|
|
14
|
-
- '{{prompt}}'
|
|
15
|
-
|
|
16
|
-
tests:
|
|
17
|
-
- description: PASS for aligned pre-edit proposal
|
|
18
|
-
vars:
|
|
19
|
-
prompt: |
|
|
20
|
-
PRE-EDIT review: proposed change updates comments only. No
|
|
21
|
-
architecture-bearing files, dependencies, hooks, workflows, or ADRs
|
|
22
|
-
change. Return the architect verdict.
|
|
23
|
-
assert:
|
|
24
|
-
- type: regex
|
|
25
|
-
value: 'Architecture Review:\s*PASS|PASS'
|
|
26
|
-
|
|
27
|
-
- description: ISSUES FOUND for undocumented dependency
|
|
28
|
-
vars:
|
|
29
|
-
prompt: |
|
|
30
|
-
PRE-EDIT review: proposed change adds a new npm dependency named
|
|
31
|
-
fast-queue to package.json for core task scheduling. No existing ADR
|
|
32
|
-
covers this dependency choice. Return the architect verdict.
|
|
33
|
-
assert:
|
|
34
|
-
- type: regex
|
|
35
|
-
value: 'ISSUES FOUND|Undocumented Decision|new decision'
|
|
36
|
-
|
|
37
|
-
- description: NEEDS DIRECTION when viable options are unpinned
|
|
38
|
-
vars:
|
|
39
|
-
prompt: |
|
|
40
|
-
PRE-EDIT review: proposed change must choose whether plugin
|
|
41
|
-
distribution uses a remote marketplace only or also a repo-local
|
|
42
|
-
marketplace, and the prompt does not pin a direction. Return the
|
|
43
|
-
architect verdict.
|
|
44
|
-
assert:
|
|
45
|
-
- type: regex
|
|
46
|
-
value: 'NEEDS DIRECTION'
|
|
47
|
-
|
|
48
|
-
- description: Unratified Dependency flags unconfirmed ADR dependency
|
|
49
|
-
vars:
|
|
50
|
-
prompt: |
|
|
51
|
-
PRE-EDIT review: proposed change explicitly implements ADR-074, but
|
|
52
|
-
the ADR frontmatter lacks human-oversight: confirmed. Return the
|
|
53
|
-
architect verdict and action.
|
|
54
|
-
assert:
|
|
55
|
-
- type: regex
|
|
56
|
-
value: 'Unratified Dependency|ratify|review-decisions'
|
|
@@ -1,47 +0,0 @@
|
|
|
1
|
-
#!/usr/bin/env bash
|
|
2
|
-
# Codex promptfoo exec-provider driver for the generated wr-architect agent.
|
|
3
|
-
set -euo pipefail
|
|
4
|
-
|
|
5
|
-
SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
|
|
6
|
-
REPO_ROOT="$(cd "${SCRIPT_DIR}/../../../.." && pwd)"
|
|
7
|
-
MARKETPLACE_DIR="$REPO_ROOT"
|
|
8
|
-
PROMPT="${*:-}"
|
|
9
|
-
|
|
10
|
-
if [[ -z "$PROMPT" ]]; then
|
|
11
|
-
echo "run-codex-agent-eval.sh: prompt argument is required" >&2
|
|
12
|
-
exit 2
|
|
13
|
-
fi
|
|
14
|
-
|
|
15
|
-
SOURCE_CODEX_HOME="${CODEX_HOME:-${HOME}/.codex}"
|
|
16
|
-
TMP_CODEX_HOME=""
|
|
17
|
-
|
|
18
|
-
if [[ -n "${WR_CODEX_EVAL_CODEX_HOME:-}" ]]; then
|
|
19
|
-
export CODEX_HOME="$WR_CODEX_EVAL_CODEX_HOME"
|
|
20
|
-
mkdir -p "$CODEX_HOME"
|
|
21
|
-
else
|
|
22
|
-
TMP_CODEX_HOME="$(mktemp -d)"
|
|
23
|
-
chmod 700 "$TMP_CODEX_HOME"
|
|
24
|
-
export CODEX_HOME="$TMP_CODEX_HOME"
|
|
25
|
-
if [[ -f "${SOURCE_CODEX_HOME}/auth.json" ]]; then
|
|
26
|
-
cp "${SOURCE_CODEX_HOME}/auth.json" "$CODEX_HOME/auth.json"
|
|
27
|
-
chmod 600 "$CODEX_HOME/auth.json"
|
|
28
|
-
fi
|
|
29
|
-
if [[ "${WR_CODEX_EVAL_COPY_CONFIG:-0}" == "1" && -f "${SOURCE_CODEX_HOME}/config.toml" ]]; then
|
|
30
|
-
cp "${SOURCE_CODEX_HOME}/config.toml" "$CODEX_HOME/config.toml"
|
|
31
|
-
chmod 600 "$CODEX_HOME/config.toml"
|
|
32
|
-
fi
|
|
33
|
-
trap 'rm -rf "$TMP_CODEX_HOME"' EXIT
|
|
34
|
-
fi
|
|
35
|
-
|
|
36
|
-
codex plugin marketplace add "$MARKETPLACE_DIR" >/dev/null
|
|
37
|
-
codex plugin add wr-architect@windyroad-local >/dev/null
|
|
38
|
-
|
|
39
|
-
exec codex exec \
|
|
40
|
-
--ephemeral \
|
|
41
|
-
--cd "$REPO_ROOT" \
|
|
42
|
-
-c 'approval_policy="never"' \
|
|
43
|
-
--sandbox read-only \
|
|
44
|
-
--dangerously-bypass-hook-trust \
|
|
45
|
-
"Spawn the custom collaborator agent named wr-architect:agent (auto-discovered by Codex from the installed wr-architect plugin's agents/agent.md). If this non-interactive harness cannot spawn the custom agent directly, read .codex/agents/wr-architect.toml and perform the same review inline.
|
|
46
|
-
|
|
47
|
-
${PROMPT}"
|