@f-o-h/cli 0.1.35 → 0.1.37
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/README.md
CHANGED
|
@@ -4,7 +4,7 @@ AI-operator provisioning CLI for Front Of House.
|
|
|
4
4
|
|
|
5
5
|
Public mirror: https://github.com/iiko38/front-of-house-cli
|
|
6
6
|
|
|
7
|
-
Current
|
|
7
|
+
Current published baseline: `@f-o-h/cli@0.1.37`
|
|
8
8
|
|
|
9
9
|
This mirror is a generated release artifact. The private product monorepo is not
|
|
10
10
|
published here, and no open-source license is granted unless stated separately.
|
|
@@ -123,9 +123,13 @@ foh eval external-agent run \
|
|
|
123
123
|
--prompt-version blank-setup.v1
|
|
124
124
|
```
|
|
125
125
|
|
|
126
|
-
The command writes a versioned prompt, launches an instrumented shell, captures
|
|
127
|
-
FOH CLI commands into `commands.ndjson`, and finalizes `run.json` as an
|
|
128
|
-
`external_agent_run.v1` artifact when the shell exits.
|
|
126
|
+
The command writes a versioned prompt, launches an instrumented shell, captures
|
|
127
|
+
FOH CLI commands into `commands.ndjson`, and finalizes `run.json` as an
|
|
128
|
+
`external_agent_run.v1` artifact when the shell exits.
|
|
129
|
+
|
|
130
|
+
Run artifacts include `eval_state` so repeated benchmark runs make reuse
|
|
131
|
+
explicit: org, agent, and widget reuse are expected; fresh paid phone-number
|
|
132
|
+
creation is not expected.
|
|
129
133
|
|
|
130
134
|
For guarded programmable-runner planning:
|
|
131
135
|
|
package/dist/foh.js
CHANGED
|
@@ -32755,7 +32755,7 @@ var StdioServerTransport = class {
|
|
|
32755
32755
|
};
|
|
32756
32756
|
|
|
32757
32757
|
// src/lib/cli-version.ts
|
|
32758
|
-
var CLI_VERSION = "0.1.35";
|
|
32758
|
+
var CLI_VERSION = "0.1.37";
|
|
32759
32759
|
|
|
32760
32760
|
// src/commands/mcp-serve.ts
|
|
32761
32761
|
var DEFAULT_TIMEOUT_MS = 12e4;
|
|
@@ -39292,6 +39292,17 @@ function buildExecutedRunArtifact(input) {
|
|
|
39292
39292
|
],
|
|
39293
39293
|
commands_run: commands.map((command) => command.command),
|
|
39294
39294
|
docs_pages_used: [],
|
|
39295
|
+
eval_state: {
|
|
39296
|
+
org_reuse_expected: true,
|
|
39297
|
+
agent_reuse_expected: true,
|
|
39298
|
+
widget_reuse_expected: true,
|
|
39299
|
+
fresh_org_expected: false,
|
|
39300
|
+
fresh_agent_expected: false,
|
|
39301
|
+
phone_purchase_expected: false,
|
|
39302
|
+
paid_resource_creation_expected: false,
|
|
39303
|
+
spend_policy_expected: NO_SPEND_POLICY,
|
|
39304
|
+
rationale: "Mass external-agent evals benchmark public docs/CLI/API clarity; reuse avoids paid phone and Twilio inventory churn."
|
|
39305
|
+
},
|
|
39295
39306
|
artifacts: {
|
|
39296
39307
|
terminal_transcript: relativeArtifactName(input.run.outputs.jsonl),
|
|
39297
39308
|
command_log: (0, import_fs14.existsSync)((0, import_path12.join)(input.run.run_dir, "commands.ndjson")) ? "commands.ndjson" : null,
|
|
@@ -39509,6 +39520,19 @@ function writeSession(runDir, session) {
|
|
|
39509
39520
|
`, "utf8");
|
|
39510
39521
|
return path2;
|
|
39511
39522
|
}
|
|
39523
|
+
function buildDefaultEvalState() {
|
|
39524
|
+
return {
|
|
39525
|
+
org_reuse_expected: true,
|
|
39526
|
+
agent_reuse_expected: true,
|
|
39527
|
+
widget_reuse_expected: true,
|
|
39528
|
+
fresh_org_expected: false,
|
|
39529
|
+
fresh_agent_expected: false,
|
|
39530
|
+
phone_purchase_expected: false,
|
|
39531
|
+
paid_resource_creation_expected: false,
|
|
39532
|
+
spend_policy_expected: "no_spend",
|
|
39533
|
+
rationale: "Mass external-agent evals benchmark public docs/CLI/API clarity; reuse avoids paid phone and Twilio inventory churn."
|
|
39534
|
+
};
|
|
39535
|
+
}
|
|
39512
39536
|
function buildRunArtifact(input) {
|
|
39513
39537
|
const commands = readCommandRecords(input.runDir);
|
|
39514
39538
|
const startedAt = String(input.session.started_at);
|
|
@@ -39545,6 +39569,7 @@ function buildRunArtifact(input) {
|
|
|
39545
39569
|
],
|
|
39546
39570
|
commands_run: commands.map((command) => command.command),
|
|
39547
39571
|
docs_pages_used: [],
|
|
39572
|
+
eval_state: buildDefaultEvalState(),
|
|
39548
39573
|
artifacts: {
|
|
39549
39574
|
terminal_transcript: null,
|
|
39550
39575
|
command_log: "commands.ndjson",
|
|
@@ -39651,6 +39676,7 @@ function registerEval(program3) {
|
|
|
39651
39676
|
manual_intervention_count: 0,
|
|
39652
39677
|
run_dir: runDir,
|
|
39653
39678
|
prompt_path: promptPath,
|
|
39679
|
+
eval_state: buildDefaultEvalState(),
|
|
39654
39680
|
capture_env: {
|
|
39655
39681
|
[EXTERNAL_AGENT_RUN_DIR_ENV]: runDir,
|
|
39656
39682
|
[EXTERNAL_AGENT_PROMPT_VERSION_ENV]: promptVersion
|
|
@@ -38,6 +38,17 @@
|
|
|
38
38
|
"https://frontofhouse.okii.uk/guides/cli-install-and-upgrade",
|
|
39
39
|
"https://frontofhouse.okii.uk/guides/error-handling-and-debugging"
|
|
40
40
|
],
|
|
41
|
+
"eval_state": {
|
|
42
|
+
"org_reuse_expected": true,
|
|
43
|
+
"agent_reuse_expected": true,
|
|
44
|
+
"widget_reuse_expected": true,
|
|
45
|
+
"fresh_org_expected": false,
|
|
46
|
+
"fresh_agent_expected": false,
|
|
47
|
+
"phone_purchase_expected": false,
|
|
48
|
+
"paid_resource_creation_expected": false,
|
|
49
|
+
"spend_policy_expected": "no_spend",
|
|
50
|
+
"rationale": "Mass external-agent evals benchmark public docs/CLI/API clarity; reuse avoids paid phone and Twilio inventory churn."
|
|
51
|
+
},
|
|
41
52
|
"artifacts": {
|
|
42
53
|
"terminal_transcript": "terminal-transcript.txt",
|
|
43
54
|
"proof_bundle": null,
|
package/package.json
CHANGED
|
@@ -67,6 +67,21 @@
|
|
|
67
67
|
"type": "array",
|
|
68
68
|
"items": { "type": "string" }
|
|
69
69
|
},
|
|
70
|
+
"eval_state": {
|
|
71
|
+
"type": "object",
|
|
72
|
+
"properties": {
|
|
73
|
+
"org_reuse_expected": { "type": "boolean" },
|
|
74
|
+
"agent_reuse_expected": { "type": "boolean" },
|
|
75
|
+
"widget_reuse_expected": { "type": "boolean" },
|
|
76
|
+
"fresh_org_expected": { "type": "boolean" },
|
|
77
|
+
"fresh_agent_expected": { "type": "boolean" },
|
|
78
|
+
"phone_purchase_expected": { "type": "boolean" },
|
|
79
|
+
"paid_resource_creation_expected": { "type": "boolean" },
|
|
80
|
+
"spend_policy_expected": { "type": "string" },
|
|
81
|
+
"rationale": { "type": "string" }
|
|
82
|
+
},
|
|
83
|
+
"additionalProperties": true
|
|
84
|
+
},
|
|
70
85
|
"artifacts": {
|
|
71
86
|
"type": "object",
|
|
72
87
|
"properties": {
|