@f-o-h/cli 0.1.36 → 0.1.37

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/README.md CHANGED
@@ -4,7 +4,7 @@ AI-operator provisioning CLI for Front Of House.
4
4
 
5
5
  Public mirror: https://github.com/iiko38/front-of-house-cli
6
6
 
7
- Current published baseline: `@f-o-h/cli@0.1.36`
7
+ Current published baseline: `@f-o-h/cli@0.1.37`
8
8
 
9
9
  This mirror is a generated release artifact. The private product monorepo is not
10
10
  published here, and no open-source license is granted unless stated separately.
@@ -123,9 +123,13 @@ foh eval external-agent run \
123
123
  --prompt-version blank-setup.v1
124
124
  ```
125
125
 
126
- The command writes a versioned prompt, launches an instrumented shell, captures
127
- FOH CLI commands into `commands.ndjson`, and finalizes `run.json` as an
128
- `external_agent_run.v1` artifact when the shell exits.
126
+ The command writes a versioned prompt, launches an instrumented shell, captures
127
+ FOH CLI commands into `commands.ndjson`, and finalizes `run.json` as an
128
+ `external_agent_run.v1` artifact when the shell exits.
129
+
130
+ Run artifacts include `eval_state` so repeated benchmark runs make reuse
131
+ explicit: org, agent, and widget reuse are expected; fresh paid phone-number
132
+ creation is not expected.
129
133
 
130
134
  For guarded programmable-runner planning:
131
135
 
package/dist/foh.js CHANGED
@@ -32755,7 +32755,7 @@ var StdioServerTransport = class {
32755
32755
  };
32756
32756
 
32757
32757
  // src/lib/cli-version.ts
32758
- var CLI_VERSION = "0.1.36";
32758
+ var CLI_VERSION = "0.1.37";
32759
32759
 
32760
32760
  // src/commands/mcp-serve.ts
32761
32761
  var DEFAULT_TIMEOUT_MS = 12e4;
@@ -39292,6 +39292,17 @@ function buildExecutedRunArtifact(input) {
39292
39292
  ],
39293
39293
  commands_run: commands.map((command) => command.command),
39294
39294
  docs_pages_used: [],
39295
+ eval_state: {
39296
+ org_reuse_expected: true,
39297
+ agent_reuse_expected: true,
39298
+ widget_reuse_expected: true,
39299
+ fresh_org_expected: false,
39300
+ fresh_agent_expected: false,
39301
+ phone_purchase_expected: false,
39302
+ paid_resource_creation_expected: false,
39303
+ spend_policy_expected: NO_SPEND_POLICY,
39304
+ rationale: "Mass external-agent evals benchmark public docs/CLI/API clarity; reuse avoids paid phone and Twilio inventory churn."
39305
+ },
39295
39306
  artifacts: {
39296
39307
  terminal_transcript: relativeArtifactName(input.run.outputs.jsonl),
39297
39308
  command_log: (0, import_fs14.existsSync)((0, import_path12.join)(input.run.run_dir, "commands.ndjson")) ? "commands.ndjson" : null,
@@ -39509,6 +39520,19 @@ function writeSession(runDir, session) {
39509
39520
  `, "utf8");
39510
39521
  return path2;
39511
39522
  }
39523
+ function buildDefaultEvalState() {
39524
+ return {
39525
+ org_reuse_expected: true,
39526
+ agent_reuse_expected: true,
39527
+ widget_reuse_expected: true,
39528
+ fresh_org_expected: false,
39529
+ fresh_agent_expected: false,
39530
+ phone_purchase_expected: false,
39531
+ paid_resource_creation_expected: false,
39532
+ spend_policy_expected: "no_spend",
39533
+ rationale: "Mass external-agent evals benchmark public docs/CLI/API clarity; reuse avoids paid phone and Twilio inventory churn."
39534
+ };
39535
+ }
39512
39536
  function buildRunArtifact(input) {
39513
39537
  const commands = readCommandRecords(input.runDir);
39514
39538
  const startedAt = String(input.session.started_at);
@@ -39545,6 +39569,7 @@ function buildRunArtifact(input) {
39545
39569
  ],
39546
39570
  commands_run: commands.map((command) => command.command),
39547
39571
  docs_pages_used: [],
39572
+ eval_state: buildDefaultEvalState(),
39548
39573
  artifacts: {
39549
39574
  terminal_transcript: null,
39550
39575
  command_log: "commands.ndjson",
@@ -39651,6 +39676,7 @@ function registerEval(program3) {
39651
39676
  manual_intervention_count: 0,
39652
39677
  run_dir: runDir,
39653
39678
  prompt_path: promptPath,
39679
+ eval_state: buildDefaultEvalState(),
39654
39680
  capture_env: {
39655
39681
  [EXTERNAL_AGENT_RUN_DIR_ENV]: runDir,
39656
39682
  [EXTERNAL_AGENT_PROMPT_VERSION_ENV]: promptVersion
@@ -38,6 +38,17 @@
38
38
  "https://frontofhouse.okii.uk/guides/cli-install-and-upgrade",
39
39
  "https://frontofhouse.okii.uk/guides/error-handling-and-debugging"
40
40
  ],
41
+ "eval_state": {
42
+ "org_reuse_expected": true,
43
+ "agent_reuse_expected": true,
44
+ "widget_reuse_expected": true,
45
+ "fresh_org_expected": false,
46
+ "fresh_agent_expected": false,
47
+ "phone_purchase_expected": false,
48
+ "paid_resource_creation_expected": false,
49
+ "spend_policy_expected": "no_spend",
50
+ "rationale": "Mass external-agent evals benchmark public docs/CLI/API clarity; reuse avoids paid phone and Twilio inventory churn."
51
+ },
41
52
  "artifacts": {
42
53
  "terminal_transcript": "terminal-transcript.txt",
43
54
  "proof_bundle": null,
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@f-o-h/cli",
3
- "version": "0.1.36",
3
+ "version": "0.1.37",
4
4
  "description": "FOH CLI - AI-operator provisioning tool for Front Of House",
5
5
  "license": "UNLICENSED",
6
6
  "bin": {
@@ -67,6 +67,21 @@
67
67
  "type": "array",
68
68
  "items": { "type": "string" }
69
69
  },
70
+ "eval_state": {
71
+ "type": "object",
72
+ "properties": {
73
+ "org_reuse_expected": { "type": "boolean" },
74
+ "agent_reuse_expected": { "type": "boolean" },
75
+ "widget_reuse_expected": { "type": "boolean" },
76
+ "fresh_org_expected": { "type": "boolean" },
77
+ "fresh_agent_expected": { "type": "boolean" },
78
+ "phone_purchase_expected": { "type": "boolean" },
79
+ "paid_resource_creation_expected": { "type": "boolean" },
80
+ "spend_policy_expected": { "type": "string" },
81
+ "rationale": { "type": "string" }
82
+ },
83
+ "additionalProperties": true
84
+ },
70
85
  "artifacts": {
71
86
  "type": "object",
72
87
  "properties": {