@f5xc-salesdemos/xcsh 18.49.1 → 18.50.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/package.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
{
|
|
2
2
|
"type": "module",
|
|
3
3
|
"name": "@f5xc-salesdemos/xcsh",
|
|
4
|
-
"version": "18.49.1",
|
|
4
|
+
"version": "18.50.0",
|
|
5
5
|
"description": "Coding agent CLI with read, bash, edit, write tools and session management",
|
|
6
6
|
"homepage": "https://github.com/f5xc-salesdemos/xcsh",
|
|
7
7
|
"author": "Can Boluk",
|
|
@@ -48,12 +48,12 @@
|
|
|
48
48
|
"dependencies": {
|
|
49
49
|
"@agentclientprotocol/sdk": "0.16.1",
|
|
50
50
|
"@mozilla/readability": "^0.6",
|
|
51
|
-
"@f5xc-salesdemos/xcsh-stats": "18.
|
|
52
|
-
"@f5xc-salesdemos/pi-agent-core": "18.
|
|
53
|
-
"@f5xc-salesdemos/pi-ai": "18.
|
|
54
|
-
"@f5xc-salesdemos/pi-natives": "18.
|
|
55
|
-
"@f5xc-salesdemos/pi-tui": "18.
|
|
56
|
-
"@f5xc-salesdemos/pi-utils": "18.
|
|
51
|
+
"@f5xc-salesdemos/xcsh-stats": "18.50.0",
|
|
52
|
+
"@f5xc-salesdemos/pi-agent-core": "18.50.0",
|
|
53
|
+
"@f5xc-salesdemos/pi-ai": "18.50.0",
|
|
54
|
+
"@f5xc-salesdemos/pi-natives": "18.50.0",
|
|
55
|
+
"@f5xc-salesdemos/pi-tui": "18.50.0",
|
|
56
|
+
"@f5xc-salesdemos/pi-utils": "18.50.0",
|
|
57
57
|
"@sinclair/typebox": "^0.34",
|
|
58
58
|
"@xterm/headless": "^6.0",
|
|
59
59
|
"ajv": "^8.18",
|
|
@@ -21,6 +21,7 @@ export const AUTORESEARCH_COMMITTABLE_FILES = [
|
|
|
21
21
|
"autoresearch.sh",
|
|
22
22
|
"autoresearch.checks.sh",
|
|
23
23
|
"autoresearch.ideas.md",
|
|
24
|
+
"SELF_AWARENESS.md",
|
|
24
25
|
] as const;
|
|
25
26
|
export const AUTORESEARCH_LOCAL_STATE_FILES = ["autoresearch.jsonl"] as const;
|
|
26
27
|
export const AUTORESEARCH_LOCAL_STATE_DIRECTORIES = [".autoresearch"] as const;
|
|
@@ -323,6 +323,7 @@ export const createAutoresearchExtension: ExtensionFactory = api => {
|
|
|
323
323
|
const checksPath = path.join(workDir, "autoresearch.checks.sh");
|
|
324
324
|
const ideasPath = path.join(workDir, "autoresearch.ideas.md");
|
|
325
325
|
const programPath = path.join(workDir, "autoresearch.program.md");
|
|
326
|
+
const selfAwarenessPath = path.join(workDir, "SELF_AWARENESS.md");
|
|
326
327
|
const pendingRun =
|
|
327
328
|
runtime.lastRunSummary ??
|
|
328
329
|
(await readPendingRunSummary(workDir, collectLoggedRunNumbers(runtime.state.results)));
|
|
@@ -362,6 +363,8 @@ export const createAutoresearchExtension: ExtensionFactory = api => {
|
|
|
362
363
|
ideas_path: ideasPath,
|
|
363
364
|
has_program: fs.existsSync(programPath),
|
|
364
365
|
program_path: programPath,
|
|
366
|
+
has_self_awareness: fs.existsSync(selfAwarenessPath),
|
|
367
|
+
self_awareness_path: selfAwarenessPath,
|
|
365
368
|
current_segment: runtime.state.currentSegment + 1,
|
|
366
369
|
current_segment_run_count: currentSegmentResults.length,
|
|
367
370
|
has_baseline_metric: baselineMetric !== null,
|
|
@@ -27,6 +27,14 @@ You are running an autonomous experiment loop. Keep iterating until the user int
|
|
|
27
27
|
|
|
28
28
|
Use it as a repo-local strategy overlay for this session. `autoresearch.md` remains the source of truth for benchmark, scope, and constraints.
|
|
29
29
|
{{/if}}
|
|
30
|
+
{{#if has_self_awareness}}
|
|
31
|
+
|
|
32
|
+
### Self-Awareness Manifest
|
|
33
|
+
|
|
34
|
+
`SELF_AWARENESS.md` exists at `{{self_awareness_path}}`.
|
|
35
|
+
|
|
36
|
+
This document defines xcsh's mission, current capability inventory, evaluation dimensions, and known gaps. When the session goal involves self-evaluation, capability improvement, or SE workflow enhancement, read this document first — it is the ground truth for what xcsh is, what it should become, and how to measure progress.
|
|
37
|
+
{{/if}}
|
|
30
38
|
{{#if has_recent_results}}
|
|
31
39
|
|
|
32
40
|
### Current Segment Snapshot
|
|
@@ -218,6 +226,19 @@ Before the first benchmark:
|
|
|
218
226
|
- Optionally add `autoresearch.checks.sh` if correctness or quality needs a hard gate.
|
|
219
227
|
- Call `init_experiment` with arguments that match `autoresearch.md` exactly (benchmark command, metric, unit, direction, scope paths, off limits, constraints).
|
|
220
228
|
- Run and log the baseline.
|
|
229
|
+
{{#if has_self_awareness}}
|
|
230
|
+
|
|
231
|
+
#### SE Self-Evaluation Sessions
|
|
232
|
+
|
|
233
|
+
When the goal involves evaluating or improving xcsh's sales engineering capabilities (not runtime code performance):
|
|
234
|
+
|
|
235
|
+
- Read `SELF_AWARENESS.md` first to understand the current capability inventory and evaluation dimensions
|
|
236
|
+
- Read `autoresearch.program.md` for the SE-specific evaluation strategy
|
|
237
|
+
- Design the benchmark script (`autoresearch.sh`) to test the specific SE capability dimension — product knowledge accuracy, API reliability, prompt effectiveness, or workflow completeness
|
|
238
|
+
- Use quality/accuracy scores as the primary metric (direction: `higher`) rather than timing metrics
|
|
239
|
+
- Focus `Files in Scope` on the prompts, agent definitions, tool descriptions, or service modules relevant to the SE capability being evaluated
|
|
240
|
+
- Record capability status changes in `SELF_AWARENESS.md` when experiments yield durable improvements
|
|
241
|
+
{{/if}}
|
|
221
242
|
|
|
222
243
|
Until `init_experiment` succeeds, only autoresearch control files (`autoresearch.md`, `autoresearch.sh`, `autoresearch.program.md`, `autoresearch.ideas.md`, `autoresearch.checks.sh`) may be edited; after initialization, respect Files in Scope from the contract.
|
|
223
244
|
|
|
@@ -17,17 +17,17 @@ export interface BuildInfo {
|
|
|
17
17
|
}
|
|
18
18
|
|
|
19
19
|
export const BUILD_INFO: BuildInfo = {
|
|
20
|
-
"version": "18.49.1",
|
|
21
|
-
"commit": "
|
|
22
|
-
"shortCommit": "
|
|
20
|
+
"version": "18.50.0",
|
|
21
|
+
"commit": "026774fcc6c6e909bc5a3dffa6f1e019f7bb95d3",
|
|
22
|
+
"shortCommit": "026774f",
|
|
23
23
|
"branch": "main",
|
|
24
|
-
"tag": "v18.
|
|
25
|
-
"commitDate": "2026-05-
|
|
26
|
-
"buildDate": "2026-05-
|
|
27
|
-
"dirty":
|
|
24
|
+
"tag": "v18.50.0",
|
|
25
|
+
"commitDate": "2026-05-08T23:09:25Z",
|
|
26
|
+
"buildDate": "2026-05-08T23:30:02.931Z",
|
|
27
|
+
"dirty": true,
|
|
28
28
|
"prNumber": "",
|
|
29
29
|
"repoUrl": "https://github.com/f5xc-salesdemos/xcsh",
|
|
30
30
|
"repoSlug": "f5xc-salesdemos/xcsh",
|
|
31
|
-
"commitUrl": "https://github.com/f5xc-salesdemos/xcsh/commit/
|
|
32
|
-
"releaseUrl": "https://github.com/f5xc-salesdemos/xcsh/releases/tag/v18.
|
|
31
|
+
"commitUrl": "https://github.com/f5xc-salesdemos/xcsh/commit/026774fcc6c6e909bc5a3dffa6f1e019f7bb95d3",
|
|
32
|
+
"releaseUrl": "https://github.com/f5xc-salesdemos/xcsh/releases/tag/v18.50.0"
|
|
33
33
|
};
|