ultimate-pi 0.4.0 → 0.5.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (94) hide show
  1. package/.agents/skills/harness-decisions/SKILL.md +15 -0
  2. package/.agents/skills/scrapling-web/SKILL.md +45 -40
  3. package/.agents/skills/wiki-autoresearch/SKILL.md +3 -3
  4. package/.pi/PACKAGING.md +3 -2
  5. package/.pi/SYSTEM.md +12 -13
  6. package/.pi/agents/pi-pi/agent-expert.md +3 -3
  7. package/.pi/extensions/harness-web-guard.ts +95 -0
  8. package/.pi/extensions/harness-web-tools.ts +209 -0
  9. package/.pi/extensions/lib/harness-vcc-settings.ts +50 -0
  10. package/.pi/extensions/lib/harness-web/run-cli.ts +92 -0
  11. package/.pi/extensions/ultimate-pi-vcc.ts +17 -0
  12. package/.pi/harness/docs/adrs/0030-inhouse-vcc-compaction.md +40 -0
  13. package/.pi/harness/docs/adrs/README.md +1 -0
  14. package/.pi/harness/env.harness.template +3 -1
  15. package/.pi/prompts/harness-setup.md +48 -2
  16. package/.pi/scripts/harness-cli-verify.sh +12 -3
  17. package/.pi/scripts/harness-searxng-bootstrap.mjs +270 -0
  18. package/.pi/scripts/harness-web-search.md +24 -5
  19. package/.pi/scripts/harness-web.py +24 -7
  20. package/.pi/scripts/harness_web/config.py +37 -3
  21. package/.pi/scripts/harness_web/output.py +8 -2
  22. package/.pi/scripts/harness_web/search.py +22 -0
  23. package/.pi/scripts/harness_web/search_ddg.py +1 -5
  24. package/.pi/scripts/harness_web/search_searxng.py +100 -0
  25. package/.pi/scripts/vendor-pi-vcc-settings.stub.ts +8 -0
  26. package/.pi/scripts/vendor-sync-pi-vcc.sh +40 -0
  27. package/.pi/settings.example.json +1 -6
  28. package/CHANGELOG.md +20 -6
  29. package/THIRD_PARTY_NOTICES.md +8 -22
  30. package/package.json +7 -6
  31. package/vendor/pi-vcc/README.md +215 -0
  32. package/vendor/pi-vcc/UPSTREAM_PIN.md +12 -0
  33. package/vendor/pi-vcc/demo.gif +0 -0
  34. package/vendor/pi-vcc/index.ts +12 -0
  35. package/vendor/pi-vcc/package.json +26 -0
  36. package/vendor/pi-vcc/scripts/audit-sessions.ts +88 -0
  37. package/vendor/pi-vcc/scripts/benchmark-real-sessions.ts +25 -0
  38. package/vendor/pi-vcc/scripts/compare-before-after.ts +36 -0
  39. package/vendor/pi-vcc/scripts/dump-branch-output.ts +20 -0
  40. package/vendor/pi-vcc/src/commands/pi-vcc.ts +36 -0
  41. package/vendor/pi-vcc/src/commands/vcc-recall.ts +65 -0
  42. package/vendor/pi-vcc/src/core/brief.ts +381 -0
  43. package/vendor/pi-vcc/src/core/build-sections.ts +79 -0
  44. package/vendor/pi-vcc/src/core/content.ts +60 -0
  45. package/vendor/pi-vcc/src/core/filter-noise.ts +42 -0
  46. package/vendor/pi-vcc/src/core/format-recall.ts +27 -0
  47. package/vendor/pi-vcc/src/core/format.ts +49 -0
  48. package/vendor/pi-vcc/src/core/lineage.ts +26 -0
  49. package/vendor/pi-vcc/src/core/load-messages.ts +41 -0
  50. package/vendor/pi-vcc/src/core/normalize.ts +66 -0
  51. package/vendor/pi-vcc/src/core/recall-scope.ts +14 -0
  52. package/vendor/pi-vcc/src/core/render-entries.ts +55 -0
  53. package/vendor/pi-vcc/src/core/report.ts +237 -0
  54. package/vendor/pi-vcc/src/core/sanitize.ts +5 -0
  55. package/vendor/pi-vcc/src/core/search-entries.ts +221 -0
  56. package/vendor/pi-vcc/src/core/settings.ts +8 -0
  57. package/vendor/pi-vcc/src/core/skill-collapse.ts +35 -0
  58. package/vendor/pi-vcc/src/core/summarize.ts +157 -0
  59. package/vendor/pi-vcc/src/core/tool-args.ts +14 -0
  60. package/vendor/pi-vcc/src/details.ts +7 -0
  61. package/vendor/pi-vcc/src/extract/commits.ts +69 -0
  62. package/vendor/pi-vcc/src/extract/files.ts +80 -0
  63. package/vendor/pi-vcc/src/extract/goals.ts +79 -0
  64. package/vendor/pi-vcc/src/extract/preferences.ts +55 -0
  65. package/vendor/pi-vcc/src/hooks/before-compact.ts +314 -0
  66. package/vendor/pi-vcc/src/sections.ts +12 -0
  67. package/vendor/pi-vcc/src/tools/recall.ts +109 -0
  68. package/vendor/pi-vcc/src/types.ts +14 -0
  69. package/vendor/pi-vcc/tests/before-compact-hook.test.ts +204 -0
  70. package/vendor/pi-vcc/tests/before-compact.test.ts +145 -0
  71. package/vendor/pi-vcc/tests/brief.test.ts +206 -0
  72. package/vendor/pi-vcc/tests/build-sections.test.ts +59 -0
  73. package/vendor/pi-vcc/tests/compile.test.ts +80 -0
  74. package/vendor/pi-vcc/tests/content.test.ts +31 -0
  75. package/vendor/pi-vcc/tests/extract-goals.test.ts +86 -0
  76. package/vendor/pi-vcc/tests/extract-preferences.test.ts +30 -0
  77. package/vendor/pi-vcc/tests/filter-noise.test.ts +61 -0
  78. package/vendor/pi-vcc/tests/fixtures.ts +61 -0
  79. package/vendor/pi-vcc/tests/format-recall.test.ts +30 -0
  80. package/vendor/pi-vcc/tests/format.test.ts +62 -0
  81. package/vendor/pi-vcc/tests/lineage.test.ts +33 -0
  82. package/vendor/pi-vcc/tests/load-messages.test.ts +51 -0
  83. package/vendor/pi-vcc/tests/normalize.test.ts +97 -0
  84. package/vendor/pi-vcc/tests/real-sessions.test.ts +38 -0
  85. package/vendor/pi-vcc/tests/recall-expand.test.ts +15 -0
  86. package/vendor/pi-vcc/tests/recall-scope.test.ts +32 -0
  87. package/vendor/pi-vcc/tests/recall-tool-scope.test.ts +67 -0
  88. package/vendor/pi-vcc/tests/render-entries.test.ts +62 -0
  89. package/vendor/pi-vcc/tests/report.test.ts +44 -0
  90. package/vendor/pi-vcc/tests/sanitize.test.ts +24 -0
  91. package/vendor/pi-vcc/tests/search-entries.test.ts +144 -0
  92. package/vendor/pi-vcc/tests/support/load-session.ts +23 -0
  93. package/vendor/pi-vcc/tests/support/real-sessions.ts +51 -0
  94. package/.pi/pi-vcc-config.json +0 -4
@@ -0,0 +1,157 @@
1
+ import type { Message } from "@mariozechner/pi-ai";
2
+ import type { FileOps } from "../types";
3
+ import { normalize } from "./normalize";
4
+ import { filterNoise } from "./filter-noise";
5
+ import { buildSections } from "./build-sections";
6
+ import { formatSummary, capBrief, RECALL_NOTE } from "./format";
7
+
8
/** Arguments accepted by `compile`. */
export interface CompileInput {
  /** Conversation messages that are normalized, noise-filtered and summarized. */
  messages: Message[];
  /** Summary from an earlier compaction; when present it is merged with the fresh summary. */
  previousSummary?: string;
  /**
   * File operations supplied by the caller.
   * NOTE(review): `compile` in this file never reads this field — confirm whether it
   * is meant to be forwarded to section building.
   */
  fileOps?: FileOps;
}
13
+
14
/** Header names of the bracketed summary sections, in the order they are merged and emitted. */
const HEADER_NAMES = [
  "Session Goal",
  "Files And Changes",
  "Commits",
  "Outstanding Context",
  "User Preferences",
];

/** Divider written between the header sections and the brief transcript. */
const SEPARATOR = "\n\n---\n\n";
17
+
18
/**
 * Pull one `[header]` section out of a summary.
 *
 * The section starts at the first occurrence of `[header]` and runs until the
 * nearest following known header or `---` separator, or to the end of the text
 * when neither follows.
 *
 * @param text Summary text to search.
 * @param header Header name without the surrounding brackets.
 * @returns The trimmed section including its `[header]` line, or "" when absent.
 */
const sectionOf = (text: string, header: string): string => {
  const begin = text.indexOf(`[${header}]`);
  if (begin < 0) return "";
  const tail = text.slice(begin);

  // Offsets within `tail` where this section could end. Offset 0 is the
  // section's own tag, so only strictly positive offsets count.
  const stops: number[] = [];
  for (const other of HEADER_NAMES) {
    if (other === header) continue;
    const at = tail.indexOf(`[${other}]`);
    if (at > 0) stops.push(at);
  }
  const separatorAt = tail.indexOf("\n\n---\n\n");
  if (separatorAt > 0) stops.push(separatorAt);

  if (stops.length === 0) return tail.trim();
  return tail.slice(0, Math.min(...stops)).trim();
};
34
+
35
/**
 * Return the brief transcript: everything after the first separator, trimmed.
 * Yields "" when the text contains no separator.
 */
const briefOf = (text: string): string => {
  const at = text.indexOf(SEPARATOR);
  return at < 0 ? "" : text.slice(at + SEPARATOR.length).trim();
};
41
+
42
/**
 * Merge the previous and fresh text of one header section.
 *
 * - "Outstanding Context" is volatile: the fresh text always wins.
 * - If only one side has content, that side is returned unchanged.
 * - "Files And Changes" is merged per category by `mergeFileLines`.
 * - Every other header is merged as a de-duplicated bullet list that keeps the
 *   most recent entries (8 for "Session Goal" and "Commits", 15 otherwise).
 *
 * @returns The merged section text, or "" when no bullet survives.
 */
const mergeHeaderSection = (header: string, prev: string, fresh: string): string => {
  if (header === "Outstanding Context") return fresh;
  if (!prev) return fresh;
  if (!fresh) return prev;
  if (header === "Files And Changes") return mergeFileLines(prev, fresh);

  // Keep only "- " bullets and drop any line carrying skill markup.
  const bulletsOf = (section: string): string[] =>
    section
      .split("\n")
      .filter((line) => line.startsWith("- ") && !(line.includes("<skill") || line.includes("</skill")));

  const unique = Array.from(new Set(bulletsOf(prev).concat(bulletsOf(fresh))));
  const limit = header === "Session Goal" || header === "Commits" ? 8 : 15;
  // A negative slice keeps the tail, i.e. the most recently added bullets.
  const kept = unique.slice(-limit);
  return kept.length === 0 ? "" : `[${header}]\n${kept.join("\n")}`;
};
64
+
65
/**
 * Merge two "Files And Changes" sections category by category.
 *
 * Lines of the form `- Modified: a, b (+N more)` (likewise `Created` and `Read`)
 * are parsed from both inputs, previous first. Paths are de-duplicated per
 * category, and a path listed as Modified is removed from Created. Each category
 * is rendered with at most 10 paths followed by a `(+N more)` suffix.
 *
 * @returns The rebuilt section, or "" when no path was found.
 */
const mergeFileLines = (prev: string, fresh: string): string => {
  const modified = new Set<string>();
  const created = new Set<string>();
  const read = new Set<string>();
  const buckets: Array<[string, Set<string>]> = [
    ["- Modified: ", modified],
    ["- Created: ", created],
    ["- Read: ", read],
  ];

  for (const line of [...prev.split("\n"), ...fresh.split("\n")]) {
    const bucket = buckets.find(([prefix]) => line.startsWith(prefix));
    if (!bucket) continue;
    const [prefix, paths] = bucket;
    // Drop a trailing "(+N more)" marker before splitting the path list.
    const listed = line.slice(prefix.length).replace(/\s*\(\+\d+ more\)\s*$/, "");
    for (const piece of listed.split(",")) {
      const path = piece.trim();
      if (path) paths.add(path);
    }
  }

  // A file that shows up as Modified is not reported as Created.
  for (const path of modified) created.delete(path);

  const render = (label: string, paths: Set<string>, limit: number): string | null => {
    if (paths.size === 0) return null;
    const all = Array.from(paths);
    const hidden = all.length - limit;
    const shown = all.slice(0, limit).join(", ");
    return hidden > 0 ? `- ${label}: ${shown} (+${hidden} more)` : `- ${label}: ${shown}`;
  };

  const lines = [
    render("Modified", modified, 10),
    render("Created", created, 10),
    render("Read", read, 10),
  ].filter((line): line is string => line !== null);

  return lines.length === 0 ? "" : `[Files And Changes]\n${lines.join("\n")}`;
};
104
+
105
/**
 * Join the previous and fresh brief transcripts with a blank line between them.
 * When either side is empty the other is returned unchanged.
 */
const mergeBriefTranscript = (prev: string, fresh: string): string => {
  if (prev && fresh) return `${prev}\n\n${fresh}`;
  return prev ? prev : fresh;
};
110
+
111
/**
 * Merge a previous summary with a freshly built one.
 *
 * Each known header section is merged individually and empty results are dropped.
 * The two brief transcripts are concatenated and passed through `capBrief`. The
 * header part and the brief part are then joined with the separator.
 */
const mergePrevious = (prev: string, fresh: string): string => {
  const headerBlocks: string[] = [];
  for (const header of HEADER_NAMES) {
    const merged = mergeHeaderSection(header, sectionOf(prev, header), sectionOf(fresh, header));
    if (merged) headerBlocks.push(merged);
  }

  const brief = mergeBriefTranscript(briefOf(prev), briefOf(fresh));

  const out: string[] = [];
  if (headerBlocks.length > 0) out.push(headerBlocks.join("\n\n"));
  if (brief) out.push(capBrief(brief));
  return out.join(SEPARATOR);
};
136
+
137
/**
 * Build the compaction summary for a set of messages.
 *
 * The messages are normalized, noise-filtered, turned into sections and formatted
 * into a fresh summary. When a previous summary is supplied, any recall note
 * baked into it is stripped first (so the merge does not re-stack it inside the
 * brief) and the two summaries are merged. The recall note is appended once,
 * after a separator.
 *
 * NOTE(review): `input.fileOps` is not read here — confirm whether it should be
 * passed on to section building.
 *
 * @returns The final summary text, or "" when there is nothing to summarize.
 */
export const compile = (input: CompileInput): string => {
  const fresh = formatSummary(buildSections({ blocks: filterNoise(normalize(input.messages)) }));
  const prev = input.previousSummary ? stripRecallNote(input.previousSummary) : undefined;
  const merged = prev ? mergePrevious(prev, fresh) : fresh;
  return merged ? merged + SEPARATOR + RECALL_NOTE : "";
};
150
+
151
/**
 * Cut the text at the last occurrence of the recall note and remove the
 * separator and whitespace that preceded it. This covers both the
 * `---`-separated form and a bare trailing note. Text without the note is
 * returned unchanged.
 */
const stripRecallNote = (text: string): string => {
  const noteAt = text.lastIndexOf(RECALL_NOTE);
  if (noteAt < 0) return text;
  const head = text.slice(0, noteAt);
  return head.replace(/\s*(?:\n\n---\n\n)?\s*$/, "").trimEnd();
};
@@ -0,0 +1,14 @@
1
/**
 * Find a file path among tool-call arguments.
 *
 * Checks the keys `path`, `file_path`, `filePath` and `file` in that order and
 * returns the first value that is a string (an empty string counts).
 *
 * @returns The path, or `null` when none of the keys holds a string.
 */
export const extractPath = (args: Record<string, unknown>): string | null => {
  const key = ["path", "file_path", "filePath", "file"].find(
    (name) => typeof args[name] === "string",
  );
  return key === undefined ? null : (args[key] as string);
};
7
+
8
/**
 * Produce a one-line summary of tool-call arguments.
 *
 * Preference order: a non-empty file path (`path=…`), a string `command`
 * (`command=…`), a string `query` (`query=…`). Otherwise the argument names are
 * joined with ", ".
 */
export const summarizeToolArgs = (args: Record<string, unknown>): string => {
  const path = extractPath(args);
  if (path) return `path=${path}`;
  for (const field of ["command", "query"]) {
    const value = args[field];
    if (typeof value === "string") return `${field}=${value}`;
  }
  return Object.keys(args).join(", ");
};
@@ -0,0 +1,7 @@
1
/**
 * Metadata record describing one compaction.
 * NOTE(review): field meanings below are inferred from the names only — confirm
 * against the code that produces this record.
 */
export interface PiVccCompactionDetails {
  /** Identifier of the compactor that produced the summary. */
  compactor: "pi-vcc" | "ultimate-pi-vcc";
  /** Numeric version tag (presumably of this details format — confirm). */
  version: number;
  /** Section names (presumably those present in the summary — confirm). */
  sections: string[];
  /** Number of source messages (presumably those fed into the compaction — confirm). */
  sourceMessageCount: number;
  /** Whether a previous summary was used (presumably merged into the result — confirm). */
  previousSummaryUsed: boolean;
}
@@ -0,0 +1,69 @@
1
+ import type { NormalizedBlock } from "../types";
2
+
3
/** One git commit recovered from the conversation. */
interface CommitInfo {
  /** Short commit hash taken from the command output, when one was found. */
  hash?: string;
  /** First line of the commit message passed to `git commit -m`. */
  message: string;
}
7
+
8
/**
 * Captures the `-m` message of a `git commit` command. The message may be
 * double-quoted (group 1), single-quoted (group 2) or `$'…'`-quoted (group 3).
 * Backslash-escaped characters inside the quotes are accepted.
 */
const COMMIT_MSG_RE =
  /git\s+commit[^\n]*?-m\s+(?:"((?:[^"\\]|\\.)*)"|'((?:[^'\\]|\\.)*)'|\$?'((?:[^'\\]|\\.)*)')/;

/** Fallback hash matcher: any standalone run of 7-12 lowercase hex characters. */
const HASH_RE = /\b([0-9a-f]{7,12})\b/;
11
+
12
/**
 * Return the trimmed first line of a text. A line ends at a real newline or at
 * the two-character escape sequence `\n`.
 */
const firstLineOf = (text: string): string => {
  const [head = ""] = text.split(/\\n|\n/);
  return head.trim();
};
16
+
17
/** Turn backslash-escaped quotes (`\"`, `\'`) back into plain quotes and trim the result. */
const cleanMessage = (msg: string): string => {
  const doubleUnescaped = msg.replace(/\\"/g, '"');
  return doubleUnescaped.replace(/\\'/g, "'").trim();
};
19
+
20
/**
 * Collect git commits from `bash` tool calls that run `git commit -m "..."`.
 *
 * The first line of the message is kept. A hash is looked up in tool results
 * among the two blocks that follow the call, trying in order the `[branch hash]`
 * form, the `hash..hash` range form (second hash), then any bare 7-12 character
 * hex token. Commits are de-duplicated by hash and message.
 */
export const extractCommits = (blocks: NormalizedBlock[]): CommitInfo[] => {
  const collected: CommitInfo[] = [];
  const seenKeys = new Set<string>();

  for (const [index, block] of blocks.entries()) {
    if (block.kind !== "tool_call" || block.name !== "bash") continue;
    const command = typeof block.args.command === "string" ? block.args.command : "";
    if (!/\bgit\s+commit\b/.test(command)) continue;

    const parsed = command.match(COMMIT_MSG_RE);
    if (!parsed) continue;
    const message = firstLineOf(cleanMessage(parsed[1] ?? parsed[2] ?? parsed[3] ?? ""));
    if (!message) continue;

    // Scan at most the next two blocks for a tool result that carries a hash.
    let hash: string | undefined;
    const scanEnd = Math.min(blocks.length, index + 3);
    for (let next = index + 1; next < scanEnd && hash === undefined; next++) {
      const result = blocks[next];
      if (result.kind !== "tool_result") continue;
      const output = result.text;
      hash =
        output.match(/\[\S+\s+([0-9a-f]{7,12})\]/)?.[1] ??
        output.match(/\b([0-9a-f]{7,12})\.\.([0-9a-f]{7,12})\b/)?.[2] ??
        output.match(HASH_RE)?.[1];
    }

    const key = `${hash ?? ""}::${message}`;
    if (seenKeys.has(key)) continue;
    seenKeys.add(key);
    collected.push({ hash, message });
  }

  return collected;
};
60
+
61
/**
 * Render commits as display lines, keeping only the most recent `limit` entries.
 * A commit with a hash becomes `hash: message`; one without is just the message.
 */
export const formatCommits = (commits: CommitInfo[], limit = 8): string[] =>
  commits
    .slice(-limit)
    .map(({ hash, message }) => (hash ? `${hash}: ${message}` : `${message}`));
@@ -0,0 +1,80 @@
1
+ import type { FileOps, NormalizedBlock } from "../types";
2
+ import { extractPath } from "../core/tool-args";
3
+
4
/** Paths touched during the session, grouped by kind of access. */
interface FileActivity {
  /** Paths passed to read tools. */
  read: Set<string>;
  /** Paths passed to edit or write tools. */
  modified: Set<string>;
  /** Paths passed to write tools. */
  created: Set<string>;
}
9
+
10
/**
 * Tool names whose path argument counts as a file read.
 *
 * The lowercase `read` is included so that this set matches the write and
 * create sets, which already accept the lowercase `edit` / `write` spellings.
 * Without it, read calls that use the lowercase tool name were never recorded.
 */
const FILE_READ_TOOLS = new Set([
  "Read", "read", "read_file", "View",
]);

/** Tool names whose path argument counts as a file modification. */
const FILE_WRITE_TOOLS = new Set([
  "Edit", "Write", "edit", "write", "edit_file", "write_file",
  "MultiEdit",
]);

/**
 * Tool names whose path argument counts as a file creation. Every name here is
 * also in `FILE_WRITE_TOOLS`, so a write is recorded as both created and modified.
 */
const FILE_CREATE_TOOLS = new Set([
  "Write", "write", "write_file",
]);
22
+
23
/**
 * Compute the longest directory prefix shared by all absolute paths in `paths`.
 *
 * Only paths starting with "/" take part. The final segment of the shortest path
 * is never counted as part of the prefix. Returns "" when fewer than two absolute
 * paths are given or when they share nothing beyond the root. A non-empty result
 * always ends with "/".
 */
const longestCommonDirPrefix = (paths: string[]): string => {
  const segmented = paths.filter((p) => p.startsWith("/")).map((p) => p.split("/"));
  if (segmented.length < 2) return "";

  const [first, ...others] = segmented;
  const shortest = segmented.reduce((least, parts) => Math.min(least, parts.length), Infinity);

  // Count leading segments shared by every path. Index 0 is the empty segment
  // before the root slash.
  let shared = 0;
  for (; shared < shortest - 1; shared++) {
    const segment = first[shared];
    if (others.some((parts) => parts[shared] !== segment)) break;
  }

  // Fewer than two shared segments means only the root "/" is common.
  return shared < 2 ? "" : `${first.slice(0, shared).join("/")}/`;
};
41
+
42
/**
 * Return a copy of `set` in which `prefix` is removed from every path that starts
 * with it. With an empty prefix the input set itself is returned.
 */
const trimPaths = (set: Set<string>, prefix: string): Set<string> => {
  if (prefix === "") return set;
  return new Set(
    Array.from(set, (path) => (path.startsWith(prefix) ? path.slice(prefix.length) : path)),
  );
};
50
+
51
/**
 * Gather the files read, modified and created during the session.
 *
 * The sets start from the optional `fileOps` lists and are extended with the
 * path argument of every tool call whose tool name is in the read, write or
 * create set. If the absolute paths share a directory prefix, that prefix is
 * trimmed from every path.
 */
export const extractFiles = (
  blocks: NormalizedBlock[],
  fileOps?: FileOps,
): FileActivity => {
  const read = new Set<string>(fileOps?.readFiles ?? []);
  const modified = new Set<string>(fileOps?.modifiedFiles ?? []);
  const created = new Set<string>(fileOps?.createdFiles ?? []);

  for (const block of blocks) {
    if (block.kind !== "tool_call") continue;
    const path = extractPath(block.args);
    if (!path) continue;

    const tool = block.name;
    if (FILE_READ_TOOLS.has(tool)) read.add(path);
    if (FILE_WRITE_TOOLS.has(tool)) modified.add(path);
    if (FILE_CREATE_TOOLS.has(tool)) created.add(path);
  }

  // trimPaths hands back the same set when the prefix is empty.
  const prefix = longestCommonDirPrefix([...read, ...modified, ...created]);
  return {
    read: trimPaths(read, prefix),
    modified: trimPaths(modified, prefix),
    created: trimPaths(created, prefix),
  };
};
@@ -0,0 +1,79 @@
1
+ import type { NormalizedBlock } from "../types";
2
+ import { nonEmptyLines, clip } from "../core/content";
3
+ import { collapseSkillLines } from "../core/skill-collapse";
4
+
5
/** Phrases that signal the user is changing direction. */
const SCOPE_CHANGE_RE =
  /\b(instead|actually|change of plan|forget that|new task|switch to|now I want|pivot|let'?s do|stop .* and)\b/i;

/** Verbs that signal the user is asking for a task. */
const TASK_RE =
  /\b(fix|implement|add|create|build|refactor|debug|investigate|update|remove|delete|migrate|deploy|test|write|set up)\b/i;

/** Short acknowledgements, plus any line that begins with the word "ok". */
const NOISE_SHORT_RE = /^(ok|yes|no|sure|yeah|yep|go|hi|hey|thx|thanks|ok\b.*|y|n|k)\s*[.!?]*$/i;

/**
 * Lines that are clearly not user goals: box-drawing or bracket-led output, code
 * fences, code or spreadsheet-formula openers, URLs and absolute paths, text with
 * a literal `\n` escape, and command-template boilerplate such as `/issues`
 * ("For each ...", "Read the issue in full ...").
 */
const NON_GOAL_RE =
  /^\s*[\[│├└─╭╰]|```|^\s*(=[A-Z]+\(|function |const |let |var |import |export |class )|^(https?:|file:|\/[A-Za-z])|\\n|^\s*For each\b|\bin full\b[^\n]*\b(comments|issue|issues|PRs?|linked)\b/;

/**
 * Marks the start of a command template (e.g. `/issues`) within a user message.
 * Goal collection stops at the first line that matches.
 */
const TEMPLATE_SIGNAL_RE =
  /^\s*(For each\b|Do NOT implement\b|Analyze and propose\b|If Task\/context\b|Output:\s*$)/i;
23
+
24
/**
 * Keep only the lines before the first command-template signal line. The input
 * array is returned as is when no line matches.
 */
const truncateAtTemplate = (lines: string[]): string[] => {
  const cut = lines.findIndex((line) => TEMPLATE_SIGNAL_RE.test(line));
  if (cut < 0) return lines;
  return lines.slice(0, cut);
};
28
+
29
/**
 * Remove a leading list marker (`-`, `*`, `+` or `N.`) together with the
 * whitespace after it, then trim the line.
 */
const stripLeadingBullet = (line: string): string => {
  const withoutMarker = line.replace(/^\s*(?:[-*+]|\d+\.)\s+/, "");
  return withoutMarker.trim();
};
31
+
32
/** Upper bound on the length of a goal line, in characters. */
const MAX_GOAL_CHARS = 200;

/**
 * Decide whether a line is worth keeping as a goal. Its trimmed length must be
 * more than 5 and at most `MAX_GOAL_CHARS`, and it must match neither the
 * short-noise pattern nor the non-goal pattern.
 */
const isSubstantiveGoal = (text: string): boolean => {
  const candidate = text.trim();
  const lengthOk = candidate.length > 5 && candidate.length <= MAX_GOAL_CHARS;
  return lengthOk && !NOISE_SHORT_RE.test(candidate) && !NON_GOAL_RE.test(candidate);
};
42
+
43
// Scope-change and task intent are tested only on the leading portion of a user
// block, so pasted output below the actual instruction cannot trigger a match.
const LEADING_CHARS = 200;

/**
 * Derive the session goals from the user blocks.
 *
 * The first user block that yields any goal lines contributes up to 6 of them.
 * After that, a block replaces the pending scope change when its leading text
 * matches the scope-change pattern (up to 3 lines), or matches the task pattern
 * with a first line longer than 15 characters (up to 2 lines). The most recent
 * scope change is appended after a `[Scope change]` marker. At most 8 entries
 * are returned.
 */
export const extractGoals = (blocks: NormalizedBlock[]): string[] => {
  const goals: string[] = [];
  let latestScopeChange: string[] | null = null;
  const clipGoal = (line: string) => clip(line, MAX_GOAL_CHARS);

  for (const block of blocks) {
    if (block.kind !== "user") continue;

    const candidates = truncateAtTemplate(nonEmptyLines(block.text)).filter(isSubstantiveGoal);
    const lines = collapseSkillLines(candidates)
      .map(stripLeadingBullet)
      .filter((line) => line.length > 5);
    if (lines.length === 0) continue;

    if (goals.length === 0) {
      goals.push(...lines.slice(0, 6));
      continue;
    }

    const leading = block.text.slice(0, LEADING_CHARS);
    if (SCOPE_CHANGE_RE.test(leading)) {
      latestScopeChange = lines.slice(0, 3).map(clipGoal);
    } else if (TASK_RE.test(leading) && lines[0].length > 15) {
      latestScopeChange = lines.slice(0, 2).map(clipGoal);
    }
  }

  // Emit the marker only when there are lines to put under it.
  if (latestScopeChange !== null && latestScopeChange.length > 0) {
    goals.push("[Scope change]", ...latestScopeChange);
  }

  return goals.slice(0, 8);
};
@@ -0,0 +1,55 @@
1
+ import type { NormalizedBlock } from "../types";
2
+ import { clip, nonEmptyLines } from "../core/content";
3
+
4
/**
 * Patterns that mark a line as a user preference. Each one requires a clear
 * preference construction ("prefer X", "always use ...", "style: ...") rather
 * than a bare keyword.
 */
const PREF_PATTERNS = [
  /\bprefer(?:s|red|ring)?\s+\w/i,
  /\bdon'?t want\b/i,
  /\balways (?:use|do|run|prefer|keep|make|format|write|add|set|put|prefix|start|include|append)\b/i,
  /\bnever (?:use|do|run|push|commit|write|ignore|add|set|put|remove|delete|include|deploy)\b/i,
  /\bplease (?:use|avoid|keep|make|don'?t|do not|format|write)\b/i,
  /\b(?:style|format|language|naming)\s*[:=]\s*\S/i,
];
13
+
14
/**
 * Collect user preference statements from the user blocks.
 *
 * A line qualifies when it is 5 to 200 characters long after trimming, is not a
 * question, and matches one of the preference patterns. Duplicates are dropped
 * case-insensitively. At most one preference is taken per user block, so a long
 * pasted rule list does not become many preferences. The first 10 are returned.
 */
export const extractPreferences = (blocks: NormalizedBlock[]): string[] => {
  const prefs: string[] = [];
  const seen = new Set<string>();

  for (const block of blocks) {
    if (block.kind !== "user") continue;

    for (const line of nonEmptyLines(block.text)) {
      const candidate = line.trim();
      if (candidate.length < 5 || candidate.length > 200) continue;
      // Questions are not preferences.
      if (candidate.endsWith("?") || candidate.includes("?...")) continue;
      if (!PREF_PATTERNS.some((pattern) => pattern.test(candidate))) continue;

      const clipped = clip(candidate, 200);
      const key = clipped.toLowerCase();
      if (seen.has(key)) continue;
      seen.add(key);
      prefs.push(clipped);

      // One accepted preference per user block is the cap.
      break;
    }
  }

  return prefs.slice(0, 10);
};
43
+
44
/**
 * Drop every preference whose text equals a goal once both are trimmed and
 * lower-cased. Called by `buildSections` so the two sections do not overlap.
 */
export const dedupPreferencesAgainstGoals = (
  prefs: string[],
  goals: string[],
): string[] => {
  const goalKeys = new Set<string>();
  for (const goal of goals) goalKeys.add(goal.trim().toLowerCase());
  return prefs.filter((pref) => !goalKeys.has(pref.trim().toLowerCase()));
};