ultimate-pi 0.1.0 → 0.1.3

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (509) hide show
  1. package/.agents/skills/ck-search/SKILL.md +99 -0
  2. package/.agents/skills/defuddle/SKILL.md +90 -0
  3. package/.agents/skills/find-skills/SKILL.md +142 -0
  4. package/.agents/skills/firecrawl/SKILL.md +150 -0
  5. package/.agents/skills/firecrawl/rules/install.md +82 -0
  6. package/.agents/skills/firecrawl/rules/security.md +26 -0
  7. package/.agents/skills/firecrawl-agent/SKILL.md +57 -0
  8. package/.agents/skills/firecrawl-build-interact/SKILL.md +67 -0
  9. package/.agents/skills/firecrawl-build-onboarding/SKILL.md +102 -0
  10. package/.agents/skills/firecrawl-build-onboarding/references/auth-flow.md +39 -0
  11. package/.agents/skills/firecrawl-build-onboarding/references/project-setup.md +20 -0
  12. package/.agents/skills/firecrawl-build-onboarding/references/sdk-installation.md +17 -0
  13. package/.agents/skills/firecrawl-build-scrape/SKILL.md +68 -0
  14. package/.agents/skills/firecrawl-build-search/SKILL.md +68 -0
  15. package/.agents/skills/firecrawl-crawl/SKILL.md +58 -0
  16. package/.agents/skills/firecrawl-download/SKILL.md +69 -0
  17. package/.agents/skills/firecrawl-interact/SKILL.md +83 -0
  18. package/.agents/skills/firecrawl-map/SKILL.md +50 -0
  19. package/.agents/skills/firecrawl-parse/SKILL.md +61 -0
  20. package/.agents/skills/firecrawl-scrape/SKILL.md +68 -0
  21. package/.agents/skills/firecrawl-search/SKILL.md +59 -0
  22. package/.agents/skills/obsidian-bases/SKILL.md +299 -0
  23. package/.agents/skills/obsidian-markdown/SKILL.md +237 -0
  24. package/.agents/skills/posthog-analyst/SKILL.md +306 -0
  25. package/.agents/skills/posthog-analyst/evals/evals.json +23 -0
  26. package/.agents/skills/wiki/SKILL.md +215 -0
  27. package/.agents/skills/wiki/references/css-snippets.md +122 -0
  28. package/.agents/skills/wiki/references/frontmatter.md +107 -0
  29. package/.agents/skills/wiki/references/git-setup.md +58 -0
  30. package/.agents/skills/wiki/references/mcp-setup.md +149 -0
  31. package/.agents/skills/wiki/references/modes.md +259 -0
  32. package/.agents/skills/wiki/references/plugins.md +96 -0
  33. package/.agents/skills/wiki/references/rest-api.md +124 -0
  34. package/.agents/skills/wiki-autoresearch/SKILL.md +211 -0
  35. package/.agents/skills/wiki-autoresearch/references/program.md +75 -0
  36. package/.agents/skills/wiki-fold/SKILL.md +204 -0
  37. package/.agents/skills/wiki-fold/references/fold-template.md +133 -0
  38. package/.agents/skills/wiki-ingest/SKILL.md +288 -0
  39. package/.agents/skills/wiki-lint/SKILL.md +183 -0
  40. package/.agents/skills/wiki-query/SKILL.md +176 -0
  41. package/.agents/skills/wiki-save/SKILL.md +128 -0
  42. package/.ckignore +41 -0
  43. package/.env.example +9 -0
  44. package/.github/banner-v2.png +0 -0
  45. package/.github/workflows/lint.yml +33 -0
  46. package/.github/workflows/publish-github-packages.yml +35 -0
  47. package/.github/workflows/publish-npm.yml +32 -0
  48. package/.pi/SYSTEM.md +107 -40
  49. package/.pi/agents/pi-pi/agent-expert.md +205 -0
  50. package/.pi/agents/pi-pi/cli-expert.md +47 -0
  51. package/.pi/agents/pi-pi/config-expert.md +67 -0
  52. package/.pi/agents/pi-pi/ext-expert.md +53 -0
  53. package/.pi/agents/pi-pi/keybinding-expert.md +123 -0
  54. package/.pi/agents/pi-pi/pi-orchestrator.md +103 -0
  55. package/.pi/agents/pi-pi/prompt-expert.md +83 -0
  56. package/.pi/agents/pi-pi/skill-expert.md +52 -0
  57. package/.pi/agents/pi-pi/theme-expert.md +46 -0
  58. package/.pi/agents/pi-pi/tui-expert.md +100 -0
  59. package/.pi/agents/rethink.md +140 -0
  60. package/.pi/agents/wiki-ingest.md +67 -0
  61. package/.pi/agents/wiki-lint.md +75 -0
  62. package/.pi/auto-commit.json +20 -0
  63. package/.pi/extensions/banner.png +0 -0
  64. package/.pi/extensions/ck-enforce.ts +216 -0
  65. package/.pi/extensions/custom-footer.ts +308 -0
  66. package/.pi/extensions/custom-header.ts +116 -0
  67. package/.pi/extensions/dotenv-loader.ts +170 -0
  68. package/.pi/internal/cursor-sdk-transcript-parser.ts +59 -0
  69. package/.pi/model-router.json +95 -0
  70. package/.pi/npm/.gitignore +2 -0
  71. package/.pi/prompts/git-sync.md +124 -0
  72. package/.pi/prompts/harness-setup.md +509 -0
  73. package/.pi/prompts/save.md +16 -0
  74. package/.pi/prompts/wiki-autoresearch.md +19 -0
  75. package/.pi/prompts/wiki.md +23 -0
  76. package/.pi/providers/cursor-sdk-provider.test.mjs +476 -0
  77. package/.pi/providers/cursor-sdk-provider.ts +1085 -0
  78. package/.pi/settings.json +14 -4
  79. package/.pi/skills/agent-router/SKILL.md +174 -0
  80. package/.pi/sounds/alert/1-kaching-track.mp3 +0 -0
  81. package/.pi/sounds/error/1-ksi-wth-track.mp3 +0 -0
  82. package/.pi/sounds/error/2-smash-track.mp3 +0 -0
  83. package/.pi/sounds/error/3-buzzer-track.mp3 +0 -0
  84. package/.pi/sounds/notification/1-soft-notification-track.mp3 +0 -0
  85. package/.pi/sounds/project-sounds.json +25 -0
  86. package/.pi/sounds/reminder/1-soft-notification-track.mp3 +0 -0
  87. package/.pi/sounds/success/1-tada-track.mp3 +0 -0
  88. package/.pi/sounds/success/2-jobs-done-track.mp3 +0 -0
  89. package/.pi/sounds/success/3-yay-track.mp3 +0 -0
  90. package/CONTRIBUTING.md +116 -0
  91. package/README.md +33 -40
  92. package/biome.json +34 -0
  93. package/firecrawl/.env.template +58 -0
  94. package/firecrawl/README.md +49 -0
  95. package/firecrawl/docker-compose.yaml +201 -0
  96. package/firecrawl/searxng/searxng.env +3 -0
  97. package/firecrawl/searxng/settings.yml +85 -0
  98. package/lefthook.yml +8 -0
  99. package/package.json +55 -16
  100. package/vault/AGENTS.md +37 -0
  101. package/vault/wiki/_templates/comparison.md +39 -0
  102. package/vault/wiki/_templates/concept.md +40 -0
  103. package/vault/wiki/_templates/decision.md +21 -0
  104. package/vault/wiki/_templates/entity.md +32 -0
  105. package/vault/wiki/_templates/flow.md +14 -0
  106. package/vault/wiki/_templates/module.md +18 -0
  107. package/vault/wiki/_templates/question.md +31 -0
  108. package/vault/wiki/_templates/source.md +39 -0
  109. package/vault/wiki/concepts/AST-Aware Code Chunking.md +44 -0
  110. package/vault/wiki/concepts/Build-Time Prompt Compilation.md +107 -0
  111. package/vault/wiki/concepts/Context Engine (AI Coding).md +47 -0
  112. package/vault/wiki/concepts/Context-Aware System Reminders.md +61 -0
  113. package/vault/wiki/concepts/Contextualized Text Embedding.md +42 -0
  114. package/vault/wiki/concepts/Contractor vs Employee AI Model.md +55 -0
  115. package/vault/wiki/concepts/Dual-Model Agent Architecture.md +65 -0
  116. package/vault/wiki/concepts/Late Chunking vs Early Chunking.md +43 -0
  117. package/vault/wiki/concepts/Majority Vote Ensembling.md +68 -0
  118. package/vault/wiki/concepts/Meta-Harness.md +16 -0
  119. package/vault/wiki/concepts/Multi-Agent AI Coding Architecture.md +75 -0
  120. package/vault/wiki/concepts/Prompt Enhancement.md +90 -0
  121. package/vault/wiki/concepts/Prompt Renderer.md +89 -0
  122. package/vault/wiki/concepts/Semantic Codebase Indexing.md +67 -0
  123. package/vault/wiki/concepts/additive-config-hierarchy.md +16 -0
  124. package/vault/wiki/concepts/agent-artifacts-verifiable-deliverables.md +71 -0
  125. package/vault/wiki/concepts/agent-browser-browser-automation.md +99 -0
  126. package/vault/wiki/concepts/agent-codebase-interface.md +43 -0
  127. package/vault/wiki/concepts/agent-harness-architecture.md +67 -0
  128. package/vault/wiki/concepts/agent-loop-detection-patterns.md +133 -0
  129. package/vault/wiki/concepts/agent-search-enforcement.md +126 -0
  130. package/vault/wiki/concepts/agent-skills-ecosystem.md +74 -0
  131. package/vault/wiki/concepts/agent-skills-pattern.md +68 -0
  132. package/vault/wiki/concepts/agentic-harness-context-enforcement.md +91 -0
  133. package/vault/wiki/concepts/agentic-harness.md +34 -0
  134. package/vault/wiki/concepts/agentic-orchestration-pipeline.md +56 -0
  135. package/vault/wiki/concepts/agentic-search-no-embeddings.md +18 -0
  136. package/vault/wiki/concepts/anthropic-context-engineering.md +13 -0
  137. package/vault/wiki/concepts/antigravity-agent-first-architecture.md +61 -0
  138. package/vault/wiki/concepts/ast-compression.md +19 -0
  139. package/vault/wiki/concepts/ast-truncation.md +66 -0
  140. package/vault/wiki/concepts/barrel-files.md +37 -0
  141. package/vault/wiki/concepts/browser-harness-agent.md +41 -0
  142. package/vault/wiki/concepts/browser-subagent-visual-verification.md +82 -0
  143. package/vault/wiki/concepts/codebase-intelligence-ecosystem-comparison.md +192 -0
  144. package/vault/wiki/concepts/codebase-intelligence-harness-integration.md +161 -0
  145. package/vault/wiki/concepts/codebase-to-context-ingestion.md +46 -0
  146. package/vault/wiki/concepts/codex-harness-innovations.md +147 -0
  147. package/vault/wiki/concepts/consensus-debate-flow.md +17 -0
  148. package/vault/wiki/concepts/consensus-debate.md +206 -0
  149. package/vault/wiki/concepts/content-addressed-spec-identity.md +166 -0
  150. package/vault/wiki/concepts/context-anxiety.md +57 -0
  151. package/vault/wiki/concepts/context-compression-techniques.md +19 -0
  152. package/vault/wiki/concepts/context-continuity.md +22 -0
  153. package/vault/wiki/concepts/context-drift-in-agents.md +106 -0
  154. package/vault/wiki/concepts/context-engineering.md +62 -0
  155. package/vault/wiki/concepts/context-folding.md +67 -0
  156. package/vault/wiki/concepts/context-mode.md +38 -0
  157. package/vault/wiki/concepts/cursor-harness-innovations.md +107 -0
  158. package/vault/wiki/concepts/deterministic-session-compaction.md +79 -0
  159. package/vault/wiki/concepts/drift-detection-unified.md +296 -0
  160. package/vault/wiki/concepts/execution-feedback-loop.md +46 -0
  161. package/vault/wiki/concepts/feedforward-feedback-harness.md +60 -0
  162. package/vault/wiki/concepts/five-root-cause-metrics-sentrux.md +40 -0
  163. package/vault/wiki/concepts/fork-safe-spec-storage.md +89 -0
  164. package/vault/wiki/concepts/fts5-sandbox.md +19 -0
  165. package/vault/wiki/concepts/fuzzy-edit-matching.md +71 -0
  166. package/vault/wiki/concepts/gemini-cli-architecture.md +104 -0
  167. package/vault/wiki/concepts/generator-evaluator-architecture.md +64 -0
  168. package/vault/wiki/concepts/guardian-agent-pattern.md +67 -0
  169. package/vault/wiki/concepts/harness-configuration-layers.md +89 -0
  170. package/vault/wiki/concepts/harness-control-frameworks.md +155 -0
  171. package/vault/wiki/concepts/harness-engineering-first-principles.md +90 -0
  172. package/vault/wiki/concepts/harness-h-formalism.md +53 -0
  173. package/vault/wiki/concepts/hybrid-code-search.md +61 -0
  174. package/vault/wiki/concepts/inline-post-edit-validation.md +112 -0
  175. package/vault/wiki/concepts/legendary-engineering-patterns-harness.md +110 -0
  176. package/vault/wiki/concepts/lifecycle-hooks.md +94 -0
  177. package/vault/wiki/concepts/mcp-tool-routing.md +102 -0
  178. package/vault/wiki/concepts/memory-system-of-record-vs-ephemeral-cache.md +47 -0
  179. package/vault/wiki/concepts/meta-agent-context-pruning.md +151 -0
  180. package/vault/wiki/concepts/model-adaptive-harness.md +122 -0
  181. package/vault/wiki/concepts/model-routing-agents.md +101 -0
  182. package/vault/wiki/concepts/monorepo-architecture.md +45 -0
  183. package/vault/wiki/concepts/multi-agent-specialization.md +61 -0
  184. package/vault/wiki/concepts/permission-subsystem.md +16 -0
  185. package/vault/wiki/concepts/pi-messenger-analysis.md +243 -0
  186. package/vault/wiki/concepts/pi-vscode-extension-landscape.md +37 -0
  187. package/vault/wiki/concepts/policy-engine-pattern.md +78 -0
  188. package/vault/wiki/concepts/progressive-disclosure-agents.md +53 -0
  189. package/vault/wiki/concepts/progressive-skill-disclosure.md +17 -0
  190. package/vault/wiki/concepts/provider-native-prompting.md +203 -0
  191. package/vault/wiki/concepts/quality-signal-sentrux.md +37 -0
  192. package/vault/wiki/concepts/repo-map-ranking.md +42 -0
  193. package/vault/wiki/concepts/result-monad-error-handling.md +47 -0
  194. package/vault/wiki/concepts/safety-defense-in-depth.md +83 -0
  195. package/vault/wiki/concepts/sandbox-os-enforcement.md +18 -0
  196. package/vault/wiki/concepts/selective-debate-routing.md +70 -0
  197. package/vault/wiki/concepts/self-evolving-harness.md +60 -0
  198. package/vault/wiki/concepts/sentrux-mcp-integration.md +36 -0
  199. package/vault/wiki/concepts/sentrux-rules-engine.md +49 -0
  200. package/vault/wiki/concepts/shell-pattern-compression.md +24 -0
  201. package/vault/wiki/concepts/skill-first-architecture.md +166 -0
  202. package/vault/wiki/concepts/structured-compaction.md +78 -0
  203. package/vault/wiki/concepts/subagent-orchestration.md +17 -0
  204. package/vault/wiki/concepts/subagent-worktree-isolation.md +68 -0
  205. package/vault/wiki/concepts/superpowers-methodology.md +78 -0
  206. package/vault/wiki/concepts/think-in-code.md +73 -0
  207. package/vault/wiki/concepts/ts-execution-layer.md +100 -0
  208. package/vault/wiki/concepts/typescript-strict-mode.md +37 -0
  209. package/vault/wiki/concepts/vcc-conversation-compaction-for-pi.md +51 -0
  210. package/vault/wiki/concepts/verification-drift-detection.md +19 -0
  211. package/vault/wiki/consensus/consensus-records.md +58 -0
  212. package/vault/wiki/decisions/2026-04-30-pi-lean-ctx-native.md +122 -0
  213. package/vault/wiki/decisions/adr-008.md +40 -0
  214. package/vault/wiki/decisions/adr-009.md +46 -0
  215. package/vault/wiki/decisions/adr-010.md +55 -0
  216. package/vault/wiki/decisions/adr-011.md +165 -0
  217. package/vault/wiki/decisions/adr-012.md +102 -0
  218. package/vault/wiki/decisions/adr-013.md +59 -0
  219. package/vault/wiki/decisions/adr-014.md +73 -0
  220. package/vault/wiki/decisions/adr-015.md +81 -0
  221. package/vault/wiki/decisions/adr-016.md +91 -0
  222. package/vault/wiki/decisions/adr-017.md +79 -0
  223. package/vault/wiki/decisions/adr-018.md +100 -0
  224. package/vault/wiki/decisions/adr-019.md +75 -0
  225. package/vault/wiki/decisions/adr-020.md +106 -0
  226. package/vault/wiki/decisions/adr-021.md +86 -0
  227. package/vault/wiki/decisions/adr-022.md +113 -0
  228. package/vault/wiki/decisions/adr-023.md +113 -0
  229. package/vault/wiki/decisions/adr-024.md +73 -0
  230. package/vault/wiki/decisions/adr-025.md +130 -0
  231. package/vault/wiki/decisions/adr-026.md +56 -0
  232. package/vault/wiki/decisions/colocate-wiki.md +34 -0
  233. package/vault/wiki/entities/Anders Hejlsberg.md +29 -0
  234. package/vault/wiki/entities/Anthropic.md +17 -0
  235. package/vault/wiki/entities/Augment Code.md +49 -0
  236. package/vault/wiki/entities/Bjarne Stroustrup.md +26 -0
  237. package/vault/wiki/entities/Bolt.new (StackBlitz).md +39 -0
  238. package/vault/wiki/entities/Boris Cherny.md +11 -0
  239. package/vault/wiki/entities/Claude Code.md +19 -0
  240. package/vault/wiki/entities/Dennis Ritchie.md +26 -0
  241. package/vault/wiki/entities/Emergent Labs.md +32 -0
  242. package/vault/wiki/entities/Google Cloud.md +16 -0
  243. package/vault/wiki/entities/Guido van Rossum.md +28 -0
  244. package/vault/wiki/entities/Ken Thompson.md +28 -0
  245. package/vault/wiki/entities/Lee et al.md +16 -0
  246. package/vault/wiki/entities/Linus Torvalds.md +28 -0
  247. package/vault/wiki/entities/Lovable (company).md +40 -0
  248. package/vault/wiki/entities/Martin Fowler.md +16 -0
  249. package/vault/wiki/entities/Meng et al.md +16 -0
  250. package/vault/wiki/entities/OpenAI.md +16 -0
  251. package/vault/wiki/entities/Rocket.new.md +38 -0
  252. package/vault/wiki/entities/VILA-Lab.md +15 -0
  253. package/vault/wiki/entities/autodev-codebase.md +18 -0
  254. package/vault/wiki/entities/ck-tool.md +59 -0
  255. package/vault/wiki/entities/codesearch.md +18 -0
  256. package/vault/wiki/entities/disler-indydevdan.md +33 -0
  257. package/vault/wiki/entities/gsd-get-shit-done.md +56 -0
  258. package/vault/wiki/entities/javascript-runtimes.md +48 -0
  259. package/vault/wiki/entities/jesse-vincent.md +38 -0
  260. package/vault/wiki/entities/lean-ctx.md +32 -0
  261. package/vault/wiki/entities/opendev.md +41 -0
  262. package/vault/wiki/entities/ops-codegraph-tool.md +18 -0
  263. package/vault/wiki/entities/pi-coding-agent.md +53 -0
  264. package/vault/wiki/entities/sentrux.md +54 -0
  265. package/vault/wiki/entities/vgrep-tool.md +57 -0
  266. package/vault/wiki/entities/vitest.md +41 -0
  267. package/vault/wiki/flows/harness-wiki-pipeline.md +204 -0
  268. package/vault/wiki/hot.md +932 -0
  269. package/vault/wiki/index.md +437 -0
  270. package/vault/wiki/log.md +418 -0
  271. package/vault/wiki/meta/dashboard.md +30 -0
  272. package/vault/wiki/meta/lint-report-2026-04-30.md +86 -0
  273. package/vault/wiki/meta/lint-report-2026-05-02.md +251 -0
  274. package/vault/wiki/meta/overview.canvas +43 -0
  275. package/vault/wiki/modules/adversarial-verification.md +57 -0
  276. package/vault/wiki/modules/automated-observability.md +54 -0
  277. package/vault/wiki/modules/bench.md +20 -0
  278. package/vault/wiki/modules/extensions.md +23 -0
  279. package/vault/wiki/modules/grounding-checkpoints.md +62 -0
  280. package/vault/wiki/modules/harness-implementation-plan.md +345 -0
  281. package/vault/wiki/modules/harness-wiki-skill-mapping.md +135 -0
  282. package/vault/wiki/modules/harness.md +86 -0
  283. package/vault/wiki/modules/persistent-memory.md +85 -0
  284. package/vault/wiki/modules/schema-orchestration.md +68 -0
  285. package/vault/wiki/modules/skills.md +27 -0
  286. package/vault/wiki/modules/spec-hardening.md +58 -0
  287. package/vault/wiki/modules/structured-planning.md +53 -0
  288. package/vault/wiki/modules/think-in-code-enforcement.md +153 -0
  289. package/vault/wiki/modules/wiki-query-interface.md +64 -0
  290. package/vault/wiki/overview.md +51 -0
  291. package/vault/wiki/questions/Research-pi-vs-claude-code-agentic-orchestration-pipeline.md +87 -0
  292. package/vault/wiki/questions/Research-sentrux-dev.md +123 -0
  293. package/vault/wiki/questions/Research-superpowers-skill-for-agentic-coding-agents.md +164 -0
  294. package/vault/wiki/questions/Research: Augment Code Context Engine.md +244 -0
  295. package/vault/wiki/questions/Research: Automating Software Engineering - Lovable, Bolt, Emergent, Rocket.md +112 -0
  296. package/vault/wiki/questions/Research: Claude Code State-of-the-Art Harness Improvements.md +209 -0
  297. package/vault/wiki/questions/Research: Codex State-of-the-Art Harness Improvements.md +99 -0
  298. package/vault/wiki/questions/Research: Engineering Workflows of Legendary Programmers and AI Harness Mapping.md +107 -0
  299. package/vault/wiki/questions/Research: Fallow Codebase Intelligence Harness Integration.md +72 -0
  300. package/vault/wiki/questions/Research: Gemini CLI SOTA Harness Integration.md +166 -0
  301. package/vault/wiki/questions/Research: GitHub Issues as Harness Spec Storage.md +188 -0
  302. package/vault/wiki/questions/Research: Google Antigravity Harness Integration.md +120 -0
  303. package/vault/wiki/questions/Research: Meta-Agent Context Drift Detection.md +236 -0
  304. package/vault/wiki/questions/Research: Model-Adaptive Agent Harness Design.md +95 -0
  305. package/vault/wiki/questions/Research: Model-Specific Prompting Guides.md +165 -0
  306. package/vault/wiki/questions/Research: Prompt Renderer for Multi-Model Agent Harness.md +216 -0
  307. package/vault/wiki/questions/Research: Skill-First Harness Architecture.md +91 -0
  308. package/vault/wiki/questions/Research: TypeScript Best Practices and Codebase Structure.md +88 -0
  309. package/vault/wiki/questions/Research: TypeScript Execution Layer for Agent Tool Calling.md +81 -0
  310. package/vault/wiki/questions/Research: claude-mem over Obsidian for Harness Layer.md +71 -0
  311. package/vault/wiki/questions/Research: claude-mem over obsidian wiki as the knowledge base for our agentic harness pipeline. think from first principles. does this replace or complement our current setup? no hard feelings about previous decisions. gimme accurate points.md +80 -0
  312. package/vault/wiki/questions/Research: context-mode vs lean-ctx.md +72 -0
  313. package/vault/wiki/questions/Research: cursor.sh Harness Innovations.md +92 -0
  314. package/vault/wiki/questions/Research: executor.sh Harness Integration.md +170 -0
  315. package/vault/wiki/questions/Research: how GSD fits into our coding harness setup.md +97 -0
  316. package/vault/wiki/questions/Research: how claude-mem fits into our workflow. and whether it should replace obsidian in the codebase. no hard feelings about previous actions, rethink from first principles always.md +80 -0
  317. package/vault/wiki/questions/Research: pi-vcc.md +113 -0
  318. package/vault/wiki/questions/Research: semantic code search tools.md +69 -0
  319. package/vault/wiki/questions/Research: vcc extension for pi coding agent.md +73 -0
  320. package/vault/wiki/questions/how-to-enable-semantic-code-search-now.md +111 -0
  321. package/vault/wiki/questions/mvp-implementation-blueprint.md +552 -0
  322. package/vault/wiki/questions/research-agent-first-codebase-exploration.md +199 -0
  323. package/vault/wiki/questions/research-agentic-coding-harness-latest-papers.md +142 -0
  324. package/vault/wiki/questions/research-gitingest-gitreverse-integration.md +100 -0
  325. package/vault/wiki/questions/research-wozcode-token-reduction.md +67 -0
  326. package/vault/wiki/questions/resolved-context-pruning-inplace-vs-restart.md +95 -0
  327. package/vault/wiki/questions/resolved-context-window-economics.md +167 -0
  328. package/vault/wiki/questions/resolved-imad-debate-gating-transfer.md +126 -0
  329. package/vault/wiki/questions/resolved-mcp-tool-preference.md +112 -0
  330. package/vault/wiki/questions/resolved-small-model-meta-agents.md +107 -0
  331. package/vault/wiki/questions/resolved-treesitter-dynamic-languages.md +95 -0
  332. package/vault/wiki/sources/Auggie Context MCP Server.md +63 -0
  333. package/vault/wiki/sources/Augment Code Codacy AI Giants.md +61 -0
  334. package/vault/wiki/sources/Augment Code MCP SiliconAngle.md +49 -0
  335. package/vault/wiki/sources/Augment Code WorkOS ERC 2025.md +55 -0
  336. package/vault/wiki/sources/Augment Context Engine Official.md +71 -0
  337. package/vault/wiki/sources/Augment SWE-bench Agent GitHub.md +74 -0
  338. package/vault/wiki/sources/Augment SWE-bench Pro Blog.md +58 -0
  339. package/vault/wiki/sources/Source: AgentBus Jinja2 Prompt Pipelines.md +75 -0
  340. package/vault/wiki/sources/Source: Arxiv — Don't Break the Cache.md +85 -0
  341. package/vault/wiki/sources/Source: Augment - Harness Engineering for AI Coding Agents.md +58 -0
  342. package/vault/wiki/sources/Source: Blake Crosley Agent Architecture Guide.md +100 -0
  343. package/vault/wiki/sources/Source: Bolt.new Architecture & Case Study.md +75 -0
  344. package/vault/wiki/sources/Source: Build-Time Prompt Compilation Architecture.md +107 -0
  345. package/vault/wiki/sources/Source: Claude API Agent Skills Overview.md +70 -0
  346. package/vault/wiki/sources/Source: Gemini CLI Changelogs.md +88 -0
  347. package/vault/wiki/sources/Source: Google Blog - Gemini CLI Announcement.md +57 -0
  348. package/vault/wiki/sources/Source: Google Gemini CLI Architecture Docs.md +53 -0
  349. package/vault/wiki/sources/Source: LangChain - Anatomy of Agent Harness.md +65 -0
  350. package/vault/wiki/sources/Source: Lovable Architecture & Clone Analysis.md +83 -0
  351. package/vault/wiki/sources/Source: Martin Fowler - Harness Engineering.md +70 -0
  352. package/vault/wiki/sources/Source: OpenAI Harness Engineering Five Principles.md +58 -0
  353. package/vault/wiki/sources/Source: OpenAI Harness Engineering — 0 Lines of Human Code.md +101 -0
  354. package/vault/wiki/sources/Source: OpenDev — Building AI Coding Agents for the Terminal.md +100 -0
  355. package/vault/wiki/sources/Source: Render AI Coding Agents Benchmark 2025.md +53 -0
  356. package/vault/wiki/sources/Source: Rocket.new — Vibe Solutioning Platform.md +70 -0
  357. package/vault/wiki/sources/Source: SwirlAI Agent Skills Progressive Disclosure.md +71 -0
  358. package/vault/wiki/sources/Source: TianPan Prompt Caching Architecture.md +89 -0
  359. package/vault/wiki/sources/Source: Vercel Labs agent-browser.md +155 -0
  360. package/vault/wiki/sources/Source: browser-harness CDP Harness.md +126 -0
  361. package/vault/wiki/sources/agent-drift-academic-paper.md +79 -0
  362. package/vault/wiki/sources/aider-repomap-tree-sitter.md +42 -0
  363. package/vault/wiki/sources/anthropic-compaction-api.md +58 -0
  364. package/vault/wiki/sources/anthropic-effective-harnesses.md +42 -0
  365. package/vault/wiki/sources/anthropic-prompt-best-practices.md +100 -0
  366. package/vault/wiki/sources/anthropic2026-harness-design.md +63 -0
  367. package/vault/wiki/sources/barrel-files-tkdodo.md +38 -0
  368. package/vault/wiki/sources/birth-of-unix-kernighan-interview.md +57 -0
  369. package/vault/wiki/sources/bockeler2026-harness-engineering.md +69 -0
  370. package/vault/wiki/sources/cast-code-chunking-paper.md +50 -0
  371. package/vault/wiki/sources/ck-semantic-search.md +78 -0
  372. package/vault/wiki/sources/claude-code-architecture-karaxai-2026.md +71 -0
  373. package/vault/wiki/sources/claude-code-architecture-qubytes-2026.md +50 -0
  374. package/vault/wiki/sources/claude-code-architecture-vila-lab-2026.md +64 -0
  375. package/vault/wiki/sources/claude-code-security-architecture-penligent-2026.md +70 -0
  376. package/vault/wiki/sources/claude-context-editing-docs.md +13 -0
  377. package/vault/wiki/sources/cloudflare-codemode.md +63 -0
  378. package/vault/wiki/sources/code-chunk-library-supermemory.md +63 -0
  379. package/vault/wiki/sources/codeact-apple-2024.md +62 -0
  380. package/vault/wiki/sources/codex-dsc-rfc-8573.md +41 -0
  381. package/vault/wiki/sources/codex-open-source-agent-2026.md +110 -0
  382. package/vault/wiki/sources/coir-code-retrieval-benchmark.md +51 -0
  383. package/vault/wiki/sources/colinmcnamara-context-optimization-codemode.md +48 -0
  384. package/vault/wiki/sources/context-folding-paper.md +61 -0
  385. package/vault/wiki/sources/context-mode-website.md +63 -0
  386. package/vault/wiki/sources/cursor-agent-best-practices-2026.md +62 -0
  387. package/vault/wiki/sources/cursor-fork-29b-2025.md +50 -0
  388. package/vault/wiki/sources/cursor-harness-april-2026.md +76 -0
  389. package/vault/wiki/sources/cursor-instant-apply-2024.md +45 -0
  390. package/vault/wiki/sources/cursor-shadow-workspace-2024.md +52 -0
  391. package/vault/wiki/sources/cursor-shipped-coding-agent-2026.md +53 -0
  392. package/vault/wiki/sources/cursor-vs-antigravity-2026.md +51 -0
  393. package/vault/wiki/sources/disler-pi-vs-claude-code.md +69 -0
  394. package/vault/wiki/sources/distill-deterministic-context-compression.md +53 -0
  395. package/vault/wiki/sources/embedding-models-benchmark-supermemory-2025.md +48 -0
  396. package/vault/wiki/sources/executor-rhyssullivan.md +122 -0
  397. package/vault/wiki/sources/fallow-rs-codebase-intelligence.md +125 -0
  398. package/vault/wiki/sources/fan2025-imad.md +60 -0
  399. package/vault/wiki/sources/forgecode-gpt5-agent-improvements.md +63 -0
  400. package/vault/wiki/sources/gemini-3-prompting-guide.md +78 -0
  401. package/vault/wiki/sources/gh-cli-sub-issue-rfc.md +50 -0
  402. package/vault/wiki/sources/gh-sub-issue-extension.md +72 -0
  403. package/vault/wiki/sources/github-fork-issues-discussion.md +44 -0
  404. package/vault/wiki/sources/github-issue-dependencies-docs.md +49 -0
  405. package/vault/wiki/sources/github-sub-issues-docs.md +51 -0
  406. package/vault/wiki/sources/gitingest.md +91 -0
  407. package/vault/wiki/sources/gitreverse.md +63 -0
  408. package/vault/wiki/sources/google-antigravity-official-blog.md +47 -0
  409. package/vault/wiki/sources/google-antigravity-wikipedia.md +53 -0
  410. package/vault/wiki/sources/gsd-codecentric-deep-dive.md +57 -0
  411. package/vault/wiki/sources/gsd-github-repo.md +51 -0
  412. package/vault/wiki/sources/gsd-hn-discussion.md +59 -0
  413. package/vault/wiki/sources/guido-python-design-philosophy.md +56 -0
  414. package/vault/wiki/sources/hejlsberg-7-learnings.md +48 -0
  415. package/vault/wiki/sources/ironclaw-drift-monitor.md +80 -0
  416. package/vault/wiki/sources/langsight-loop-detection.md +80 -0
  417. package/vault/wiki/sources/leanctx-website.md +69 -0
  418. package/vault/wiki/sources/lee2026-meta-harness.md +59 -0
  419. package/vault/wiki/sources/linux-kernel-coding-workflow.md +50 -0
  420. package/vault/wiki/sources/lou2026-autoharness.md +53 -0
  421. package/vault/wiki/sources/martin-fowler-harness-engineering.md +73 -0
  422. package/vault/wiki/sources/mcp-architecture-docs.md +13 -0
  423. package/vault/wiki/sources/meng2026-agent-harness-survey.md +79 -0
  424. package/vault/wiki/sources/mindstudio-four-agent-types.md +68 -0
  425. package/vault/wiki/sources/ms-chat-history-management.md +13 -0
  426. package/vault/wiki/sources/openai-prompt-guidance.md +104 -0
  427. package/vault/wiki/sources/openclaw-session-pruning.md +13 -0
  428. package/vault/wiki/sources/opencode-dcp.md +13 -0
  429. package/vault/wiki/sources/opendev-arxiv-2603.05344v1.md +79 -0
  430. package/vault/wiki/sources/openhands-platform.md +39 -0
  431. package/vault/wiki/sources/oss-guide-codebase-exploration.md +53 -0
  432. package/vault/wiki/sources/pi-compaction-extensions-ecosystem.md +102 -0
  433. package/vault/wiki/sources/pi-context-prune-github-repo.md +38 -0
  434. package/vault/wiki/sources/pi-mono-compaction-docs.md +38 -0
  435. package/vault/wiki/sources/pi-omni-compact-github-repo.md +50 -0
  436. package/vault/wiki/sources/pi-rtk-optimizer-github-repo.md +45 -0
  437. package/vault/wiki/sources/pi-vcc-github-repo.md +69 -0
  438. package/vault/wiki/sources/pi-vscode-marketplace.md +41 -0
  439. package/vault/wiki/sources/pi-vscode-model-provider-marketplace.md +39 -0
  440. package/vault/wiki/sources/py-tree-sitter.md +13 -0
  441. package/vault/wiki/sources/sentrux-dev-landing.md +40 -0
  442. package/vault/wiki/sources/sentrux-docs-pro-architecture.md +75 -0
  443. package/vault/wiki/sources/sentrux-docs-quality-signal.md +46 -0
  444. package/vault/wiki/sources/sentrux-docs-root-cause-metrics.md +57 -0
  445. package/vault/wiki/sources/sentrux-docs-rules-engine.md +58 -0
  446. package/vault/wiki/sources/sentrux-github-repo.md +56 -0
  447. package/vault/wiki/sources/superpowers-github-repo.md +56 -0
  448. package/vault/wiki/sources/superpowers-release-blog.md +54 -0
  449. package/vault/wiki/sources/superpowers-termdock-analysis.md +45 -0
  450. package/vault/wiki/sources/swe-agent-aci.md +42 -0
  451. package/vault/wiki/sources/swe-bench.md +45 -0
  452. package/vault/wiki/sources/swe-pruner-context-pruning.md +13 -0
  453. package/vault/wiki/sources/think-in-code-blog.md +48 -0
  454. package/vault/wiki/sources/tree-sitter-docs.md +13 -0
  455. package/vault/wiki/sources/ts-best-practices-2025-devto.md +42 -0
  456. package/vault/wiki/sources/ts-folder-structure-mingyang.md +58 -0
  457. package/vault/wiki/sources/ts-monorepo-koerselman.md +44 -0
  458. package/vault/wiki/sources/ts-result-error-handling-kkalamarski.md +52 -0
  459. package/vault/wiki/sources/ts-runtimes-comparison-betterstack.md +42 -0
  460. package/vault/wiki/sources/ts-strict-mode-rishikc.md +43 -0
  461. package/vault/wiki/sources/unix-philosophy.md +48 -0
  462. package/vault/wiki/sources/vectara-chunking-vs-embedding-naacl2025.md +39 -0
  463. package/vault/wiki/sources/vectara-guardian-agents.md +79 -0
  464. package/vault/wiki/sources/vgrep-semantic-search.md +76 -0
  465. package/vault/wiki/sources/vitest-official.md +41 -0
  466. package/vault/wiki/sources/vscode-pi-community-extension.md +40 -0
  467. package/vault/wiki/sources/wozcode.md +79 -0
  468. package/.agents/skills/compress/SKILL.md +0 -111
  469. package/.agents/skills/compress/scripts/__init__.py +0 -9
  470. package/.agents/skills/compress/scripts/__main__.py +0 -3
  471. package/.agents/skills/compress/scripts/benchmark.py +0 -78
  472. package/.agents/skills/compress/scripts/cli.py +0 -73
  473. package/.agents/skills/compress/scripts/compress.py +0 -227
  474. package/.agents/skills/compress/scripts/detect.py +0 -121
  475. package/.agents/skills/compress/scripts/validate.py +0 -189
  476. package/.agents/skills/emil-design-eng/SKILL.md +0 -679
  477. package/.agents/skills/lean-ctx/SKILL.md +0 -149
  478. package/.agents/skills/lean-ctx/scripts/install.sh +0 -95
  479. package/.agents/skills/scrapling-official/LICENSE.txt +0 -28
  480. package/.agents/skills/scrapling-official/SKILL.md +0 -390
  481. package/.agents/skills/scrapling-official/examples/01_fetcher_session.py +0 -26
  482. package/.agents/skills/scrapling-official/examples/02_dynamic_session.py +0 -26
  483. package/.agents/skills/scrapling-official/examples/03_stealthy_session.py +0 -26
  484. package/.agents/skills/scrapling-official/examples/04_spider.py +0 -58
  485. package/.agents/skills/scrapling-official/examples/README.md +0 -45
  486. package/.agents/skills/scrapling-official/references/fetching/choosing.md +0 -78
  487. package/.agents/skills/scrapling-official/references/fetching/dynamic.md +0 -352
  488. package/.agents/skills/scrapling-official/references/fetching/static.md +0 -432
  489. package/.agents/skills/scrapling-official/references/fetching/stealthy.md +0 -255
  490. package/.agents/skills/scrapling-official/references/mcp-server.md +0 -214
  491. package/.agents/skills/scrapling-official/references/migrating_from_beautifulsoup.md +0 -86
  492. package/.agents/skills/scrapling-official/references/parsing/adaptive.md +0 -212
  493. package/.agents/skills/scrapling-official/references/parsing/main_classes.md +0 -586
  494. package/.agents/skills/scrapling-official/references/parsing/selection.md +0 -494
  495. package/.agents/skills/scrapling-official/references/spiders/advanced.md +0 -344
  496. package/.agents/skills/scrapling-official/references/spiders/architecture.md +0 -94
  497. package/.agents/skills/scrapling-official/references/spiders/getting-started.md +0 -164
  498. package/.agents/skills/scrapling-official/references/spiders/proxy-blocking.md +0 -235
  499. package/.agents/skills/scrapling-official/references/spiders/requests-responses.md +0 -196
  500. package/.agents/skills/scrapling-official/references/spiders/sessions.md +0 -205
  501. package/.github/banner.png +0 -0
  502. package/PLAN.md +0 -11
  503. package/extensions/lean-ctx-enforce.ts +0 -166
  504. package/skills-lock.json +0 -35
  505. package/wiki/README.md +0 -10
  506. package/wiki/decisions/0001-establish-project-wiki-and-decision-record-format.md +0 -25
  507. package/wiki/decisions/0002-add-project-banner-to-readme.md +0 -26
  508. package/wiki/decisions/0003-remove-redundant-readme-title-heading.md +0 -26
  509. package/wiki/decisions/0004-publish-package-to-npm-as-ultimate-pi.md +0 -26
@@ -0,0 +1,51 @@
1
+ ---
2
+ type: source
3
+ status: ingested
4
+ source_type: documentation
5
+ title: "GitHub Sub-Issues — Official Documentation"
6
+ author: GitHub Docs
7
+ date_published: 2025-04-11
8
+ url: https://docs.github.com/en/issues/tracking-your-work-with-issues/using-issues/adding-sub-issues
9
+ confidence: high
10
+ key_claims:
11
+ - "Sub-issues allow breaking larger issues into smaller tasks, available since April 2025"
12
+ - "Up to 100 sub-issues per parent issue and up to 8 levels of nested sub-issues"
13
+ - "Parent issue and sub-issue progress is available in GitHub Projects (filter, group, views)"
14
+ - "Sub-issues can themselves contain sub-issues (full hierarchies)"
15
+ - "Cross-repository sub-issues supported"
16
+ - "Requires at least triage permissions"
17
+ tags:
18
+ - github
19
+ - issues
20
+ - sub-issues
21
+ - project-management
22
+ related:
23
+ - "[[Research: GitHub Issues as Harness Spec Storage]]"
24
+ created: 2026-05-02
25
+ updated: 2026-05-02
26
+ ---
27
+ # GitHub Sub-Issues — Official Documentation
28
+
29
+ GitHub's official documentation for the sub-issues feature, launched in April 2025.
30
+
31
+ ## Key Capabilities
32
+
33
+ - **Parent-child hierarchies**: Break larger issues into manageable tasks
34
+ - **Depth**: Up to 8 levels of nesting
35
+ - **Breadth**: Up to 100 sub-issues per parent
36
+ - **Cross-repo**: Sub-issues can live in different repositories
37
+ - **Projects integration**: Progress fields, filters, grouping by parent issue
38
+ - **Two creation modes**: Create new sub-issue inline, or add existing issue as child
39
+
40
+ ## API Layer
41
+
42
+ Sub-issues are exposed through GitHub's GraphQL API with dedicated fields:
43
+ - `subIssues` — list of child issues
44
+ - `parent` — parent issue reference
45
+ - `subIssuesSummary` — aggregate progress (total, completed, not_planned)
46
+
47
+ The REST API also supports sub-issue relationships through the issues endpoint with parent/child fields.
48
+
49
+ ## Relevance to Harness
50
+
51
+ This is the canonical cloud storage mechanism for spec decomposition. Each hardened spec (L1) becomes a parent issue; each task from structured planning (L2) becomes a sub-issue. Progress auto-rolls up from children to parent.
@@ -0,0 +1,91 @@
1
+ ---
2
+ type: source
3
+ source_type: tool
4
+ name: Gitingest
5
+ author: coderamp-labs
6
+ date_published: 2025
7
+ url: https://gitingest.com
8
+ repo: https://github.com/coderamp-labs/gitingest
9
+ confidence: high
10
+ key_claims:
11
+ - "Turn any Git repository into a simple text digest of its codebase"
12
+ - "Replace 'hub' with 'ingest' in any GitHub URL for prompt-friendly text"
13
+ - Supports public and private repos (via PAT)
14
+ - Pattern include/exclude filtering, file size limits
15
+ - Python package (`pip install gitingest`), CLI, Chrome extension, web UI
16
+ - Output: summary + directory tree + file contents with clear delimiters
17
+ tags:
18
+ - codebase-ingestion
19
+ - llm-context
20
+ - tool
21
+ created: 2026-04-30
22
+ updated: 2026-04-30
23
+ status: ingested
24
+ title: "Gitingest"
25
+ ---
26
+ # Gitingest
27
+
28
+ ## What It Is
29
+
30
+ Gitingest converts a Git repository into structured plaintext suitable for feeding into an LLM. It clones the repo, extracts all files, and produces a three-part output:
31
+
32
+ 1. **Summary**: Natural language description of the repo
33
+ 2. **Directory tree**: Hierarchical view of file structure
34
+ 3. **File contents**: Every file wrapped in `=== FILE: path ===` markers
35
+
36
+ ## How It Works
37
+
38
+ - Clones the repository (or reads local directory)
39
+ - Applies pattern filters (include/exclude globs)
40
+ - Applies file size limits (skip files above threshold)
41
+ - Generates summary based on repo metadata and structure
42
+ - Outputs as structured plaintext
43
+
44
+ For private repos, a GitHub Personal Access Token (PAT) is used once for cloning and then discarded. Cloned repos are deleted after processing.
45
+
46
+ ## Output Format
47
+
48
+ ```
49
+ ===============================================
50
+ SUMMARY
51
+ ===============================================
52
+ [Repository description]
53
+
54
+ ===============================================
55
+ DIRECTORY STRUCTURE
56
+ ===============================================
57
+ repo/
58
+ ├── src/
59
+ │ ├── main.py
60
+ │ └── utils.py
61
+ ├── tests/
62
+ └── README.md
63
+
64
+ ===============================================
65
+ FILE: src/main.py
66
+ ===============================================
67
+ [file contents]
68
+ ===============================================
69
+ FILE: README.md
70
+ ===============================================
71
+ [file contents]
72
+ ```
73
+
74
+ ## Integration Surface
75
+
76
+ - **Python API**: `from gitingest import ingest` → `(summary, tree, content)`
77
+ - **CLI**: `gitingest <url> -o - | your_ai_processor`
78
+ - **Web**: https://gitingest.com/owner/repo
79
+ - **Async**: `from gitingest import ingest_async` for Jupyter/async contexts
80
+ - **Environment variables**: `GITHUB_TOKEN`, `GITINGEST_SENTRY_ENABLED`
81
+
82
+ ## Stack
83
+
84
+ - Backend: FastAPI + Jinja2
85
+ - Frontend: Tailwind CSS
86
+ - Token estimation: tiktoken
87
+ - Analytics: PostHog
88
+
89
+ ## Relevance to ultimate-pi
90
+
91
+ Direct fit for the harness's need to ingest external codebases as context. Currently the harness uses lean-ctx to read individual files. Gitingest provides bulk codebase ingestion in a format already optimized for LLM context windows.
@@ -0,0 +1,63 @@
1
+ ---
2
+ type: source
3
+ source_type: tool
4
+ name: GitReverse
5
+ author: filiksyos
6
+ date_published: 2025
7
+ url: https://gitreverse.com
8
+ repo: https://github.com/filiksyos/gitreverse
9
+ confidence: high
10
+ key_claims:
11
+ - "Turn a GitHub repository into a plain-language coding agent prompt"
12
+ - "Reverse engineer a codebase into a prompt that likely created it"
13
+ - Uses OpenRouter LLM to generate synthetic user prompts from repo metadata
14
+ - Replace 'hub' with 'reverse' in any GitHub URL
15
+ - Has "Deep Reverse" mode for more detailed prompts
16
+ - Public repos only
17
+ tags:
18
+ - prompt-generation
19
+ - repo-analysis
20
+ - llm-tool
21
+ created: 2026-04-30
22
+ updated: 2026-04-30
23
+ status: ingested
24
+ title: "GitReverse"
25
+ ---
26
+ # GitReverse
27
+
28
+ ## What It Is
29
+
30
+ GitReverse takes a public GitHub repo URL and generates a synthetic user prompt — a prompt someone might paste into Cursor, Claude Code, or Codex to "vibe code" the project from scratch.
31
+
32
+ ## How It Works
33
+
34
+ 1. Fetches repo metadata via GitHub API: description, topics, language breakdown, file tree, README
35
+ 2. Sends metadata + README to an LLM via OpenRouter
36
+ 3. LLM generates a synthetic user prompt describing what the repo does and how to build it
37
+ 4. Output: 3-5 paragraphs of natural language prompt
38
+
39
+ **Crucially, it does NOT read the actual source code files.** It only uses metadata and README. This means the generated prompt is a high-level description, not a code-level specification.
40
+
41
+ ## Features
42
+
43
+ - **Quick Reverse**: Basic prompt from metadata + README
44
+ - **Deep Reverse**: More detailed prompt (likely uses more metadata or a different LLM prompt)
45
+ - **Library**: Browse previously generated prompts
46
+ - **History**: Personal prompt generation history
47
+ - **Manual control**: Toggle for manual parameter adjustment
48
+ - **Shareable URLs**: `/owner/repo` route pattern
49
+
50
+ ## Output Example (for gitreverse repo itself)
51
+
52
+ > Build me a simple web app that can "reverse engineer" a GitHub repository. The main idea is to take a public repo's URL and generate a synthetic prompt. The user interface should be clean and straightforward: just a single page with an input box. On the backend, it will need to use the GitHub API to fetch the repo's metadata, its root file tree, and the README content. Then, it should pass all that context to a large language model using OpenRouter to generate the final prompt. Let's build this with Next.js using the App Router, React, and TypeScript. For styling, please use Tailwind CSS.
53
+
54
+ ## Stack
55
+
56
+ - Next.js (App Router), React, TypeScript
57
+ - Tailwind CSS
58
+ - OpenRouter for LLM access
59
+ - GitHub API for repo metadata
60
+
61
+ ## Relevance to ultimate-pi
62
+
63
+ **Low direct relevance.** GitReverse generates prompts FROM repos — it helps a USER figure out what prompt to write. The ultimate-pi harness is an AGENT that already receives prompts. The harness doesn't need to generate prompts from repos; it needs to ingest repos as context. GitReverse solves the inverse problem.
@@ -0,0 +1,47 @@
1
+ ---
2
+ type: source
3
+ source_type: engineering-blog
4
+ title: "Build with Google Antigravity, our new agentic development platform"
5
+ author: "Google Antigravity Team"
6
+ date_published: 2025-11-20
7
+ url: "https://developers.googleblog.com/build-with-google-antigravity-our-new-agentic-development-platform/"
8
+ confidence: high
9
+ status: ingested
10
+ created: 2026-05-01
11
+ updated: 2026-05-01
12
+ tags:
13
+ - antigravity
14
+ - google
15
+ - agentic-coding
16
+ - harness-design
17
+ key_claims:
18
+ - "Antigravity combines AI-powered IDE with agent-first Manager Surface"
19
+ - "Agents autonomously plan, execute, and verify complex tasks across editor, terminal, and browser"
20
+ - "Artifacts (task lists, implementation plans, screenshots, browser recordings) replace raw tool call logs"
21
+ - "Agents learn from past work via knowledge base"
22
+ - "Free public preview with Gemini 3 Pro, Claude Sonnet 4.5, and GPT-OSS support"
23
+ - "Cross-platform: macOS, Windows, Linux"
24
+ ---
25
+ # Build with Google Antigravity (Official Announcement)
26
+
27
+ Google's official announcement blog post for Antigravity, published November 20, 2025.
28
+
29
+ ## Summary
30
+
31
+ Antigravity is an **agentic development platform** that introduces two distinct interfaces:
32
+
33
+ - **Editor View**: Traditional AI-powered IDE with tab completions and inline commands
34
+ - **Manager Surface**: Dedicated interface to spawn, orchestrate, and observe multiple agents working asynchronously
35
+
36
+ The platform is built around four design tenets: trust, autonomy, feedback, and self-improvement.
37
+
38
+ ## Key Details
39
+
40
+ - **Artifacts**: Tangible deliverables replacing raw tool call logs. Developers comment directly on artifacts (Google Docs-style) and agents incorporate feedback without stopping execution.
41
+ - **Learning**: Core primitive. Agents save useful context and code snippets to knowledge base for future tasks.
42
+ - **Pricing**: Free public preview for individuals with generous rate limits on Gemini 3 Pro.
43
+ - **Models**: Gemini 3 Pro, Anthropic Claude Sonnet 4.5, OpenAI GPT-OSS.
44
+
45
+ ## Relevance to Harness
46
+
47
+ This is the primary source for understanding Antigravity's architecture. The Artifact system, Manager Surface, and learning knowledge base are the three innovations most relevant to our harness design.
@@ -0,0 +1,53 @@
1
+ ---
2
+ type: source
3
+ source_type: encyclopedia
4
+ title: "Google Antigravity - Wikipedia"
5
+ author: "Wikipedia contributors"
6
+ date_published: 2025-11-18
7
+ url: "https://en.wikipedia.org/wiki/Google_Antigravity"
8
+ confidence: high
9
+ status: ingested
10
+ created: 2026-05-01
11
+ updated: 2026-05-01
12
+ tags:
13
+ - antigravity
14
+ - google
15
+ - reference
16
+ key_claims:
17
+ - "Announced November 18, 2025 alongside Gemini 3 release"
18
+ - "Heavily modified fork of Visual Studio Code (debate: direct fork or Windsurf fork)"
19
+ - "Supports Gemini 3.1 Pro, Gemini 3 Flash, Claude Sonnet 4.6/Opus 4.6, GPT-OSS-120B"
20
+ - "Free public preview, cross-platform (Windows, macOS, Linux)"
21
+ - "Editor view + Manager view for agent orchestration"
22
+ - "Artifacts: verifiable deliverables replacing raw tool calls"
23
+ ---
24
+ # Google Antigravity - Wikipedia
25
+
26
+ Wikipedia entry for Google Antigravity. Last updated April 24, 2026.
27
+
28
+ ## Key Facts
29
+
30
+ - **Release**: November 18, 2025 (public preview, currently v1.23.2 as of April 2026)
31
+ - **Platform**: 64-bit Windows 10+, macOS Monterey 12+, 64-bit Linux
32
+ - **License**: Proprietary (free during preview)
33
+ - **Origin**: Heavily modified VS Code fork. Debate exists whether it's a direct fork or a Windsurf fork (Google hired Windsurf team + licensed tech for $2.4B in July 2025)
34
+
35
+ ## Features
36
+
37
+ - **Agent-first paradigm**: Shifts from AI assistance to AI agents operating with autonomy
38
+ - **Editor view**: Standard IDE interface with agent sidebar
39
+ - **Manager view**: Control center for orchestrating multiple agents in parallel
40
+ - **Artifacts**: Verifiable deliverables (task lists, implementation plans, screenshots, browser recordings)
41
+ - **Agent access**: Direct editor, terminal, and integrated browser control
42
+ - **Learning**: Agents learn from previous interactions
43
+
44
+ ## Model Support
45
+
46
+ - Gemini 3.1 Pro (primary)
47
+ - Gemini 3 Flash
48
+ - Anthropic Claude Sonnet 4.6 and Opus 4.6
49
+ - OpenAI GPT-OSS-120B (open-source variant)
50
+
51
+ ## Relevance to Harness
52
+
53
+ Provides authoritative timeline, version history, and architectural origin. The Windsurf deal context (team hire plus technology license) is significant: Antigravity represents Google's $2.4B bet on agent-first development.
@@ -0,0 +1,57 @@
1
+ ---
2
+ type: source
3
+ source_type: engineering-blog
4
+ title: "GSD for Claude Code: A Deep Dive into the Workflow System (codecentric)"
5
+ author: "Felix Abele"
6
+ date_published: 2026-03-03
7
+ date_accessed: 2026-05-05
8
+ url: "https://www.codecentric.de/en/knowledge-hub/blog/the-anatomy-of-claude-code-workflows-turning-slash-commands-into-an-ai-development-system"
9
+ confidence: high
10
+ tags:
11
+ - gsd
12
+ - architecture
13
+ - claude-code
14
+ - spec-driven-development
15
+ key_claims:
16
+ - "GSD relies entirely on native Claude Code features — no proprietary runtime, no framework"
17
+ - "Architecture: Slash Commands (WHAT), Workflow Files (HOW), References (reusable knowledge), Templates (output formats)"
18
+ - "@-file references for context injection: commands reference workflows which reference templates"
19
+ - "AskUserQuestion tool used for interactive decision points with gates and feedback loops"
20
+ - "Parallel research orchestration: 4 researchers → Synthesizer → Roadmapper, in waves"
21
+ - "Two agent spawning patterns: general-purpose with manual role assignment vs registered agent type"
22
+ - "A Node.js CLI script (gsd-tools.cjs) is used for deterministic project state capture — queries that LLMs would do unreliably"
23
+ - "Hooks: SessionStart (update check), PostToolUse (auto-formatting), statusLine (context usage progress bar)"
24
+ - "GSD designed for small to medium projects; not for every use case"
25
+ ---
26
+
27
+ # GSD Architecture Deep Dive (codecentric, March 2026)
28
+
29
+ ## Summary
30
+
31
+ This is the most detailed public architectural analysis of GSD. It walks through the `/gsd:new-project` command step-by-step, showing how Claude Code's native features (skills, agents, hooks, AskUserQuestion, @-file references) are composed into a full software development lifecycle system.
32
+
33
+ ## Architectural Layers
34
+
35
+ ### 1. Slash Commands (Skills)
36
+ Each command is a markdown file in `.claude/commands/gsd/` with:
37
+ - **Frontmatter:** name, description, argument-hint, allowed-tools
38
+ - **Prompt body:** XML-structured (`<objective>`, `<execution_context>`, `<process>`) with @-file references
39
+
40
+ ### 2. Workflow Files
41
+ The actual logic lives in workflow files (e.g., `workflows/new-project.md`). Slash commands are thin wrappers that declare permissions and reference the workflow.
42
+
43
+ ### 3. Agent Orchestration
44
+ - **Wave 1:** 4 parallel researchers (stack, features, architecture, pitfalls) — each writes to its own file
45
+ - **Wave 2:** Synthesizer reads all 4 files → `SUMMARY.md`
46
+ - **Wave 3:** Roadmapper reads synthesis + requirements → creates roadmap
47
+
48
+ ### 4. Deterministic Tooling
49
+ `gsd-tools.cjs` is a Node.js CLI that returns project state as JSON. Avoids the LLM doing unreliable file-existence checks, config loading, or phase number calculations.
50
+
51
+ ### 5. Cross-Session Memory
52
+ All state persisted in `.planning/` files (PROJECT.md, REQUIREMENTS.md, ROADMAP.md, STATE.md). After every completed step, a git commit is performed. `/gsd-resume-work` reconstructs previous state.
53
+
54
+ ## Limitations Noted
55
+ - Designed for small to medium projects
56
+ - May not go deep enough in some places
57
+ - Once you understand the workflow structure, building your own specific systems is straightforward
@@ -0,0 +1,51 @@
1
+ ---
2
+ type: source
3
+ source_type: github-repo
4
+ title: "GitHub - gsd-build/get-shit-done"
5
+ author: "TÂCHES (@glittercowboy)"
6
+ date_published: 2025-12-15
7
+ date_accessed: 2026-05-05
8
+ url: "https://github.com/gsd-build/get-shit-done"
9
+ confidence: high
10
+ tags:
11
+ - gsd
12
+ - meta-prompting
13
+ - spec-driven-development
14
+ - context-engineering
15
+ - claude-code
16
+ key_claims:
17
+ - "GSD is a lightweight meta-prompting, context engineering, and spec-driven development system for Claude Code (and 15+ other runtimes)"
18
+ - "Solves context rot — the quality degradation that happens as LLMs fill their context window"
19
+ - "60.1k GitHub stars, 5.1k forks, 2,367 commits, 143 contributors (May 2026)"
20
+ - "v1.40.0 released May 3, 2026; MIT License"
21
+ - "Built entirely on Claude Code native features: skills, agents, hooks — ~50 markdown files + a Node.js CLI helper"
22
+ - "Core workflow: discuss → plan → execute → verify → ship (phase-based)"
23
+ - "Multi-agent orchestration: thin orchestrator spawns specialized agents with fresh context per plan"
24
+ - "Atomic git commits per task; wave execution (parallel where independent, sequential where dependent)"
25
+ - "Model profiles: quality/balanced/budget/inherit across planning/execution/verification"
26
+ - "86 skills + 33 subagents full install; --minimal flag cuts to 6 core skills (~700 token overhead vs ~12K)"
27
+ - "Skill consolidation v1.40: 86→59 commands via grouped skills (capture, phase, config, workspace)"
28
+ - "GSD-2 standalone version being built on pi.dev"
29
+ ---
30
+
31
+ # GSD (Get Shit Done) — GitHub Repository
32
+
33
+ ## Summary
34
+
35
+ GSD is the most popular spec-driven development harness in the Claude Code ecosystem. It is a set of ~50 markdown files (skills, agents, workflows), a Node.js CLI helper (`gsd-tools.cjs`), and hooks that install into Claude Code's `.claude/` directory via `npx get-shit-done-cc@latest`. No proprietary runtime — all orchestration uses Claude Code's native Task tool for subagent spawning, file-based state for cross-session memory, and structured XML plans for execution.
36
+
37
+ ## Architecture
38
+
39
+ - **Skills (59 shipped):** Slash commands like `/gsd-new-project`, `/gsd-plan-phase`, `/gsd-execute-phase`. Each is a markdown file with frontmatter (allowed-tools, description) + XML-structured prompt body.
40
+ - **Subagents (33):** Specialized agents for research (4 parallel: stack, features, architecture, pitfalls), planning (planner + plan-checker), execution (executors in waves), verification (verifier + debuggers).
41
+ - **Hooks:** SessionStart (update check), PostToolUse (auto-formatting with Prettier), statusLine (context usage + active task).
42
+ - **State files:** `.planning/PROJECT.md`, `REQUIREMENTS.md`, `ROADMAP.md`, `STATE.md` — file-based persistent memory across sessions.
43
+ - **SDK:** TypeScript ESM package (`gsd-sdk`) for headless CLI with init + auto commands.
44
+ - **Security:** Prompt injection detection, path traversal prevention, CI security scanning.
45
+
46
+ ## Key Design Decisions
47
+
48
+ 1. **Deterministic logic in code, not prompts.** The `gsd-tools.cjs` CLI handles file existence checks, config loading, phase numbering — operations where scripts are more reliable than LLM prompts.
49
+ 2. **Fresh context per plan.** Plans are small enough to execute in a clean 200K context window. No accumulated garbage.
50
+ 3. **Filesystem as message bus.** Agent-to-agent communication happens exclusively through files in `.planning/`.
51
+ 4. **Two spawning patterns:** General-purpose agents with manual role assignment (researchers share one definition) vs registered agent types (planner, verifier have unique definitions).
@@ -0,0 +1,59 @@
1
+ ---
2
+ type: source
3
+ source_type: discussion-thread
4
+ title: "Hacker News: Get Shit Done — meta-prompting, context engineering and spec-driven dev system"
5
+ author: "HN Community (submitted by stefankuehnel)"
6
+ date_published: 2026-03-18
7
+ date_accessed: 2026-05-05
8
+ url: "https://news.ycombinator.com/item?id=47417804"
9
+ confidence: high
10
+ tags:
11
+ - gsd
12
+ - community-feedback
13
+ - tool-comparison
14
+ - token-usage
15
+ key_claims:
16
+ - "473 points, 254 comments on HN — high engagement"
17
+ - "Consensus: GSD is good for greenfield/small projects, degrades on large existing codebases"
18
+ - "Multiple users report burning through Claude Max weekly limits in 1-2 days"
19
+ - "Plan mode (native Claude Code) often sufficient; GSD overkill for simple tasks"
20
+ - "Spec-driven tools debated: natural language specs are ambiguous vs. executable tests are precise"
21
+ - "Community comparison: GSD vs Superpowers — both overengineered; Superpowers better for brainstorming, GSD better for state tracking"
22
+ - "Key insight from user DIVx0: GSD agents start leaving orphans in large codebases; verification stages use simple lexical tools, not AST-aware analysis"
23
+ - "User paddy_m described ideal system: plan → adversarial review → test implementation → adversarial PR review, with web UI and git reset on failure"
24
+ - "Several users built custom harnesses after finding GSD too slow or opaque"
25
+ - "GSD-2 standalone version being built on pi.dev"
26
+ ---
27
+
28
+ # GSD Hacker News Discussion (473 points, March 2026)
29
+
30
+ ## Community Consensus
31
+
32
+ ### Positive
33
+ - Works well for greenfield projects and solo developers
34
+ - State tracking across sessions is genuinely useful
35
+ - Helps non-technical users build functional apps
36
+ - The discuss → plan → execute → verify pipeline produces better results than raw prompting
37
+
38
+ ### Negative
39
+ - **Token burner:** Multiple users hit Claude Max weekly limits within 1-2 days
40
+ - **Too slow:** "hours instead of minutes" compared to native plan mode
41
+ - **Degrades on large codebases:** Agents leave orphaned code; verification uses lexical tools, not AST-aware analysis
42
+ - **Over-engineered:** Many users stripped it back to 30% or built their own simpler versions
43
+ - **Black box:** Hard to understand what's happening inside the pipeline
44
+ - **Waterfall feel:** Difficult to adjust phases/plans mid-execution when bugs or requirement changes arise
45
+
46
+ ### Key Comparisons
47
+ | Tool | Strength | Weakness |
48
+ |------|----------|----------|
49
+ | GSD | State tracking, session memory | Token-heavy, slow |
50
+ | Superpowers | Brainstorming, exploration | Overzealous, writes code into plans |
51
+ | BMAD | Deep elicitation, adversarial review | Steep learning curve, heavy artifacts |
52
+ | OpenSpec | Delta specs, parallel work | Opinionated directory structure |
53
+ | Native Plan Mode | Fast, simple | No cross-session memory |
54
+
55
+ ### Notable Quotes
56
+ - "These frameworks are great for fire-and-forget tasks, especially when there is some research involved but they burn 10x more tokens"
57
+ - "The spec-driven approach is underrated. Treating the spec as a living artifact the AI can reference across sessions"
58
+ - "I prefer move fast and start over if anything goes off track"
59
+ - "Spec-Driven Development is a curious term — it suggests it is in the tradition of TDD but goes in the opposite direction"
@@ -0,0 +1,56 @@
1
+ ---
2
+ type: source
3
+ source_type: interview-blog
4
+ title: "Python's Design Philosophy — Guido van Rossum"
5
+ author: "Guido van Rossum"
6
+ date_published: 2009-01-13
7
+ url: "http://python-history.blogspot.com/2009/01/pythons-design-philosophy.html"
8
+ confidence: high
9
+ key_claims:
10
+ - "Borrow ideas from elsewhere whenever it makes sense"
11
+ - "Things should be as simple as possible, but no simpler (Einstein)"
12
+ - "Do one thing well (Unix philosophy)"
13
+ - "Don't fret too much about performance — plan to optimize later"
14
+ - "Don't try for perfection because 'good enough' is often just that"
15
+ - "It's okay to cut corners sometimes, especially if you can do it right later"
16
+ - "The Python implementation should not be tied to a particular platform"
17
+ - "Errors should not be fatal. At the same time, errors should not pass silently"
18
+ - "A bug in the user's Python code should never lead to undefined behavior of the interpreter"
19
+ tags: [python, guido-van-rossum, language-design, zen-of-python]
20
+ also_see:
21
+ - "[[guido-van-rossum-2025-interview]]"
22
+ ---
23
+
24
+ # Python's Design Philosophy — Guido van Rossum
25
+
26
+ ## Timesaving Rules (from Python's origin as skunkworks project)
27
+
28
+ - Borrow ideas from elsewhere whenever it makes sense.
29
+ - "Things should be as simple as possible, but no simpler." (Einstein)
30
+ - Do one thing well (The Unix Philosophy).
31
+ - Don't fret too much about performance — plan to optimize later when needed.
32
+ - Don't fight the environment and go with the flow.
33
+ - Don't try for perfection because "good enough" is often just that.
34
+ - It's okay to cut corners sometimes, especially if you can do it right later.
35
+
36
+ ## Design Principles
37
+
38
+ - The Python implementation should not be tied to a particular platform.
39
+ - Don't bother users with details that the machine can handle.
40
+ - Support and encourage platform-independent user code, but don't cut off access to platform capabilities.
41
+ - A large complex system should have multiple levels of extensibility.
42
+ - Errors should not be fatal. User code should be able to recover.
43
+ - Errors should not pass silently (led to exceptions throughout).
44
+ - A bug in user code should never lead to undefined interpreter behavior; a core dump is never the user's fault.
45
+
46
+ ## The Zen of Python (Tim Peters)
47
+
48
+ Beautiful is better than ugly. Explicit is better than implicit. Simple is better than complex. Readability counts. Errors should never pass silently. In the face of ambiguity, refuse the temptation to guess. There should be one — and preferably only one — obvious way to do it. If the implementation is hard to explain, it's a bad idea. Namespaces are one honking great idea.
49
+
50
+ ## Deliberate Departures from ABC
51
+
52
+ The ABC group (where van Rossum worked before Python) strived for perfection, used optimal algorithms for asymptotically large collections (bad for small ones), isolated users from the "big bad world of computers," and created a closed system. Python deliberately went opposite: pragmatic, evolutionary, open, and welcoming of user participation in design.
53
+
54
+ ## Guido's 2025 Perspective on Type Hints
55
+
56
+ "Type hints are useful above about 10,000 lines of code — below that, it's of diminishing value since a developer can keep enough of it in their head. I wouldn't foist them upon beginners." (Source: [[guido-van-rossum-2025-interview]])
@@ -0,0 +1,48 @@
1
+ ---
2
+ type: source
3
+ source_type: interview-blog
4
+ title: "7 Learnings from Anders Hejlsberg: Architect Behind C# and TypeScript"
5
+ author: "Aaron Winston, GitHub Blog"
6
+ date_published: 2026-01-27
7
+ url: "https://github.blog/developer-skills/programming-languages-and-frameworks/7-learnings-from-anders-hejlsberg-the-architect-behind-c-and-typescript/"
8
+ confidence: high
9
+ key_claims:
10
+ - "Fast feedback loops matter more than elegance"
11
+ - "Scaling software means letting go of personal preferences"
12
+ - "TypeScript succeeded because it extended JavaScript instead of replacing it"
13
+ - "Visibility is part of what makes open source work — develop in the open"
14
+ - "Behavioral compatibility often matters more than architectural purity"
15
+ - "In an AI-driven workflow, grounding matters more than generation — type systems as guardrails"
16
+ - "Leaving JavaScript for Go as the compiler's implementation language was a necessary break for performance"
17
+ tags: [anders-hejlsberg, typescript, csharp, language-design, ai-coding]
18
+ ---
19
+
20
+ # 7 Learnings from Anders Hejlsberg
21
+
22
+ ## 1. Fast feedback matters more than almost anything else
23
+
24
+ Turbo Pascal's impact came from shortening the feedback loop — edit, compile, run without touching disk. "When you typed your code, you wanted to run it immediately." TypeScript's value comes from tooling: incremental checking, fast partial results, language services that respond quickly even on large codebases. Fast feedback changes behavior: developers experiment more, refactor more confidently, catch problems closer to introduction.
25
+
26
+ ## 2. Scaling software means letting go of personal preferences
27
+
28
+ "You have to accept that things get done differently than you would have preferred. Fixing it would not really change the behavior anyway." The goal shifts from code that looks the way you'd write it to code that many people can understand, maintain, and evolve together.
29
+
30
+ ## 3. TypeScript extended JavaScript instead of replacing it
31
+
32
+ Creating a brand-new language in 2012 would have required years of investment in editors, debuggers, and community adoption. TypeScript worked with constraints developers already had. "Meaningful progress often comes from making the systems you already depend on more capable instead of trying to start over."
33
+
34
+ ## 4. Visibility is part of what makes open source work
35
+
36
+ 2014 move to GitHub transformed TypeScript. Design debates, rejected ideas, and tradeoffs remain accessible. "12 years of history captured in our project."
37
+
38
+ ## 5. Leaving JavaScript as implementation language was a necessary break
39
+
40
+ The TypeScript compiler was ported to Go for performance and concurrency. This was not a rewrite — semantic fidelity was the goal. "The new compiler needed to behave exactly like the old one, including quirks and edge cases."
41
+
42
+ ## 6. AI workflow: grounding matters more than generation
43
+
44
+ Hejlsberg is skeptical of AI-first programming languages. The risk: "plausible, confident code that lacks enough grounding in the realities of a codebase." Strong type systems, reliable refactoring tools, and accurate semantic models become essential guardrails. "The most valuable tools in an AI-assisted workflow aren't the ones that generate the most code, but the ones that constrain it correctly."
45
+
46
+ ## 7. Open collaboration builds institutional memory
47
+
48
+ "Years of discussion, decisions, and tradeoffs remain searchable and visible. That history does not disappear into private email threads or internal systems."
@@ -0,0 +1,80 @@
1
+ ---
2
+ type: source
3
+ status: ingested
4
+ source_type: github-issue
5
+ title: "ironclaw DriftMonitor — Anti-Drift Self-Checks in Agentic Loop"
6
+ author: ilblackdragon (nearai)
7
+ date_published: 2026-03-25
8
+ url: https://github.com/nearai/ironclaw/issues/1634
9
+ confidence: high
10
+ key_claims:
11
+ - "Rule-based DriftMonitor detects 5 stuck patterns without additional LLM calls"
12
+ - "Corrections injected as system messages into LLM context"
13
+ - "Integrates via existing delegate hook system, no agentic_loop.rs changes"
14
+ - "Prior art: RuFlo's Continue Gate (checkpoint, rework ratio, budget slope)"
15
+ tags:
16
+ - source
17
+ - drift-detection
18
+ - agent-loop
19
+ - ironclaw
20
+ - guardian-agent
21
+ related:
22
+ - "[[Research: Meta-Agent Context Drift Detection]]"
23
+ - "[[context-drift-in-agents]]"
24
+ - "[[agent-loop-detection-patterns]]"
25
+ created: 2026-05-02
26
+ updated: 2026-05-02
27
+
28
+ ---
+
+ # ironclaw DriftMonitor
29
+
30
+ ## Summary
31
+
32
+ GitHub issue proposing a lightweight, rule-based `DriftMonitor` for the ironclaw agentic loop. Detects common failure patterns (repetition loops, failure spirals, tool cycling, silence drift, rework churn) and injects corrective system messages — without requiring additional LLM calls. This is the closest existing implementation to the meta-agent context drift detection concept.
33
+
34
+ ## What It Contributes
35
+
36
+ This is the **primary prior art** for the meta-agent context drift detection concept. It implements detection + injection but does NOT implement context pruning or session restart. The proposed meta-agent extends this by adding pruning heuristics and escalation levels.
37
+
38
+ ## Five Detection Rules
39
+
40
+ 1. **Repetition** — Same tool + same param hash ≥3 times in last 10 calls → inject correction
41
+ 2. **Failure spiral** — ≥4 consecutive tool failures → inject "reassess approach"
42
+ 3. **Tool cycling** — A-B-A-B-A-B pattern in last 6 calls → inject "state what's blocking you"
43
+ 4. **Silence drift** — ≥15 iterations since last text response → inject "provide progress update"
44
+ 5. **Rework detection** — Same file written ≥3 times → inject "review before writing again"
45
+
46
+ ## Design Details
47
+
48
+ - `DriftMonitor` struct with `original_goal`, `tool_history` (VecDeque), `IterationMetrics`, `DriftConfig`
49
+ - `ToolCallRecord` has `name`, `params_hash` (u64), `succeeded`, `iteration`
50
+ - Corrections injected as system messages (same pattern as existing `TOOL_INTENT_NUDGE`)
51
+ - Configurable via env vars (`IRONCLAW_DRIFT_*`) or disabled entirely
52
+ - Config struct: `enabled`, `repetition_window`, `repetition_threshold`, `max_consecutive_failures`, `cycle_detection_window`, `silence_threshold`, `max_file_rewrites`, `checkpoint_interval`
53
+
54
+ ## Future Extensions (Not in Scope)
55
+
56
+ - **Semantic drift detection** — LLM-based check comparing current context to original goal
57
+ - **Plan adherence** — Compare actual tool sequence to planned sequence
58
+ - **Budget slope analysis** — Linear regression over token consumption windows
59
+ - **Escalation levels** — Soft nudge → stronger → early loop exit
60
+
61
+ ## Integration Points
62
+
63
+ | File | Change |
64
+ |------|--------|
65
+ | `src/agent/drift_monitor.rs` | **New** — struct + detection rules |
66
+ | `src/agent/dispatcher.rs` | Add field, call check() in before_llm_call() |
67
+ | `src/worker/job.rs` | Same integration for JobDelegate |
68
+ | `src/agent/mod.rs` | Module declaration |
69
+
70
+ No changes to `agentic_loop.rs` — delegates already own the hooks.
71
+
72
+ ## Relevance to Meta-Agent Concept
73
+
74
+ The ironclaw DriftMonitor is detection + injection. The meta-agent concept adds:
75
+ - **Context pruning**: Removing dead-end entries, not just injecting corrections
76
+ - **Session restart**: Clean context after pruning
77
+ - **Escalation model**: Soft → strong → forced restart
78
+ - **Model-adaptive behavior**: Different detection frequencies per model profile
79
+
80
+ The DriftMonitor validates that rule-based detection is feasible and effective. The missing piece — context pruning — is the novel contribution.