groundswell 0.0.2 → 1.0.0

This diff compares the contents of two publicly available versions of the package, as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.
Files changed (554)
  1. package/LICENSE +21 -0
  2. package/README.md +26 -9
  3. package/dist/cache/cache-key.d.ts +86 -0
  4. package/dist/cache/cache-key.d.ts.map +1 -0
  5. package/dist/cache/cache-key.js +204 -0
  6. package/dist/cache/cache-key.js.map +1 -0
  7. package/dist/cache/cache.d.ts +104 -0
  8. package/dist/cache/cache.d.ts.map +1 -0
  9. package/dist/cache/cache.js +179 -0
  10. package/dist/cache/cache.js.map +1 -0
  11. package/{src/cache/index.ts → dist/cache/index.d.ts} +1 -1
  12. package/dist/cache/index.d.ts.map +1 -0
  13. package/dist/cache/index.js +6 -0
  14. package/dist/cache/index.js.map +1 -0
  15. package/dist/core/agent.d.ts +203 -0
  16. package/dist/core/agent.d.ts.map +1 -0
  17. package/dist/core/agent.js +833 -0
  18. package/dist/core/agent.js.map +1 -0
  19. package/{src/core/context.ts → dist/core/context.d.ts} +16 -67
  20. package/dist/core/context.d.ts.map +1 -0
  21. package/dist/core/context.js +80 -0
  22. package/dist/core/context.js.map +1 -0
  23. package/dist/core/event-tree.d.ts +72 -0
  24. package/dist/core/event-tree.d.ts.map +1 -0
  25. package/dist/core/event-tree.js +211 -0
  26. package/dist/core/event-tree.js.map +1 -0
  27. package/{src/core/factory.ts → dist/core/factory.d.ts} +6 -27
  28. package/dist/core/factory.d.ts.map +1 -0
  29. package/dist/core/factory.js +110 -0
  30. package/dist/core/factory.js.map +1 -0
  31. package/{src/core/index.ts → dist/core/index.d.ts} +2 -10
  32. package/dist/core/index.d.ts.map +1 -0
  33. package/dist/core/index.js +9 -0
  34. package/dist/core/index.js.map +1 -0
  35. package/dist/core/logger.d.ts +50 -0
  36. package/dist/core/logger.d.ts.map +1 -0
  37. package/dist/core/logger.js +91 -0
  38. package/dist/core/logger.js.map +1 -0
  39. package/dist/core/mcp-handler.d.ts +127 -0
  40. package/dist/core/mcp-handler.d.ts.map +1 -0
  41. package/dist/core/mcp-handler.js +323 -0
  42. package/dist/core/mcp-handler.js.map +1 -0
  43. package/dist/core/prompt.d.ts +80 -0
  44. package/dist/core/prompt.d.ts.map +1 -0
  45. package/dist/core/prompt.js +120 -0
  46. package/dist/core/prompt.js.map +1 -0
  47. package/dist/core/workflow-context.d.ts +61 -0
  48. package/dist/core/workflow-context.d.ts.map +1 -0
  49. package/dist/core/workflow-context.js +358 -0
  50. package/dist/core/workflow-context.js.map +1 -0
  51. package/dist/core/workflow.d.ts +543 -0
  52. package/dist/core/workflow.d.ts.map +1 -0
  53. package/dist/core/workflow.js +986 -0
  54. package/dist/core/workflow.js.map +1 -0
  55. package/dist/debugger/event-replayer.d.ts +422 -0
  56. package/dist/debugger/event-replayer.d.ts.map +1 -0
  57. package/dist/debugger/event-replayer.js +639 -0
  58. package/dist/debugger/event-replayer.js.map +1 -0
  59. package/dist/debugger/index.d.ts +2 -0
  60. package/dist/debugger/index.d.ts.map +1 -0
  61. package/{src/debugger/index.ts → dist/debugger/index.js} +1 -0
  62. package/dist/debugger/index.js.map +1 -0
  63. package/dist/debugger/tree-debugger.d.ts +240 -0
  64. package/dist/debugger/tree-debugger.d.ts.map +1 -0
  65. package/dist/debugger/tree-debugger.js +620 -0
  66. package/dist/debugger/tree-debugger.js.map +1 -0
  67. package/dist/decorators/index.d.ts +4 -0
  68. package/dist/decorators/index.d.ts.map +1 -0
  69. package/{src/decorators/index.ts → dist/decorators/index.js} +1 -0
  70. package/dist/decorators/index.js.map +1 -0
  71. package/dist/decorators/observed-state.d.ts +32 -0
  72. package/dist/decorators/observed-state.d.ts.map +1 -0
  73. package/dist/decorators/observed-state.js +79 -0
  74. package/dist/decorators/observed-state.js.map +1 -0
  75. package/dist/decorators/step.d.ts +15 -0
  76. package/dist/decorators/step.d.ts.map +1 -0
  77. package/dist/decorators/step.js +192 -0
  78. package/dist/decorators/step.js.map +1 -0
  79. package/dist/decorators/task.d.ts +50 -0
  80. package/dist/decorators/task.d.ts.map +1 -0
  81. package/dist/decorators/task.js +118 -0
  82. package/dist/decorators/task.js.map +1 -0
  83. package/dist/examples/index.d.ts +3 -0
  84. package/dist/examples/index.d.ts.map +1 -0
  85. package/{src/examples/index.ts → dist/examples/index.js} +1 -0
  86. package/dist/examples/index.js.map +1 -0
  87. package/dist/examples/tdd-orchestrator.d.ts +15 -0
  88. package/dist/examples/tdd-orchestrator.d.ts.map +1 -0
  89. package/dist/examples/tdd-orchestrator.js +121 -0
  90. package/dist/examples/tdd-orchestrator.js.map +1 -0
  91. package/dist/examples/test-cycle-workflow.d.ts +14 -0
  92. package/dist/examples/test-cycle-workflow.d.ts.map +1 -0
  93. package/dist/examples/test-cycle-workflow.js +116 -0
  94. package/dist/examples/test-cycle-workflow.js.map +1 -0
  95. package/dist/harnesses/claude-code-harness.d.ts +391 -0
  96. package/dist/harnesses/claude-code-harness.d.ts.map +1 -0
  97. package/dist/harnesses/claude-code-harness.js +1076 -0
  98. package/dist/harnesses/claude-code-harness.js.map +1 -0
  99. package/dist/harnesses/harness-registry.d.ts +440 -0
  100. package/dist/harnesses/harness-registry.d.ts.map +1 -0
  101. package/dist/harnesses/harness-registry.js +543 -0
  102. package/dist/harnesses/harness-registry.js.map +1 -0
  103. package/dist/harnesses/index.d.ts +12 -0
  104. package/dist/harnesses/index.d.ts.map +1 -0
  105. package/dist/harnesses/index.js +11 -0
  106. package/dist/harnesses/index.js.map +1 -0
  107. package/dist/harnesses/pi-harness.d.ts +219 -0
  108. package/dist/harnesses/pi-harness.d.ts.map +1 -0
  109. package/dist/harnesses/pi-harness.js +676 -0
  110. package/dist/harnesses/pi-harness.js.map +1 -0
  111. package/dist/harnesses/pi-schema-converter.d.ts +24 -0
  112. package/dist/harnesses/pi-schema-converter.d.ts.map +1 -0
  113. package/dist/harnesses/pi-schema-converter.js +81 -0
  114. package/dist/harnesses/pi-schema-converter.js.map +1 -0
  115. package/dist/harnesses/register-defaults.d.ts +24 -0
  116. package/dist/harnesses/register-defaults.d.ts.map +1 -0
  117. package/dist/harnesses/register-defaults.js +40 -0
  118. package/dist/harnesses/register-defaults.js.map +1 -0
  119. package/dist/harnesses/session-store.d.ts +201 -0
  120. package/dist/harnesses/session-store.d.ts.map +1 -0
  121. package/dist/harnesses/session-store.js +254 -0
  122. package/dist/harnesses/session-store.js.map +1 -0
  123. package/dist/index.d.ts +37 -0
  124. package/dist/index.d.ts.map +1 -0
  125. package/dist/index.js +57 -0
  126. package/dist/index.js.map +1 -0
  127. package/dist/reflection/index.d.ts +5 -0
  128. package/dist/reflection/index.d.ts.map +1 -0
  129. package/{src/reflection/index.ts → dist/reflection/index.js} +1 -1
  130. package/dist/reflection/index.js.map +1 -0
  131. package/dist/reflection/reflection.d.ts +84 -0
  132. package/dist/reflection/reflection.d.ts.map +1 -0
  133. package/dist/reflection/reflection.js +344 -0
  134. package/dist/reflection/reflection.js.map +1 -0
  135. package/dist/tools/index.d.ts +6 -0
  136. package/dist/tools/index.d.ts.map +1 -0
  137. package/dist/tools/index.js +11 -0
  138. package/dist/tools/index.js.map +1 -0
  139. package/dist/tools/introspection.d.ts +165 -0
  140. package/dist/tools/introspection.d.ts.map +1 -0
  141. package/dist/tools/introspection.js +324 -0
  142. package/dist/tools/introspection.js.map +1 -0
  143. package/dist/types/agent.d.ts +1317 -0
  144. package/dist/types/agent.d.ts.map +1 -0
  145. package/dist/types/agent.js +423 -0
  146. package/dist/types/agent.js.map +1 -0
  147. package/dist/types/decorators.d.ts +40 -0
  148. package/dist/types/decorators.d.ts.map +1 -0
  149. package/dist/types/decorators.js +2 -0
  150. package/dist/types/decorators.js.map +1 -0
  151. package/dist/types/error-strategy.d.ts +13 -0
  152. package/dist/types/error-strategy.d.ts.map +1 -0
  153. package/dist/types/error-strategy.js +2 -0
  154. package/dist/types/error-strategy.js.map +1 -0
  155. package/dist/types/error.d.ts +20 -0
  156. package/dist/types/error.d.ts.map +1 -0
  157. package/dist/types/error.js +2 -0
  158. package/dist/types/error.js.map +1 -0
  159. package/dist/types/events.d.ts +113 -0
  160. package/dist/types/events.d.ts.map +1 -0
  161. package/dist/types/events.js +2 -0
  162. package/dist/types/events.js.map +1 -0
  163. package/dist/types/harnesses.d.ts +474 -0
  164. package/dist/types/harnesses.d.ts.map +1 -0
  165. package/dist/types/harnesses.js +2 -0
  166. package/dist/types/harnesses.js.map +1 -0
  167. package/dist/types/index.d.ts +23 -0
  168. package/dist/types/index.d.ts.map +1 -0
  169. package/dist/types/index.js +8 -0
  170. package/dist/types/index.js.map +1 -0
  171. package/dist/types/logging.d.ts +24 -0
  172. package/dist/types/logging.d.ts.map +1 -0
  173. package/dist/types/logging.js +2 -0
  174. package/dist/types/logging.js.map +1 -0
  175. package/dist/types/observer.d.ts +18 -0
  176. package/dist/types/observer.d.ts.map +1 -0
  177. package/dist/types/observer.js +2 -0
  178. package/dist/types/observer.js.map +1 -0
  179. package/dist/types/prompt.d.ts +31 -0
  180. package/dist/types/prompt.d.ts.map +1 -0
  181. package/dist/types/prompt.js +6 -0
  182. package/dist/types/prompt.js.map +1 -0
  183. package/dist/types/providers.d.ts +691 -0
  184. package/dist/types/providers.d.ts.map +1 -0
  185. package/dist/types/providers.js +14 -0
  186. package/dist/types/providers.js.map +1 -0
  187. package/dist/types/reflection.d.ts +96 -0
  188. package/dist/types/reflection.d.ts.map +1 -0
  189. package/dist/types/reflection.js +24 -0
  190. package/dist/types/reflection.js.map +1 -0
  191. package/dist/types/restart.d.ts +132 -0
  192. package/dist/types/restart.d.ts.map +1 -0
  193. package/dist/types/restart.js +2 -0
  194. package/dist/types/restart.js.map +1 -0
  195. package/dist/types/sdk-primitives.d.ts +118 -0
  196. package/dist/types/sdk-primitives.d.ts.map +1 -0
  197. package/dist/types/sdk-primitives.js +6 -0
  198. package/dist/types/sdk-primitives.js.map +1 -0
  199. package/{src/types/snapshot.ts → dist/types/snapshot.d.ts} +5 -5
  200. package/dist/types/snapshot.d.ts.map +1 -0
  201. package/dist/types/snapshot.js +2 -0
  202. package/dist/types/snapshot.js.map +1 -0
  203. package/dist/types/streaming.d.ts +194 -0
  204. package/dist/types/streaming.d.ts.map +1 -0
  205. package/dist/types/streaming.js +67 -0
  206. package/dist/types/streaming.js.map +1 -0
  207. package/dist/types/workflow-context.d.ts +275 -0
  208. package/dist/types/workflow-context.d.ts.map +1 -0
  209. package/dist/types/workflow-context.js +8 -0
  210. package/dist/types/workflow-context.js.map +1 -0
  211. package/dist/types/workflow.d.ts +30 -0
  212. package/dist/types/workflow.d.ts.map +1 -0
  213. package/dist/types/workflow.js +2 -0
  214. package/dist/types/workflow.js.map +1 -0
  215. package/dist/utils/agent-validation.d.ts +88 -0
  216. package/dist/utils/agent-validation.d.ts.map +1 -0
  217. package/dist/utils/agent-validation.js +87 -0
  218. package/dist/utils/agent-validation.js.map +1 -0
  219. package/dist/utils/delay.d.ts +7 -0
  220. package/dist/utils/delay.d.ts.map +1 -0
  221. package/dist/utils/delay.js +9 -0
  222. package/dist/utils/delay.js.map +1 -0
  223. package/dist/utils/harness-config.d.ts +180 -0
  224. package/dist/utils/harness-config.d.ts.map +1 -0
  225. package/dist/utils/harness-config.js +311 -0
  226. package/dist/utils/harness-config.js.map +1 -0
  227. package/dist/utils/id.d.ts +6 -0
  228. package/dist/utils/id.d.ts.map +1 -0
  229. package/dist/utils/id.js +12 -0
  230. package/dist/utils/id.js.map +1 -0
  231. package/dist/utils/index.d.ts +13 -0
  232. package/dist/utils/index.d.ts.map +1 -0
  233. package/dist/utils/index.js +11 -0
  234. package/dist/utils/index.js.map +1 -0
  235. package/dist/utils/model-spec.d.ts +110 -0
  236. package/dist/utils/model-spec.d.ts.map +1 -0
  237. package/dist/utils/model-spec.js +149 -0
  238. package/dist/utils/model-spec.js.map +1 -0
  239. package/dist/utils/observable.d.ts +54 -0
  240. package/dist/utils/observable.d.ts.map +1 -0
  241. package/dist/utils/observable.js +82 -0
  242. package/dist/utils/observable.js.map +1 -0
  243. package/dist/utils/provider-config.d.ts +10 -0
  244. package/dist/utils/provider-config.d.ts.map +1 -0
  245. package/dist/utils/provider-config.js +10 -0
  246. package/dist/utils/provider-config.js.map +1 -0
  247. package/dist/utils/restart-analysis.d.ts +202 -0
  248. package/dist/utils/restart-analysis.d.ts.map +1 -0
  249. package/dist/utils/restart-analysis.js +426 -0
  250. package/dist/utils/restart-analysis.js.map +1 -0
  251. package/dist/utils/session-serialization.d.ts +118 -0
  252. package/dist/utils/session-serialization.d.ts.map +1 -0
  253. package/dist/utils/session-serialization.js +217 -0
  254. package/dist/utils/session-serialization.js.map +1 -0
  255. package/dist/utils/workflow-error-utils.d.ts +22 -0
  256. package/dist/utils/workflow-error-utils.d.ts.map +1 -0
  257. package/dist/utils/workflow-error-utils.js +45 -0
  258. package/dist/utils/workflow-error-utils.js.map +1 -0
  259. package/package.json +34 -5
  260. package/.claude/commands/subtask-planning/prp-base-create.md +0 -120
  261. package/.claude/commands/subtask-planning/prp-base-execute.md +0 -65
  262. package/.claude/commands/task-breakdown.md +0 -94
  263. package/.claude/settings.local.json +0 -9
  264. package/.claude/system_prompts/task-breakdown.md +0 -101
  265. package/CHANGELOG.md +0 -188
  266. package/PRD.md +0 -543
  267. package/PRPs/001-hierarchical-workflow-engine.md +0 -2438
  268. package/PRPs/PRDs/002-agent-prompt.md +0 -390
  269. package/PRPs/PRDs/003-agent-prompt.md +0 -943
  270. package/PRPs/PRDs/004-agent-prompt.md +0 -1136
  271. package/PRPs/PRDs/tasks-001.json +0 -492
  272. package/PRPs/README.md +0 -83
  273. package/PRPs/templates/prp_base.md +0 -222
  274. package/docs/agent.md +0 -422
  275. package/docs/prompt.md +0 -419
  276. package/docs/workflow.md +0 -600
  277. package/examples/README.md +0 -258
  278. package/examples/examples/01-basic-workflow.ts +0 -100
  279. package/examples/examples/02-decorator-options.ts +0 -217
  280. package/examples/examples/03-parent-child.ts +0 -241
  281. package/examples/examples/04-observers-debugger.ts +0 -340
  282. package/examples/examples/05-error-handling.ts +0 -387
  283. package/examples/examples/06-concurrent-tasks.ts +0 -352
  284. package/examples/examples/07-agent-loops.ts +0 -432
  285. package/examples/examples/08-sdk-features.ts +0 -667
  286. package/examples/examples/09-reflection.ts +0 -573
  287. package/examples/examples/10-introspection.ts +0 -550
  288. package/examples/examples/11-reparenting-workflows.ts +0 -269
  289. package/examples/index.ts +0 -147
  290. package/examples/utils/helpers.ts +0 -57
  291. package/package-lock.json +0 -2398
  292. package/plan/001_d3bb02af4886/TEST_RESULTS.md +0 -259
  293. package/plan/001_d3bb02af4886/backlog.json +0 -867
  294. package/plan/001_d3bb02af4886/bug_fix_tasks.json +0 -484
  295. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M1T1S1/PRP.md +0 -488
  296. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M1T1S2/PRP.md +0 -581
  297. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M1T1S3/PRP.md +0 -687
  298. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T1S1/PRP.md +0 -492
  299. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T1S3/PRP.md +0 -932
  300. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T1S3/research/concurrent_error_testing_patterns.md +0 -1109
  301. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T1S3/research/vitest_concurrent_testing.md +0 -802
  302. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T1S3/research/workflow_engine_test_references.md +0 -603
  303. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T2S1/PRP.md +0 -564
  304. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T2S3/PRP.md +0 -518
  305. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T2S4/PRP.md +0 -1252
  306. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T3S1/PRP.md +0 -364
  307. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T3S1/research/CODEBASE_INVENTORY.md +0 -114
  308. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T3S1/research/DECORATOR_DOCUMENTATION_PATTERNS.md +0 -205
  309. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T3S1/research/PRD_LOCATION_ANALYSIS.md +0 -199
  310. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M2T3S1/research/ULTRATHINK_PRP_PLAN.md +0 -134
  311. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T1S1/PRP.md +0 -495
  312. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T1S1/research/console_error_inventory.md +0 -435
  313. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T1S2/PRP.md +0 -506
  314. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T1S3/PRP.md +0 -612
  315. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T2S2/PRP.md +0 -558
  316. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T2S2/research/external_research.md +0 -788
  317. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T3S2/PRP.md +0 -460
  318. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T3S3/PRP.md +0 -454
  319. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T4S1/PRP.md +0 -520
  320. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T4S1/RECOMMENDATION.md +0 -417
  321. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T4S1/research/external_workflow_engines_research.md +0 -760
  322. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T4S1/research/security_implications_analysis.md +0 -245
  323. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M3T4S2/PRP.md +0 -792
  324. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M4T1S1/PRP.md +0 -535
  325. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M4T1S1/TEST_EXECUTION_REPORT.md +0 -190
  326. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M4T1S2/PRP.md +0 -654
  327. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M4T1S2/TEST_FIX_REPORT.md +0 -227
  328. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M4T1S2/research/KEY_FINDINGS.md +0 -345
  329. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M4T1S2/research/QUICK_REFERENCE.md +0 -193
  330. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M4T1S2/research/test_maintenance_research.md +0 -1323
  331. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M4T3S1/BREAKING_CHANGES_AUDIT.md +0 -1011
  332. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M4T3S1/PRP.md +0 -927
  333. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/P1M4T3S2/PRP.md +0 -505
  334. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/architecture/logger_child_signature_analysis.md +0 -401
  335. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M1T1S3/child_implementation_research.md +0 -142
  336. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M1T1S3/test_patterns_research.md +0 -112
  337. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M1T1S3/vitest_patterns_research.md +0 -159
  338. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M1T1S4/PRP.md +0 -549
  339. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M1T1S4/VERIFICATION_REPORT.md +0 -368
  340. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M1T1S4/edge_case_analysis.md +0 -172
  341. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M1T1S4/usage_inventory.md +0 -175
  342. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T1S2/PRP.md +0 -696
  343. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T1S4/PRP.md +0 -860
  344. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/PRP.md +0 -1066
  345. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/01-testing-aggregated-errors.md +0 -1103
  346. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/01_typescript_error_aggregation_patterns.md +0 -789
  347. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/02-error-merge-strategy-testing-guide.md +0 -1098
  348. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/02_aggregate_error_patterns.md +0 -1037
  349. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/03-promise-allsettled-testing-patterns.md +0 -916
  350. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/03_error_merging_strategies.md +0 -1045
  351. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/04_github_stackoverflow_examples.md +0 -890
  352. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/05_comprehensive_summary.md +0 -822
  353. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/INDEX.md +0 -668
  354. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/QUICK_REFERENCE.md +0 -706
  355. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/README.md +0 -265
  356. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S2/research/RESEARCH_REPORT.md +0 -655
  357. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T2S4/research/vitest_testing_patterns.md +0 -1103
  358. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M2T3S2/PRP.md +0 -426
  359. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T1S2/PRP.md +0 -506
  360. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T1S2/research/QUICK_REFERENCE.md +0 -114
  361. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T1S2/research/RESEARCH_SUMMARY.md +0 -316
  362. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T1S2/research/vitest_observer_error_logging_best_practices.md +0 -754
  363. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T1S3/PRP.md +0 -612
  364. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T2S1/PRP.md +0 -719
  365. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T2S1/README.md +0 -215
  366. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T2S1/analysis.md +0 -765
  367. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T2S3/PRP.md +0 -718
  368. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T3S1/DECISION.md +0 -149
  369. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T3S1/PRP.md +0 -470
  370. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T3S1/research/ULTRATHINK_PLAN.md +0 -332
  371. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T3S1/research/codebase_workflow_name_analysis.md +0 -167
  372. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T3S1/research/external_best_practices.md +0 -265
  373. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T3S1/research/validation_patterns.md +0 -273
  374. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T4S1/workflow_engine_ancestry_api_research.md +0 -760
  375. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M3T4S3-PRP.md +0 -434
  376. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M4T2S1/PRP.md +0 -717
  377. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M4T2S2/PRP.md +0 -472
  378. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M4T2S2/VALIDATION_REPORT.md +0 -125
  379. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/P1M4T2S2/research/ULTRATHINK_PRP_PLAN.md +0 -301
  380. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/error-logging-best-practices.md +0 -1170
  381. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/research_typescript_partial_and_overloads.md +0 -940
  382. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/vitest-quick-reference.md +0 -151
  383. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/docs/vitest-research.md +0 -650
  384. package/plan/001_d3bb02af4886/bugfix/001_e8e04329daf3/prd_snapshot.md +0 -259
  385. package/plan/001_d3bb02af4886/bugfix/P1M1T1S1/PRP.md +0 -457
  386. package/plan/001_d3bb02af4886/bugfix/RESEARCH_SUMMARY.md +0 -346
  387. package/plan/001_d3bb02af4886/bugfix/architecture/codebase_structure.md +0 -311
  388. package/plan/001_d3bb02af4886/bugfix/architecture/concurrent_execution_best_practices.md +0 -1565
  389. package/plan/001_d3bb02af4886/bugfix/architecture/error_handling_patterns.md +0 -288
  390. package/plan/001_d3bb02af4886/bugfix/architecture/promise_all_analysis.md +0 -741
  391. package/plan/001_d3bb02af4886/docs/PRP/P1M1T1S4-functional-workflow-error-state-capture-test.md +0 -652
  392. package/plan/001_d3bb02af4886/docs/PRP/P1P2-PRP.md +0 -527
  393. package/plan/001_d3bb02af4886/docs/PRP/P3P4-PRP.md +0 -1388
  394. package/plan/001_d3bb02af4886/docs/PRP/P4P5-PRP.md +0 -1136
  395. package/plan/001_d3bb02af4886/docs/PRP/PRP.md +0 -527
  396. package/plan/001_d3bb02af4886/docs/PRP/bugfix/P1M1T2S1-PRP.md +0 -415
  397. package/plan/001_d3bb02af4886/docs/PRP/bugfix/P1M1T2S2-PRP.md +0 -378
  398. package/plan/001_d3bb02af4886/docs/PRP/bugfix/P1M1T2S4-PRP.md +0 -713
  399. package/plan/001_d3bb02af4886/docs/PRP/bugfix/P1M2T1S4-PRP.md +0 -370
  400. package/plan/001_d3bb02af4886/docs/PRP_P1M3T1S3.md +0 -499
  401. package/plan/001_d3bb02af4886/docs/TEST_RESULTS.md +0 -230
  402. package/plan/001_d3bb02af4886/docs/architecture/external_deps.md +0 -358
  403. package/plan/001_d3bb02af4886/docs/architecture/system_context.md +0 -242
  404. package/plan/001_d3bb02af4886/docs/bugfix/ANALYSIS_PRD_VS_IMPLEMENTATION.md +0 -1134
  405. package/plan/001_d3bb02af4886/docs/bugfix/GAP_ANALYSIS_SUMMARY.md +0 -179
  406. package/plan/001_d3bb02af4886/docs/bugfix/P1M4T2S1/PRP.md +0 -629
  407. package/plan/001_d3bb02af4886/docs/bugfix/P1M4T2S1/validation-report.md +0 -214
  408. package/plan/001_d3bb02af4886/docs/bugfix/PRP_P1M4T2S3.md +0 -629
  409. package/plan/001_d3bb02af4886/docs/bugfix/bugfix_PRP.md +0 -529
  410. package/plan/001_d3bb02af4886/docs/bugfix/bugfix_QUICK_REFERENCE.md +0 -142
  411. package/plan/001_d3bb02af4886/docs/bugfix/bugfix_README.md +0 -304
  412. package/plan/001_d3bb02af4886/docs/bugfix/bugfix_TEST_RESULTS.md +0 -558
  413. package/plan/001_d3bb02af4886/docs/bugfix/bugfix_VALIDATION_SUMMARY.md +0 -256
  414. package/plan/001_d3bb02af4886/docs/bugfix/system_context.md +0 -346
  415. package/plan/001_d3bb02af4886/docs/bugfix-architecture/bug_analysis.md +0 -415
  416. package/plan/001_d3bb02af4886/docs/bugfix-architecture/implementation_patterns.md +0 -489
  417. package/plan/001_d3bb02af4886/docs/bugfix-architecture/system_context.md +0 -218
  418. package/plan/001_d3bb02af4886/docs/bugfix_INITIATION_SUMMARY.md +0 -380
  419. package/plan/001_d3bb02af4886/docs/research/CYCLE_DETECTION_PATTERNS.md +0 -1923
  420. package/plan/001_d3bb02af4886/docs/research/CYCLE_DETECTION_QUICK_REF.md +0 -319
  421. package/plan/001_d3bb02af4886/docs/research/P1M1T2S1/codebase-context.md +0 -115
  422. package/plan/001_d3bb02af4886/docs/research/P1M1T2S1/cycle-detection-algorithms.md +0 -134
  423. package/plan/001_d3bb02af4886/docs/research/P1M1T2S1/test-patterns.md +0 -153
  424. package/plan/001_d3bb02af4886/docs/research/P1M1T2S1/workflow-class.md +0 -132
  425. package/plan/001_d3bb02af4886/docs/research/P1M2T1S4/DECORATOR_DOCUMENTATION_BEST_PRACTICES.md +0 -716
  426. package/plan/001_d3bb02af4886/docs/research/P1M2T1S4/DECORATOR_DOCUMENTATION_QUICK_REF.md +0 -186
  427. package/plan/001_d3bb02af4886/docs/research/P1M2T1S4/GROUNDSWELL_DECORATOR_EXAMPLES.md +0 -604
  428. package/plan/001_d3bb02af4886/docs/research/P1M2T1S4/INDEX.md +0 -213
  429. package/plan/001_d3bb02af4886/docs/research/P1M2T1S4/codebase_structure.md +0 -30
  430. package/plan/001_d3bb02af4886/docs/research/P1M2T1S4/existing_test_pattern.md +0 -56
  431. package/plan/001_d3bb02af4886/docs/research/P1M2T1S4/getRootObservers_implementation.md +0 -53
  432. package/plan/001_d3bb02af4886/docs/research/P1M2T1S4/test_conventions.md +0 -49
  433. package/plan/001_d3bb02af4886/docs/research/P1M3T1S4/PRP.md +0 -958
  434. package/plan/001_d3bb02af4886/docs/research/P1M3T1S4/QUICK_REFERENCE.md +0 -339
  435. package/plan/001_d3bb02af4886/docs/research/P1M3T1S4/README.md +0 -305
  436. package/plan/001_d3bb02af4886/docs/research/P1M3T1S4/SUMMARY.md +0 -433
  437. package/plan/001_d3bb02af4886/docs/research/P1M3T1S4/bidirectional-tree-consistency-testing.md +0 -1574
  438. package/plan/001_d3bb02af4886/docs/research/P1M3T1S4/test-pattern-examples.md +0 -1014
  439. package/plan/001_d3bb02af4886/docs/research/P1P2/LRU_CACHE_BEST_PRACTICES.md +0 -1929
  440. package/plan/001_d3bb02af4886/docs/research/P1P2/LRU_CACHE_CODE_PATTERNS.md +0 -857
  441. package/plan/001_d3bb02af4886/docs/research/P1P2/LRU_CACHE_INTEGRATION_GUIDE.md +0 -738
  442. package/plan/001_d3bb02af4886/docs/research/P1P2/LRU_CACHE_RESEARCH_INDEX.md +0 -424
  443. package/plan/001_d3bb02af4886/docs/research/P1P2/REFLECTION_INDEX.md +0 -291
  444. package/plan/001_d3bb02af4886/docs/research/P1P2/REFLECTION_RESEARCH_REPORT.md +0 -1342
  445. package/plan/001_d3bb02af4886/docs/research/P1P2/RESEARCH_SUMMARY.md +0 -342
  446. package/plan/001_d3bb02af4886/docs/research/P1P2/anthropic-sdk.md +0 -174
  447. package/plan/001_d3bb02af4886/docs/research/P1P2/async-local-storage.md +0 -200
  448. package/plan/001_d3bb02af4886/docs/research/P1P2/reflection-code-patterns.md +0 -1205
  449. package/plan/001_d3bb02af4886/docs/research/P1P2/reflection-decision-matrix.md +0 -421
  450. package/plan/001_d3bb02af4886/docs/research/P1P2/reflection-implementation-guide.md +0 -1341
  451. package/plan/001_d3bb02af4886/docs/research/P1P2/reflection-integration-guide.md +0 -834
  452. package/plan/001_d3bb02af4886/docs/research/P1P2/reflection-patterns.md +0 -1468
  453. package/plan/001_d3bb02af4886/docs/research/P1P2/reflection-quick-reference.md +0 -558
  454. package/plan/001_d3bb02af4886/docs/research/P1P2/zod-schema.md +0 -152
  455. package/plan/001_d3bb02af4886/docs/research/P3P4/caching-lru.md +0 -116
  456. package/plan/001_d3bb02af4886/docs/research/P3P4/introspection-tools.md +0 -177
  457. package/plan/001_d3bb02af4886/docs/research/P3P4/reflection-patterns.md +0 -117
  458. package/plan/001_d3bb02af4886/docs/research/P4P5/RESEARCH_SUMMARY.md +0 -151
  459. package/plan/001_d3bb02af4886/docs/research/PROMISE_ALLSETTLED_QUICK_REF.md +0 -376
  460. package/plan/001_d3bb02af4886/docs/research/PROMISE_ALLSETTLED_RESEARCH.md +0 -1507
  461. package/plan/001_d3bb02af4886/docs/research/bugfix_typescript_patterns.md +0 -949
  462. package/plan/001_d3bb02af4886/docs/research/error-testing-research.md +0 -619
  463. package/plan/001_d3bb02af4886/docs/research/error_handling_patterns.md +0 -723
  464. package/plan/001_d3bb02af4886/docs/research/general/INTROSPECTION_RESEARCH_SUMMARY.md +0 -378
  465. package/plan/001_d3bb02af4886/docs/research/general/README-INTROSPECTION.md +0 -352
  466. package/plan/001_d3bb02af4886/docs/research/general/agent-introspection-patterns.md +0 -1085
  467. package/plan/001_d3bb02af4886/docs/research/general/introspection-security-guide.md +0 -984
  468. package/plan/001_d3bb02af4886/docs/research/general/introspection-tool-examples.md +0 -875
  469. package/plan/001_d3bb02af4886/docs/research/incremental-tree-map-updates/PRP_TEMPLATE.md +0 -460
  470. package/plan/001_d3bb02af4886/docs/research/incremental-tree-map-updates/QUICK_REFERENCE.md +0 -324
  471. package/plan/001_d3bb02af4886/docs/research/incremental-tree-map-updates/README.md +0 -175
  472. package/plan/001_d3bb02af4886/docs/research/incremental-tree-map-updates/RESEARCH_REPORT.md +0 -499
  473. package/plan/001_d3bb02af4886/docs/research/incremental-tree-map-updates/SUMMARY.md +0 -163
  474. package/plan/001_d3bb02af4886/prd_snapshot.md +0 -543
  475. package/plan/bugfix/BUG_FIX_SUMMARY.md +0 -961
  476. package/scripts/generate-llms-full.ts +0 -206
  477. package/src/__tests__/adversarial/attachChild-performance.test.ts +0 -216
  478. package/src/__tests__/adversarial/circular-reference.test.ts +0 -101
  479. package/src/__tests__/adversarial/complex-circular-reference.test.ts +0 -139
  480. package/src/__tests__/adversarial/concurrent-task-failures.test.ts +0 -571
  481. package/src/__tests__/adversarial/deep-analysis.test.ts +0 -729
  482. package/src/__tests__/adversarial/deep-hierarchy-stress.test.ts +0 -213
  483. package/src/__tests__/adversarial/e2e-prd-validation.test.ts +0 -448
  484. package/src/__tests__/adversarial/edge-case.test.ts +0 -703
  485. package/src/__tests__/adversarial/error-merge-strategy.test.ts +0 -760
  486. package/src/__tests__/adversarial/incremental-performance.test.ts +0 -140
  487. package/src/__tests__/adversarial/node-map-update-benchmarks.test.ts +0 -457
  488. package/src/__tests__/adversarial/observer-propagation.test.ts +0 -487
  489. package/src/__tests__/adversarial/parent-validation.test.ts +0 -143
  490. package/src/__tests__/adversarial/prd-12-2-compliance.test.ts +0 -611
  491. package/src/__tests__/adversarial/prd-compliance.test.ts +0 -731
  492. package/src/__tests__/compatibility/backward-compatibility.test.ts +0 -1572
  493. package/src/__tests__/helpers/index.ts +0 -18
  494. package/src/__tests__/helpers/tree-verification.ts +0 -257
  495. package/src/__tests__/integration/agent-workflow.test.ts +0 -256
  496. package/src/__tests__/integration/bidirectional-consistency.test.ts +0 -847
  497. package/src/__tests__/integration/observer-logging.test.ts +0 -643
  498. package/src/__tests__/integration/tree-mirroring.test.ts +0 -151
  499. package/src/__tests__/integration/workflow-reparenting.test.ts +0 -303
  500. package/src/__tests__/unit/agent.test.ts +0 -169
  501. package/src/__tests__/unit/cache-key.test.ts +0 -182
  502. package/src/__tests__/unit/cache.test.ts +0 -172
  503. package/src/__tests__/unit/context.test.ts +0 -217
  504. package/src/__tests__/unit/decorators.test.ts +0 -100
  505. package/src/__tests__/unit/introspection-tools.test.ts +0 -277
  506. package/src/__tests__/unit/logger.test.ts +0 -293
  507. package/src/__tests__/unit/observable.test.ts +0 -321
  508. package/src/__tests__/unit/prompt.test.ts +0 -135
  509. package/src/__tests__/unit/reflection.test.ts +0 -210
  510. package/src/__tests__/unit/tree-debugger-incremental.test.ts +0 -170
  511. package/src/__tests__/unit/tree-debugger.test.ts +0 -85
  512. package/src/__tests__/unit/utils/workflow-error-utils.test.ts +0 -209
  513. package/src/__tests__/unit/workflow-detachChild.test.ts +0 -100
  514. package/src/__tests__/unit/workflow-emitEvent-childDetached.test.ts +0 -153
  515. package/src/__tests__/unit/workflow-isDescendantOf.test.ts +0 -180
  516. package/src/__tests__/unit/workflow.test.ts +0 -357
  517. package/src/cache/cache-key.ts +0 -244
  518. package/src/cache/cache.ts +0 -236
  519. package/src/core/agent.ts +0 -593
  520. package/src/core/event-tree.ts +0 -260
  521. package/src/core/logger.ts +0 -112
  522. package/src/core/mcp-handler.ts +0 -184
  523. package/src/core/prompt.ts +0 -150
  524. package/src/core/workflow-context.ts +0 -351
  525. package/src/core/workflow.ts +0 -540
  526. package/src/debugger/tree-debugger.ts +0 -255
  527. package/src/decorators/observed-state.ts +0 -95
  528. package/src/decorators/step.ts +0 -139
  529. package/src/decorators/task.ts +0 -159
  530. package/src/examples/tdd-orchestrator.ts +0 -65
  531. package/src/examples/test-cycle-workflow.ts +0 -64
  532. package/src/index.ts +0 -142
  533. package/src/reflection/reflection.ts +0 -407
  534. package/src/tools/index.ts +0 -36
  535. package/src/tools/introspection.ts +0 -464
  536. package/src/types/agent.ts +0 -90
  537. package/src/types/decorators.ts +0 -32
  538. package/src/types/error-strategy.ts +0 -13
  539. package/src/types/error.ts +0 -20
  540. package/src/types/events.ts +0 -75
  541. package/src/types/index.ts +0 -55
  542. package/src/types/logging.ts +0 -24
  543. package/src/types/observer.ts +0 -18
  544. package/src/types/prompt.ts +0 -40
  545. package/src/types/reflection.ts +0 -117
  546. package/src/types/sdk-primitives.ts +0 -128
  547. package/src/types/workflow-context.ts +0 -163
  548. package/src/types/workflow.ts +0 -37
  549. package/src/utils/id.ts +0 -11
  550. package/src/utils/index.ts +0 -4
  551. package/src/utils/observable.ts +0 -106
  552. package/src/utils/workflow-error-utils.ts +0 -56
  553. package/tsconfig.json +0 -22
  554. package/vitest.config.ts +0 -16
@@ -1,1205 +0,0 @@
1
- # AI Agent Reflection - Practical Code Patterns
2
-
3
- This document provides copy-paste-ready patterns for implementing reflection in TypeScript/JavaScript agents.
4
-
5
- ## Pattern 1: Simple Reflection Loop (Minimal)
6
-
7
- **Use Case**: Basic validation + single reflection pass
8
- **Lines of Code**: ~30
9
- **Tokens per attempt**: ~200-400
10
-
11
- ```typescript
12
- async function simpleReflection(task: string): Promise<string> {
13
- // Generate
14
- const response = await client.messages.create({
15
- model: "claude-opus-4.5",
16
- max_tokens: 1024,
17
- messages: [{ role: "user", content: task }],
18
- });
19
- const output = response.content[0].text || "";
20
-
21
- // Quick validation
22
- if (output.length < 50) {
23
- // Reflect and retry
24
- const improved = await client.messages.create({
25
- model: "claude-opus-4.5",
26
- max_tokens: 1024,
27
- messages: [
28
- {
29
- role: "user",
30
- content: `${task}\n\nYour previous response was too short. Provide a more detailed, comprehensive answer.`,
31
- },
32
- ],
33
- });
34
- return improved.content[0].text || output;
35
- }
36
-
37
- return output;
38
- }
39
- ```
40
-
41
- ---
42
-
43
- ## Pattern 2: Multi-Attempt Loop with History
44
-
45
- **Use Case**: Complex tasks needing intelligent retry
46
- **Lines of Code**: ~50
47
- **Tokens per attempt**: ~300-600
48
-
49
- ```typescript
50
- interface AttemptRecord {
51
- number: number;
52
- output: string;
53
- error: string | null;
54
- timestamp: Date;
55
- }
56
-
57
- async function multiAttemptReflection(
58
- task: string,
59
- maxAttempts: number = 3
60
- ): Promise<string> {
61
- const attempts: AttemptRecord[] = [];
62
-
63
- for (let i = 1; i <= maxAttempts; i++) {
64
- const historyContext =
65
- attempts.length > 0
66
- ? `\n\nPrevious attempts:\n${attempts
67
- .map((a) => `Attempt ${a.number}: ${a.error || "completed"}`)
68
- .join("\n")}\n`
69
- : "";
70
-
71
- const response = await client.messages.create({
72
- model: "claude-opus-4.5",
73
- max_tokens: 1024,
74
- messages: [
75
- {
76
- role: "user",
77
- content: `${task}${historyContext}`,
78
- },
79
- ],
80
- });
81
-
82
- const output = response.content[0].text || "";
83
- const validation = validateOutput(output);
84
-
85
- if (validation.isValid) {
86
- return output;
87
- }
88
-
89
- attempts.push({
90
- number: i,
91
- output,
92
- error: validation.errors[0],
93
- timestamp: new Date(),
94
- });
95
-
96
- // Request reflection if not on last attempt
97
- if (i < maxAttempts) {
98
- const reflection = await client.messages.create({
99
- model: "claude-opus-4.5",
100
- max_tokens: 300,
101
- messages: [
102
- {
103
- role: "user",
104
- content: `Task: ${task}\n\nYour attempt failed: ${validation.errors[0]}\n\nWhat should you try differently?`,
105
- },
106
- ],
107
- });
108
- console.log("Reflection:", reflection.content[0].text);
109
- }
110
- }
111
-
112
- throw new Error(
113
- `Failed after ${maxAttempts} attempts. Last error: ${
114
- attempts[attempts.length - 1].error
115
- }`
116
- );
117
- }
118
-
119
- function validateOutput(output: string): {
120
- isValid: boolean;
121
- errors: string[];
122
- } {
123
- const errors: string[] = [];
124
- if (output.length < 20) errors.push("Output too short");
125
- if (!output.includes(" ")) errors.push("No proper sentences");
126
- return { isValid: errors.length === 0, errors };
127
- }
128
- ```
129
-
130
- ---
131
-
132
- ## Pattern 3: Error-Triggered Reflection
133
-
134
- **Use Case**: Reflection only on detected failures
135
- **Lines of Code**: ~60
136
- **Tokens per attempt**: ~400-800
137
-
138
- ```typescript
139
- interface ReflectionContext {
140
- originalInput: string;
141
- failedOutput: string;
142
- errorType: "validation" | "execution" | "logic";
143
- errorMessage: string;
144
- }
145
-
146
- async function errorTriggeredReflection(
147
- task: string,
148
- executeTask: (input: string) => Promise<{ success: boolean; output: string; error?: string }>
149
- ): Promise<string> {
150
- let attempts = 0;
151
- const maxAttempts = 3;
152
-
153
- while (attempts < maxAttempts) {
154
- attempts++;
155
-
156
- // Generate solution
157
- const response = await client.messages.create({
158
- model: "claude-opus-4.5",
159
- max_tokens: 1024,
160
- messages: [{ role: "user", content: task }],
161
- });
162
- const solution = response.content[0].text || "";
163
-
164
- // Try to execute
165
- const execution = await executeTask(solution);
166
-
167
- if (execution.success) {
168
- return solution;
169
- }
170
-
171
- // Build reflection context
172
- const context: ReflectionContext = {
173
- originalInput: task,
174
- failedOutput: solution,
175
- errorType: detectErrorType(execution.error),
176
- errorMessage: execution.error || "Unknown error",
177
- };
178
-
179
- // Reflect on error
180
- if (attempts < maxAttempts) {
181
- const reflectionPrompt = buildReflectionPrompt(context);
182
- const reflectionResponse = await client.messages.create({
183
- model: "claude-opus-4.5",
184
- max_tokens: 400,
185
- messages: [{ role: "user", content: reflectionPrompt }],
186
- });
187
- const reflection = reflectionResponse.content[0].text || "";
188
- console.log(`Attempt ${attempts} - Reflection:\n${reflection}\n`);
189
-
190
- // Update task with reflection
191
- task = `${context.originalInput}\n\nPrevious approach didn't work because: ${context.errorMessage}\n\nReflection: ${reflection}\n\nTry again with a different strategy.`;
192
- }
193
- }
194
-
195
- throw new Error(
196
- `Failed after ${maxAttempts} attempts on task: ${task.substring(0, 100)}`
197
- );
198
- }
199
-
200
- function detectErrorType(
201
- error: string | undefined
202
- ): "validation" | "execution" | "logic" {
203
- if (!error) return "logic";
204
- if (error.includes("TypeError") || error.includes("SyntaxError"))
205
- return "execution";
206
- if (error.includes("assert") || error.includes("expect")) return "validation";
207
- return "logic";
208
- }
209
-
210
- function buildReflectionPrompt(context: ReflectionContext): string {
211
- return `Your solution failed with this error:
212
-
213
- ERROR TYPE: ${context.errorType}
214
- ERROR MESSAGE: ${context.errorMessage}
215
-
216
- Your attempted solution:
217
- ${context.failedOutput}
218
-
219
- Analyze:
220
- 1. Why did this approach fail?
221
- 2. What's a fundamentally different approach?
222
- 3. What assumption was wrong?
223
-
224
- Provide a new strategy to solve: ${context.originalInput}`;
225
- }
226
- ```
227
-
228
- ---
229
-
230
- ## Pattern 4: Instruction-Following Validation
231
-
232
- **Use Case**: Ensuring outputs meet explicit criteria
233
- **Lines of Code**: ~80
234
- **Tokens per attempt**: ~400-700
235
-
236
- ```typescript
237
- interface ValidationRule {
238
- name: string;
239
- description: string;
240
- validate: (output: string) => boolean;
241
- }
242
-
243
- interface ValidatedOutput {
244
- output: string;
245
- passedRules: string[];
246
- failedRules: string[];
247
- }
248
-
249
- async function validateWithReflection(
250
- task: string,
251
- rules: ValidationRule[],
252
- maxAttempts: number = 3
253
- ): Promise<string> {
254
- let output = "";
255
-
256
- for (let attempt = 1; attempt <= maxAttempts; attempt++) {
257
- // Generate
258
- const response = await client.messages.create({
259
- model: "claude-opus-4.5",
260
- max_tokens: 1024,
261
- messages: [
262
- {
263
- role: "user",
264
- content: buildGenerationPrompt(
265
- task,
266
- rules,
267
- attempt > 1
268
- ),
269
- },
270
- ],
271
- });
272
- output = response.content[0].text || "";
273
-
274
- // Validate
275
- const validation = validateOutput(output, rules);
276
- console.log(`Attempt ${attempt}: ${validation.passedRules.length}/${rules.length} rules passed`);
277
-
278
- if (validation.failedRules.length === 0) {
279
- return output;
280
- }
281
-
282
- // Reflect if not last attempt
283
- if (attempt < maxAttempts) {
284
- const reflection = await client.messages.create({
285
- model: "claude-opus-4.5",
286
- max_tokens: 400,
287
- messages: [
288
- {
289
- role: "user",
290
- content: buildReflectionPromptForValidation(
291
- task,
292
- output,
293
- validation.failedRules,
294
- rules
295
- ),
296
- },
297
- ],
298
- });
299
- console.log("Reflection:", reflection.content[0].text);
300
- }
301
- }
302
-
303
- throw new Error(
304
- `Validation failed after ${maxAttempts} attempts. ` +
305
- `Failed rules: ${failedRules.join(", ")}`
306
- );
307
- }
308
-
309
- function buildGenerationPrompt(
310
- task: string,
311
- rules: ValidationRule[],
312
- includeReminder: boolean = false
313
- ): string {
314
- const rulesText = rules
315
- .map((r) => `- ${r.name}: ${r.description}`)
316
- .join("\n");
317
-
318
- const reminderText = includeReminder
319
- ? "\n\nREMINDER: Your previous response violated some of these rules. This time, ensure ALL rules are satisfied."
320
- : "";
321
-
322
- return `Task: ${task}
323
-
324
- Your response MUST satisfy these rules:
325
- ${rulesText}${reminderText}`;
326
- }
327
-
328
- function validateOutput(
329
- output: string,
330
- rules: ValidationRule[]
331
- ): ValidatedOutput {
332
- const passedRules: string[] = [];
333
- const failedRules: string[] = [];
334
-
335
- for (const rule of rules) {
336
- if (rule.validate(output)) {
337
- passedRules.push(rule.name);
338
- } else {
339
- failedRules.push(rule.name);
340
- }
341
- }
342
-
343
- return { output, passedRules, failedRules };
344
- }
345
-
346
- function buildReflectionPromptForValidation(
347
- task: string,
348
- output: string,
349
- failedRules: string[],
350
- allRules: ValidationRule[]
351
- ): string {
352
- const failedRulesDetails = allRules
353
- .filter((r) => failedRules.includes(r.name))
354
- .map((r) => `- ${r.name}: ${r.description}`)
355
- .join("\n");
356
-
357
- return `Task: ${task}
358
-
359
- Your response violated these rules:
360
- ${failedRulesDetails}
361
-
362
- Your response was:
363
- ${output}
364
-
365
- What specific changes would make your response satisfy all rules?`;
366
- }
367
-
368
- // Example usage
369
- const rules: ValidationRule[] = [
370
- {
371
- name: "proper_grammar",
372
- description: "Response uses proper grammar and punctuation",
373
- validate: (output) => output.includes(".") || output.includes("?"),
374
- },
375
- {
376
- name: "min_length",
377
- description: "Response is at least 100 characters",
378
- validate: (output) => output.length >= 100,
379
- },
380
- {
381
- name: "structured_format",
382
- description: "Response uses clear formatting with sections",
383
- validate: (output) => output.includes("\n") && output.split("\n").length >= 3,
384
- },
385
- ];
386
-
387
- // const result = await validateWithReflection(
388
- // "Write about the benefits of reflection in AI",
389
- // rules,
390
- // 3
391
- // );
392
- ```
393
-
394
- ---
395
-
396
- ## Pattern 5: Confidence-Based Reflection
397
-
398
- **Use Case**: Reflect only when model is uncertain
399
- **Lines of Code**: ~70
400
- **Tokens per attempt**: ~500-1000
401
-
402
- ```typescript
403
- interface ConfidenceAssessment {
404
- output: string;
405
- confidence: number; // 0-1
406
- uncertaintyAreas: string[];
407
- suggestedAlternatives: string[];
408
- }
409
-
410
- async function confidenceBasedReflection(
411
- task: string,
412
- confidenceThreshold: number = 0.75
413
- ): Promise<string> {
414
- // First pass: generate and assess confidence
415
- const assessment = await generateWithConfidence(task);
416
-
417
- console.log(`Initial confidence: ${(assessment.confidence * 100).toFixed(0)}%`);
418
- console.log(`Uncertainty areas: ${assessment.uncertaintyAreas.join(", ")}`);
419
-
420
- // If confident enough, return immediately
421
- if (assessment.confidence >= confidenceThreshold) {
422
- console.log("Output meets confidence threshold, returning without reflection");
423
- return assessment.output;
424
- }
425
-
426
- // If not confident, reflect and improve
427
- console.log("Confidence below threshold, triggering reflection...");
428
- const improved = await reflectOnLowConfidence(
429
- task,
430
- assessment
431
- );
432
-
433
- return improved;
434
- }
435
-
436
- async function generateWithConfidence(
437
- task: string
438
- ): Promise<ConfidenceAssessment> {
439
- const response = await client.messages.create({
440
- model: "claude-opus-4.5",
441
- max_tokens: 1200,
442
- messages: [
443
- {
444
- role: "user",
445
- content: `${task}
446
-
447
- After providing your response, assess your own confidence by providing a JSON block:
448
- {
449
- "confidence": <0.0 to 1.0>,
450
- "uncertaintyAreas": ["area1", "area2"],
451
- "suggestedAlternatives": ["alternative1", "alternative2"]
452
- }
453
-
454
- Only provide JSON for the assessment, nothing else after it.`,
455
- },
456
- ],
457
- });
458
-
459
- const text = response.content[0].text || "";
460
- const jsonMatch = text.match(/\{[\s\S]*\}$/);
461
-
462
- if (!jsonMatch) {
463
- return {
464
- output: text,
465
- confidence: 0.5,
466
- uncertaintyAreas: [],
467
- suggestedAlternatives: [],
468
- };
469
- }
470
-
471
- const assessment = JSON.parse(jsonMatch[0]);
472
- return {
473
- output: text.substring(0, text.lastIndexOf("{")),
474
- confidence: assessment.confidence,
475
- uncertaintyAreas: assessment.uncertaintyAreas || [],
476
- suggestedAlternatives: assessment.suggestedAlternatives || [],
477
- };
478
- }
479
-
480
- async function reflectOnLowConfidence(
481
- task: string,
482
- assessment: ConfidenceAssessment
483
- ): Promise<string> {
484
- const response = await client.messages.create({
485
- model: "claude-opus-4.5",
486
- max_tokens: 1024,
487
- messages: [
488
- {
489
- role: "user",
490
- content: `Original task: ${task}
491
-
492
- Your previous response (confidence: ${(assessment.confidence * 100).toFixed(0)}%):
493
- ${assessment.output}
494
-
495
- You identified these uncertainty areas:
496
- ${assessment.uncertaintyAreas.map((a) => `- ${a}`).join("\n")}
497
-
498
- You considered these alternatives:
499
- ${assessment.suggestedAlternatives.map((a) => `- ${a}`).join("\n")}
500
-
501
- Given your identified uncertainties, provide an improved response that:
502
- 1. Directly addresses the uncertainty areas
503
- 2. Is more thorough and robust
504
- 3. Includes more detail or evidence
505
- 4. Considers the alternatives you mentioned
506
-
507
- Provide your improved response, then a brief confidence assessment (0-1).`,
508
- },
509
- ],
510
- });
511
-
512
- return response.content[0].text || "";
513
- }
514
- ```
515
-
516
- ---
517
-
518
- ## Pattern 6: Tool-Feedback Reflection (Code)
519
-
520
- **Use Case**: Reflection based on test/lint results
521
- **Lines of Code**: ~90
522
- **Tokens per attempt**: ~600-1200
523
-
524
- ```typescript
525
- interface CodeFeedback {
526
- type: "syntax" | "lint" | "test" | "runtime";
527
- message: string;
528
- severity: "error" | "warning";
529
- }
530
-
531
- async function codeGenerationWithReflection(
532
- requirement: string,
533
- maxAttempts: number = 3
534
- ): Promise<string> {
535
- let code = "";
536
- const feedback: CodeFeedback[] = [];
537
-
538
- for (let attempt = 1; attempt <= maxAttempts; attempt++) {
539
- // Generate code
540
- const response = await client.messages.create({
541
- model: "claude-opus-4.5",
542
- max_tokens: 2048,
543
- messages: [
544
- {
545
- role: "user",
546
- content: buildCodeGenerationPrompt(
547
- requirement,
548
- feedback,
549
- attempt
550
- ),
551
- },
552
- ],
553
- });
554
-
555
- code = extractCode(response.content[0].text || "");
556
-
557
- // Get feedback
558
- const newFeedback = await getCodeFeedback(code);
559
-
560
- if (newFeedback.length === 0) {
561
- console.log(`Code passed on attempt ${attempt}`);
562
- return code;
563
- }
564
-
565
- feedback.push(...newFeedback);
566
- console.log(
567
- `Attempt ${attempt}: ${newFeedback.length} issues found`
568
- );
569
-
570
- // Request reflection if not last attempt
571
- if (attempt < maxAttempts) {
572
- const reflection = await client.messages.create({
573
- model: "claude-opus-4.5",
574
- max_tokens: 400,
575
- messages: [
576
- {
577
- role: "user",
578
- content: buildCodeReflectionPrompt(
579
- requirement,
580
- code,
581
- newFeedback
582
- ),
583
- },
584
- ],
585
- });
586
- console.log("Reflection:", reflection.content[0].text);
587
- }
588
- }
589
-
590
- throw new Error(
591
- `Code generation failed after ${maxAttempts} attempts with ${feedback.length} issues`
592
- );
593
- }
594
-
595
- function buildCodeGenerationPrompt(
596
- requirement: string,
597
- previousFeedback: CodeFeedback[],
598
- attempt: number
599
- ): string {
600
- const feedbackText =
601
- previousFeedback.length > 0
602
- ? `\n\nPrevious issues found:\n${previousFeedback
603
- .map(
604
- (f) =>
605
- `[${f.severity.toUpperCase()}] ${f.type}: ${f.message}`
606
- )
607
- .join("\n")}\n\nFix these issues in your new response.`
608
- : "";
609
-
610
- return `Generate TypeScript/JavaScript code for:
611
- ${requirement}${feedbackText}
612
-
613
- Requirements:
614
- - Use modern TypeScript (5.2+)
615
- - Include proper type annotations
616
- - Include error handling
617
- - Include comments for complex logic
618
- - Be production-ready`;
619
- }
620
-
621
- async function getCodeFeedback(code: string): Promise<CodeFeedback[]> {
622
- const feedback: CodeFeedback[] = [];
623
-
624
- // Syntax check
625
- try {
626
- // Basic syntax validation (would use ts-node or similar in real implementation)
627
- eval(code);
628
- } catch (e) {
629
- feedback.push({
630
- type: "syntax",
631
- message: String(e),
632
- severity: "error",
633
- });
634
- }
635
-
636
- // Lint checks (would use eslint in real implementation)
637
- if (!code.includes("://") && code.includes("http")) {
638
- feedback.push({
639
- type: "lint",
640
- message: "URL should be quoted string",
641
- severity: "warning",
642
- });
643
- }
644
-
645
- // Complexity check
646
- const lines = code.split("\n").length;
647
- if (lines > 100) {
648
- feedback.push({
649
- type: "lint",
650
- message: "Function is too long, consider breaking it up",
651
- severity: "warning",
652
- });
653
- }
654
-
655
- return feedback;
656
- }
657
-
658
- function buildCodeReflectionPrompt(
659
- requirement: string,
660
- code: string,
661
- feedback: CodeFeedback[]
662
- ): string {
663
- return `Requirement: ${requirement}
664
-
665
- Your code had these issues:
666
- ${feedback.map((f) => `[${f.severity.toUpperCase()}] ${f.type}: ${f.message}`).join("\n")}
667
-
668
- Current code:
669
- ${code}
670
-
671
- What specific changes would address these issues? Focus on:
672
- 1. The root cause of each issue
673
- 2. How to fix it without breaking functionality`;
674
- }
675
-
676
- function extractCode(text: string): string {
677
- // Extract code from markdown code blocks
678
- const codeBlockMatch = text.match(/```(?:typescript|javascript)?\n([\s\S]*?)\n```/);
679
- if (codeBlockMatch) {
680
- return codeBlockMatch[1];
681
- }
682
- return text;
683
- }
684
- ```
685
-
686
- ---
687
-
688
- ## Pattern 7: Multi-Agent Reflection (Generator + Critic)
689
-
690
- **Use Case**: Higher quality through dialogue between agents
691
- **Lines of Code**: ~100
692
- **Tokens per attempt**: ~800-1600
693
-
694
- ```typescript
695
- interface CritiqueResult {
696
- isSatisfactory: boolean;
697
- strengths: string[];
698
- weaknesses: string[];
699
- suggestions: string[];
700
- }
701
-
702
- class GeneratorCriticReflection {
703
- private client: LLMClient;
704
- private maxRounds: number;
705
-
706
- constructor(client: LLMClient, maxRounds: number = 3) {
707
- this.client = client;
708
- this.maxRounds = maxRounds;
709
- }
710
-
711
- async generate(task: string): Promise<string> {
712
- let output = await this.generatorPass(task);
713
-
714
- for (let round = 1; round < this.maxRounds; round++) {
715
- const critique = await this.criticPass(task, output);
716
-
717
- if (critique.isSatisfactory) {
718
- console.log(`✓ Critique satisfied on round ${round}`);
719
- return output;
720
- }
721
-
722
- console.log(`Round ${round} critique:`, critique.weaknesses);
723
- output = await this.generatorImprove(
724
- task,
725
- output,
726
- critique
727
- );
728
- }
729
-
730
- return output;
731
- }
732
-
733
- private async generatorPass(task: string): Promise<string> {
734
- const response = await this.client.messages.create({
735
- model: "claude-opus-4.5",
736
- max_tokens: 1024,
737
- messages: [{ role: "user", content: task }],
738
- });
739
- return response.content[0].text || "";
740
- }
741
-
742
- private async generatorImprove(
743
- task: string,
744
- previousOutput: string,
745
- critique: CritiqueResult
746
- ): Promise<string> {
747
- const response = await this.client.messages.create({
748
- model: "claude-opus-4.5",
749
- max_tokens: 1024,
750
- messages: [
751
- {
752
- role: "user",
753
- content: `Task: ${task}
754
-
755
- Previous output:
756
- ${previousOutput}
757
-
758
- Critique feedback:
759
- Weaknesses: ${critique.weaknesses.join("; ")}
760
- Suggestions: ${critique.suggestions.join("; ")}
761
-
762
- Provide an improved version that addresses all the feedback.`,
763
- },
764
- ],
765
- });
766
- return response.content[0].text || "";
767
- }
768
-
769
- private async criticPass(
770
- task: string,
771
- output: string
772
- ): Promise<CritiqueResult> {
773
- const response = await this.client.messages.create({
774
- model: "claude-opus-4.5",
775
- max_tokens: 600,
776
- messages: [
777
- {
778
- role: "user",
779
- content: `You are a critical reviewer.
780
-
781
- Task: ${task}
782
-
783
- Response to critique:
784
- ${output}
785
-
786
- Provide a JSON critique:
787
- {
788
- "isSatisfactory": boolean,
789
- "strengths": ["strength1", "strength2"],
790
- "weaknesses": ["weakness1", "weakness2"],
791
- "suggestions": ["suggestion1", "suggestion2"]
792
- }
793
-
794
- Respond with ONLY the JSON object.`,
795
- },
796
- ],
797
- });
798
-
799
- const text = response.content[0].text || "{}";
800
- try {
801
- return JSON.parse(text);
802
- } catch {
803
- return {
804
- isSatisfactory: true,
805
- strengths: [],
806
- weaknesses: [],
807
- suggestions: [],
808
- };
809
- }
810
- }
811
- }
812
-
813
- // Usage
814
- // const gc = new GeneratorCriticReflection(client, 3);
815
- // const result = await gc.generate("Write an essay on AI reflection");
816
- ```
817
-
818
- ---
819
-
820
- ## Pattern 8: State-Aware Reflection with History
821
-
822
- **Use Case**: Learning from previous attempts within workflow
823
- **Lines of Code**: ~110
824
- **Tokens per attempt**: ~700-1400
825
-
826
- ```typescript
827
- interface ExecutionState {
828
- taskId: string;
829
- attempt: number;
830
- previousAttempts: Array<{
831
- output: string;
832
- result: "success" | "failed";
833
- reason: string;
834
- timestamp: Date;
835
- }>;
836
- currentError: string | null;
837
- succeededApproaches: string[];
838
- failedApproaches: string[];
839
- }
840
-
841
- async function stateAwareReflection(
842
- task: string,
843
- state: ExecutionState,
844
- maxAttempts: number = 3
845
- ): Promise<string> {
846
- while (state.attempt < maxAttempts) {
847
- state.attempt++;
848
-
849
- // Generate solution informed by history
850
- const solution = await generateInformedSolution(
851
- task,
852
- state
853
- );
854
-
855
- // Try to execute
856
- const result = await executeAndValidate(solution);
857
-
858
- if (result.success) {
859
- // Record success
860
- state.previousAttempts.push({
861
- output: solution,
862
- result: "success",
863
- reason: "Execution passed all checks",
864
- timestamp: new Date(),
865
- });
866
- state.succeededApproaches.push(result.approachUsed);
867
- return solution;
868
- }
869
-
870
- // Record failure
871
- state.previousAttempts.push({
872
- output: solution,
873
- result: "failed",
874
- reason: result.error,
875
- timestamp: new Date(),
876
- });
877
- state.failedApproaches.push(result.approachUsed);
878
- state.currentError = result.error;
879
-
880
- // Reflect before next attempt
881
- if (state.attempt < maxAttempts) {
882
- const reflection = await reflectWithState(
883
- task,
884
- solution,
885
- result.error,
886
- state
887
- );
888
- console.log(`Attempt ${state.attempt} reflection:`, reflection);
889
- }
890
- }
891
-
892
- throw new Error(
893
- `Task failed after ${maxAttempts} attempts. ` +
894
- `Last error: ${state.currentError}`
895
- );
896
- }
897
-
898
- async function generateInformedSolution(
899
- task: string,
900
- state: ExecutionState
901
- ): Promise<string> {
902
- const historyContext = buildHistoryContext(state);
903
-
904
- const response = await client.messages.create({
905
- model: "claude-opus-4.5",
906
- max_tokens: 1024,
907
- messages: [
908
- {
909
- role: "user",
910
- content: `${task}${historyContext}`,
911
- },
912
- ],
913
- });
914
-
915
- return response.content[0].text || "";
916
- }
917
-
918
- function buildHistoryContext(state: ExecutionState): string {
919
- if (state.previousAttempts.length === 0) {
920
- return "";
921
- }
922
-
923
- const succeeded =
924
- state.succeededApproaches.length > 0
925
- ? `\n\nApproaches that worked: ${state.succeededApproaches.join(", ")}`
926
- : "";
927
-
928
- const failed =
929
- state.failedApproaches.length > 0
930
- ? `\nApproaches that failed: ${state.failedApproaches.join(", ")}`
931
- : "";
932
-
933
- const recent = state.previousAttempts
934
- .slice(-2)
935
- .map(
936
- (a) =>
937
- `Attempt ${a.previousAttempts.length}: ${a.result} (${a.reason})`
938
- )
939
- .join("\n");
940
-
941
- return `${succeeded}${failed}\n\nRecent attempts:\n${recent}\n\nFor this attempt, try a different approach from what failed before.`;
942
- }
943
-
944
- async function reflectWithState(
945
- task: string,
946
- solution: string,
947
- error: string,
948
- state: ExecutionState
949
- ): Promise<string> {
950
- const response = await client.messages.create({
951
- model: "claude-opus-4.5",
952
- max_tokens: 400,
953
- messages: [
954
- {
955
- role: "user",
956
- content: `Task: ${task}
957
-
958
- Attempt ${state.attempt} failed with: ${error}
959
-
960
- Your attempted solution:
961
- ${solution}
962
-
963
- What different approach should we try next?
964
- - What assumptions was this approach based on?
965
- - How could those assumptions be wrong?
966
- - What fundamentally different strategy exists?`,
967
- },
968
- ],
969
- });
970
-
971
- return response.content[0].text || "";
972
- }
973
-
974
- async function executeAndValidate(solution: string): Promise<{
975
- success: boolean;
976
- error: string;
977
- approachUsed: string;
978
- }> {
979
- // Mock implementation - would be actual execution
980
- try {
981
- // Execute solution (parse, validate, run, etc.)
982
- return {
983
- success: true,
984
- error: "",
985
- approachUsed: "web_search_approach",
986
- };
987
- } catch (e) {
988
- return {
989
- success: false,
990
- error: String(e),
991
- approachUsed: "web_search_approach",
992
- };
993
- }
994
- }
995
- ```
996
-
997
- ---
998
-
999
- ## Pattern 9: Low-Token Reflection (Budget-Conscious)
1000
-
1001
- **Use Case**: Reflection with minimal token overhead
1002
- **Lines of Code**: ~40
1003
- **Tokens per attempt**: ~150-300
1004
-
1005
- ```typescript
1006
- async function budgetConsciousReflection(
1007
- task: string,
1008
- tokenBudget: number = 1000
1009
- ): Promise<string> {
1010
- let tokensUsed = 0;
1011
- let output = "";
1012
-
1013
- // Initial generation
1014
- const gen1 = await client.messages.create({
1015
- model: "claude-haiku-4.5", // Cheaper model
1016
- max_tokens: Math.min(500, tokenBudget - 200),
1017
- messages: [{ role: "user", content: task }],
1018
- });
1019
-
1020
- output = gen1.content[0].text || "";
1021
- tokensUsed += gen1.usage?.input_tokens || 0;
1022
- tokensUsed += gen1.usage?.output_tokens || 0;
1023
-
1024
- if (tokensUsed + 200 > tokenBudget) {
1025
- return output;
1026
- }
1027
-
1028
- // Lightweight reflection
1029
- const reflection = await client.messages.create({
1030
- model: "claude-haiku-4.5",
1031
- max_tokens: Math.min(300, tokenBudget - tokensUsed - 100),
1032
- messages: [
1033
- {
1034
- role: "user",
1035
- content: `Review this response for errors (brief 1-2 sentence assessment):\n\n${output.substring(
1036
- 0,
1037
- 500
1038
- )}...`,
1039
- },
1040
- ],
1041
- });
1042
-
1043
- tokensUsed +=
1044
- reflection.usage?.input_tokens || 0;
1045
- tokensUsed +=
1046
- reflection.usage?.output_tokens || 0;
1047
-
1048
- // If still within budget and issues found, do one quick pass
1049
- const reflectionText = reflection.content[0].text || "";
1050
- if (
1051
- tokensUsed + 200 <= tokenBudget &&
1052
- reflectionText.toLowerCase().includes("error")
1053
- ) {
1054
- const fix = await client.messages.create({
1055
- model: "claude-haiku-4.5",
1056
- max_tokens: 300,
1057
- messages: [
1058
- {
1059
- role: "user",
1060
- content: `Issue: ${reflectionText}\n\nOriginal response: ${output}\n\nQuick fix:`,
1061
- },
1062
- ],
1063
- });
1064
-
1065
- output = fix.content[0].text || output;
1066
- }
1067
-
1068
- return output;
1069
- }
1070
- ```
1071
-
1072
- ---
1073
-
1074
- ## Pattern 10: Timeout-Safe Reflection
1075
-
1076
- **Use Case**: Reflection with guaranteed completion
1077
- **Lines of Code**: ~60
1078
- **Tokens per attempt**: Variable
1079
-
1080
- ```typescript
1081
- interface TimeoutAwareReflectionOptions {
1082
- initialTimeout: number; // ms for first attempt
1083
- maxTotalTime: number; // ms for entire reflection
1084
- reflectionTime: number; // ms budget per reflection
1085
- }
1086
-
1087
- async function timeoutSafeReflection(
1088
- task: string,
1089
- options: TimeoutAwareReflectionOptions
1090
- ): Promise<string> {
1091
- const startTime = Date.now();
1092
- const deadline = startTime + options.maxTotalTime;
1093
- let output = "";
1094
-
1095
- try {
1096
- // First attempt with time limit
1097
- output = await withTimeout(
1098
- generateResponse(task),
1099
- options.initialTimeout
1100
- );
1101
- return output;
1102
- } catch (e) {
1103
- // Generation failed or timed out: give up only if the overall deadline has passed; otherwise fall through to reflection
1104
- if (Date.now() > deadline) {
1105
- throw new Error("Timeout exceeded during generation");
1106
- }
1107
- }
1108
-
1109
- // Reflection (only if time permits)
1110
- const timeRemaining = deadline - Date.now();
1111
- if (timeRemaining < 500) {
1112
- // Less than 500ms left, don't reflect
1113
- return output;
1114
- }
1115
-
1116
- try {
1117
- const reflection = await withTimeout(
1118
- reflectOnOutput(task, output),
1119
- Math.min(options.reflectionTime, timeRemaining - 100)
1120
- );
1121
- return reflection;
1122
- } catch (e) {
1123
- // Reflection failed or timed out, return what we have
1124
- console.warn("Reflection timed out or failed, returning original output");
1125
- return output;
1126
- }
1127
- }
1128
-
1129
- async function withTimeout<T>(
1130
- promise: Promise<T>,
1131
- timeoutMs: number
1132
- ): Promise<T> {
1133
- return Promise.race([
1134
- promise,
1135
- new Promise<T>((_, reject) =>
1136
- setTimeout(
1137
- () => reject(new Error(`Operation timed out after ${timeoutMs}ms`)),
1138
- timeoutMs
1139
- )
1140
- ),
1141
- ]);
1142
- }
1143
-
1144
- async function generateResponse(task: string): Promise<string> {
1145
- const response = await client.messages.create({
1146
- model: "claude-opus-4.5",
1147
- max_tokens: 1024,
1148
- messages: [{ role: "user", content: task }],
1149
- });
1150
- return response.content[0].text || "";
1151
- }
1152
-
1153
- async function reflectOnOutput(
1154
- task: string,
1155
- output: string
1156
- ): Promise<string> {
1157
- const response = await client.messages.create({
1158
- model: "claude-opus-4.5",
1159
- max_tokens: 400,
1160
- messages: [
1161
- {
1162
- role: "user",
1163
- content: `Quickly review and improve:\n\nTask: ${task}\n\nResponse: ${output}`,
1164
- },
1165
- ],
1166
- });
1167
- return response.content[0].text || output;
1168
- }
1169
- ```
1170
-
1171
- ---
1172
-
1173
- ## Quick Reference: Pattern Selection
1174
-
1175
- | Pattern | Best For | Tokens/Attempt | Latency |
1176
- |---------|----------|------------------|---------|
1177
- | Simple (1) | Basic validation | 200-400 | +200ms |
1178
- | Multi-Attempt (2) | Complex tasks | 300-600 | +400ms |
1179
- | Error-Triggered (3) | Execution errors | 400-800 | +500ms |
1180
- | IFE Validation (4) | Explicit rules | 400-700 | +400ms |
1181
- | Confidence (5) | Uncertain output | 500-1000 | +600ms |
1182
- | Tool-Feedback (6) | Code/tests | 600-1200 | +800ms |
1183
- | Multi-Agent (7) | High quality | 800-1600 | +1000ms |
1184
- | State-Aware (8) | Learning workflows | 700-1400 | +700ms |
1185
- | Budget-Conscious (9) | Limited tokens | 150-300 | +200ms |
1186
- | Timeout-Safe (10) | Time constraints | Variable | Bounded by configured timeouts |
1187
-
1188
- ---
1189
-
1190
- ## Implementation Checklist
1191
-
1192
- When implementing reflection patterns:
1193
-
1194
- - [ ] Define success criteria (not vague goals)
1195
- - [ ] Set max retry limit (typically 3-5)
1196
- - [ ] Capture error context before reflection
1197
- - [ ] Implement exponential backoff for transient errors
1198
- - [ ] Use state deduplication to detect loops
1199
- - [ ] Include cost/token tracking
1200
- - [ ] Log all attempts and reflections
1201
- - [ ] Test with both success and failure paths
1202
- - [ ] Monitor reflection effectiveness (did it help?)
1203
- - [ ] Consider latency impact on user experience
1204
- - [ ] Plan graceful degradation if reflection fails
1205
-