@chongyan/autospec 1.0.2 → 1.0.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (688) hide show
  1. package/LICENSE +240 -21
  2. package/README.md +47 -608
  3. package/dist/README.md +47 -0
  4. package/dist/adapters/claude-code/README.md.enc +6 -0
  5. package/dist/adapters/claude-code/agents.js +1 -0
  6. package/dist/adapters/claude-code/commands.config.js +1 -0
  7. package/dist/adapters/claude-code/commands.js +1 -0
  8. package/dist/adapters/claude-code/hooks.config.js +2 -0
  9. package/dist/adapters/claude-code/hooks.js +1 -0
  10. package/dist/adapters/claude-code/install.js +1 -0
  11. package/dist/adapters/claude-code/skills.js +1 -0
  12. package/dist/adapters/codex/README.md.enc +6 -0
  13. package/dist/adapters/codex/hooks/pre-commit.sh +10 -0
  14. package/dist/adapters/codex/install.js +1 -0
  15. package/dist/adapters/codex/prompts/env-learn.md.enc +6 -0
  16. package/dist/adapters/codex/prompts/review.md.enc +6 -0
  17. package/dist/adapters/codex/wrappers/autospec-cli.sh +118 -0
  18. package/dist/adapters/codex/wrappers/parallel.sh +20 -0
  19. package/dist/adapters/codex/wrappers/post-task.sh +138 -0
  20. package/dist/bin/autospec.js +2 -0
  21. package/dist/knowledge/README.md.enc +6 -0
  22. package/dist/knowledge/change-management.md.enc +6 -0
  23. package/dist/knowledge/cognition-engine.md.enc +6 -0
  24. package/dist/knowledge/config/baseline-permissions.md.enc +6 -0
  25. package/dist/knowledge/config/external-mounts.yaml.enc +6 -0
  26. package/dist/knowledge/config/model-profiles.yaml.enc +6 -0
  27. package/dist/knowledge/config/role-composition.yaml.enc +6 -0
  28. package/dist/knowledge/config/token-optimization.yaml.enc +6 -0
  29. package/dist/knowledge/config/validation-patterns.yaml.enc +6 -0
  30. package/dist/knowledge/constitution.md.enc +6 -0
  31. package/dist/knowledge/core-rules.md.enc +6 -0
  32. package/dist/knowledge/environment/adapters/README.md.enc +6 -0
  33. package/dist/knowledge/environment/detection-patterns.yaml.enc +6 -0
  34. package/dist/knowledge/environment/failure-patterns.json +223 -0
  35. package/dist/knowledge/environment/repair-strategies.json +206 -0
  36. package/dist/knowledge/memory/README.md.enc +6 -0
  37. package/dist/knowledge/memory/field/README.md.enc +6 -0
  38. package/dist/knowledge/memory/project/decisions/README.md.enc +6 -0
  39. package/dist/knowledge/memory/project/evolution-log.md.enc +6 -0
  40. package/dist/knowledge/memory/project/health-metrics.md.enc +6 -0
  41. package/dist/knowledge/memory/team/best-practices.md.enc +6 -0
  42. package/dist/knowledge/pipeline/code.md.enc +6 -0
  43. package/dist/knowledge/pipeline/explore.md.enc +6 -0
  44. package/dist/knowledge/pipeline/plan.md.enc +6 -0
  45. package/dist/knowledge/pipeline/protocol.md.enc +6 -0
  46. package/dist/knowledge/protocol/capabilities.yaml.enc +6 -0
  47. package/dist/knowledge/protocol/evolve-integration.md.enc +6 -0
  48. package/dist/knowledge/skills/README.md.enc +6 -0
  49. package/dist/knowledge/skills/adversarial-review.md.enc +6 -0
  50. package/dist/knowledge/skills/analyze-requirement.md.enc +6 -0
  51. package/dist/knowledge/skills/channel-operations.md.enc +6 -0
  52. package/dist/knowledge/skills/content-operations.md.enc +6 -0
  53. package/dist/knowledge/skills/content-prompts.md.enc +6 -0
  54. package/dist/knowledge/skills/conversion-optimization.md.enc +6 -0
  55. package/dist/knowledge/skills/data-operations.md.enc +6 -0
  56. package/dist/knowledge/skills/design-solution.md.enc +6 -0
  57. package/dist/knowledge/skills/growth-strategies.md.enc +6 -0
  58. package/dist/knowledge/skills/implement-code.md.enc +6 -0
  59. package/dist/knowledge/skills/knowledge-distill.md.enc +6 -0
  60. package/dist/knowledge/skills/parallel-dev.md.enc +6 -0
  61. package/dist/knowledge/skills/private-domain-traffic.md.enc +6 -0
  62. package/dist/knowledge/skills/skill-format.md.enc +6 -0
  63. package/dist/knowledge/skills/social-commerce.md.enc +6 -0
  64. package/dist/knowledge/skills/team-orchestration.md.enc +6 -0
  65. package/dist/knowledge/skills/unified-review.md.enc +6 -0
  66. package/dist/knowledge/skills/user-operations.md.enc +6 -0
  67. package/dist/knowledge/templates/autospec-config.yaml.enc +6 -0
  68. package/dist/knowledge/templates/smoke-test.md.enc +6 -0
  69. package/dist/knowledge/templates/spec/SPEC.md.enc +6 -0
  70. package/dist/knowledge/templates/spec/layers/delta.md.enc +6 -0
  71. package/dist/knowledge/templates/spec/layers/how.md.enc +6 -0
  72. package/dist/knowledge/templates/spec/layers/plan.md.enc +6 -0
  73. package/dist/knowledge/templates/spec/layers/what.md.enc +6 -0
  74. package/dist/knowledge/templates/spec/layers/why.md.enc +6 -0
  75. package/dist/knowledge/templates/wiki/catalog.yaml.enc +6 -0
  76. package/dist/knowledge/templates/wiki/content.md.enc +6 -0
  77. package/dist/knowledge/templates/wiki/meta.yaml.enc +6 -0
  78. package/dist/package.json +54 -0
  79. package/{plugins → dist/plugins}/.claude-plugin/plugin.json +259 -101
  80. package/dist/plugins/agents/roles/ai-engineer.md.enc +6 -0
  81. package/dist/plugins/agents/roles/backend-engineer.md.enc +6 -0
  82. package/dist/plugins/agents/roles/ceo.md.enc +6 -0
  83. package/dist/plugins/agents/roles/channel-ops.md.enc +6 -0
  84. package/dist/plugins/agents/roles/content-ops.md.enc +6 -0
  85. package/dist/plugins/agents/roles/conversion-ops.md.enc +6 -0
  86. package/dist/plugins/agents/roles/data-engineer.md.enc +6 -0
  87. package/dist/plugins/agents/roles/data-ops.md.enc +6 -0
  88. package/dist/plugins/agents/roles/devops-engineer.md.enc +6 -0
  89. package/dist/plugins/agents/roles/frontend-engineer.md.enc +6 -0
  90. package/dist/plugins/agents/roles/marketing-director.md.enc +6 -0
  91. package/dist/plugins/agents/roles/operations-director.md.enc +6 -0
  92. package/dist/plugins/agents/roles/private-traffic.md.enc +6 -0
  93. package/dist/plugins/agents/roles/product-owner.md.enc +6 -0
  94. package/dist/plugins/agents/roles/quality-engineer.md.enc +6 -0
  95. package/dist/plugins/agents/roles/security-engineer.md.enc +6 -0
  96. package/dist/plugins/agents/roles/tech-lead.md.enc +6 -0
  97. package/dist/plugins/agents/roles/user-ops.md.enc +6 -0
  98. package/dist/plugins/agents/support/blind-comparator.md.enc +6 -0
  99. package/dist/plugins/agents/support/consistency-checker.md.enc +6 -0
  100. package/dist/plugins/agents/support/experiment-evaluator.md.enc +6 -0
  101. package/dist/plugins/agents/support/failure-diagnostician.md.enc +6 -0
  102. package/dist/plugins/agents/support/independent-reviewer.md.enc +6 -0
  103. package/dist/plugins/agents/support/memory-curator.md.enc +6 -0
  104. package/dist/plugins/agents/support/monitoring-agent.md.enc +6 -0
  105. package/dist/plugins/agents/support/safety-auditor.md.enc +6 -0
  106. package/dist/plugins/agents/support/skill-benchmarker.md.enc +6 -0
  107. package/dist/plugins/agents/support/skill-forger.md.enc +6 -0
  108. package/dist/plugins/agents/support/stage-gate-evaluator.md.enc +6 -0
  109. package/dist/plugins/agents/support/team-orchestrator.md.enc +6 -0
  110. package/dist/plugins/agents/support/test-coverage-reviewer.md.enc +6 -0
  111. package/dist/plugins/benchmarks/templates/README.md.enc +6 -0
  112. package/dist/plugins/benchmarks/templates/commands/code-template.yaml.enc +6 -0
  113. package/dist/plugins/benchmarks/templates/commands/explore-template.yaml.enc +6 -0
  114. package/dist/plugins/benchmarks/templates/commands/field-evolve-template.yaml.enc +6 -0
  115. package/dist/plugins/benchmarks/templates/commands/plan-template.yaml.enc +6 -0
  116. package/dist/plugins/benchmarks/templates/commands/project-evolve-template.yaml.enc +6 -0
  117. package/dist/plugins/benchmarks/templates/commands/review-template.yaml.enc +6 -0
  118. package/dist/plugins/benchmarks/templates/commands/run-template.yaml.enc +6 -0
  119. package/dist/plugins/benchmarks/templates/skills/benchmark-executor-template.yaml.enc +6 -0
  120. package/dist/plugins/benchmarks/templates/skills/benchmark-generator-template.yaml.enc +6 -0
  121. package/dist/plugins/benchmarks/templates/skills/delivery-stage-template.yaml.enc +6 -0
  122. package/dist/plugins/benchmarks/templates/skills/design-stage-template.yaml.enc +6 -0
  123. package/dist/plugins/benchmarks/templates/skills/exploration-phase-template.yaml.enc +6 -0
  124. package/dist/plugins/benchmarks/templates/skills/field-evolve-analyzer-template.yaml.enc +6 -0
  125. package/dist/plugins/benchmarks/templates/skills/field-evolve-distiller-template.yaml.enc +6 -0
  126. package/dist/plugins/benchmarks/templates/skills/field-evolve-executor-template.yaml.enc +6 -0
  127. package/dist/plugins/benchmarks/templates/skills/field-evolve-fixer-template.yaml.enc +6 -0
  128. package/dist/plugins/benchmarks/templates/skills/field-evolve-learner-template.yaml.enc +6 -0
  129. package/dist/plugins/benchmarks/templates/skills/field-evolve-scanner-template.yaml.enc +6 -0
  130. package/dist/plugins/benchmarks/templates/skills/field-evolve-template.yaml.enc +6 -0
  131. package/dist/plugins/benchmarks/templates/skills/field-evolve-verifier-template.yaml.enc +6 -0
  132. package/dist/plugins/benchmarks/templates/skills/implementation-stage-template.yaml.enc +6 -0
  133. package/dist/plugins/benchmarks/templates/skills/layer1-validation-template.yaml.enc +6 -0
  134. package/dist/plugins/benchmarks/templates/skills/project-evolve-analyzer-template.yaml.enc +6 -0
  135. package/dist/plugins/benchmarks/templates/skills/project-evolve-fixer-template.yaml.enc +6 -0
  136. package/dist/plugins/benchmarks/templates/skills/project-evolve-generator-template.yaml.enc +6 -0
  137. package/dist/plugins/benchmarks/templates/skills/project-evolve-learner-template.yaml.enc +6 -0
  138. package/dist/plugins/benchmarks/templates/skills/project-evolve-reviewer-template.yaml.enc +6 -0
  139. package/dist/plugins/benchmarks/templates/skills/project-evolve-scanner-template.yaml.enc +6 -0
  140. package/dist/plugins/benchmarks/templates/skills/project-evolve-template.yaml.enc +6 -0
  141. package/dist/plugins/benchmarks/templates/skills/project-evolve-verifier-template.yaml.enc +6 -0
  142. package/dist/plugins/benchmarks/templates/skills/requirement-analyzer-template.yaml.enc +6 -0
  143. package/dist/plugins/benchmarks/templates/skills/skill-forge-template.yaml.enc +6 -0
  144. package/dist/plugins/benchmarks/templates/skills/startup-guard-template.yaml.enc +6 -0
  145. package/dist/plugins/benchmarks/templates/skills/testing-stage-template.yaml.enc +6 -0
  146. package/dist/plugins/commands/README.md.enc +6 -0
  147. package/dist/plugins/commands/automation.md.enc +6 -0
  148. package/dist/plugins/commands/code.md.enc +6 -0
  149. package/dist/plugins/commands/contribute.md.enc +6 -0
  150. package/dist/plugins/commands/dashboard.md.enc +6 -0
  151. package/dist/plugins/commands/env.md.enc +6 -0
  152. package/dist/plugins/commands/explore.md.enc +6 -0
  153. package/dist/plugins/commands/field-evolve.md.enc +6 -0
  154. package/dist/plugins/commands/global.md.enc +6 -0
  155. package/dist/plugins/commands/init.md.enc +6 -0
  156. package/dist/plugins/commands/list.md.enc +6 -0
  157. package/dist/plugins/commands/memory.md.enc +6 -0
  158. package/dist/plugins/commands/monitor.md.enc +6 -0
  159. package/dist/plugins/commands/org.md.enc +6 -0
  160. package/dist/plugins/commands/persist.md.enc +6 -0
  161. package/dist/plugins/commands/plan.md.enc +6 -0
  162. package/dist/plugins/commands/plugin.md.enc +6 -0
  163. package/dist/plugins/commands/project-evolve.md.enc +6 -0
  164. package/dist/plugins/commands/review.md.enc +6 -0
  165. package/dist/plugins/commands/run.md.enc +6 -0
  166. package/dist/plugins/commands/status.md.enc +6 -0
  167. package/dist/plugins/commands/sync.md.enc +6 -0
  168. package/dist/plugins/commands/update.md.enc +6 -0
  169. package/dist/plugins/env-capabilities/env-core/plugin.json +33 -0
  170. package/dist/plugins/hooks/README.md.enc +6 -0
  171. package/dist/plugins/hooks/artifact-evaluation-hook.js +2 -0
  172. package/dist/plugins/hooks/cognitive-dreamer.js +2 -0
  173. package/dist/plugins/hooks/cognitive-sync.js +2 -0
  174. package/dist/plugins/hooks/cognitive-tracker.js +2 -0
  175. package/dist/plugins/hooks/config/detection-patterns.yaml.enc +6 -0
  176. package/dist/plugins/hooks/constitution-guard.js +2 -0
  177. package/dist/plugins/hooks/do-review-separation-guard.js +2 -0
  178. package/dist/plugins/hooks/environment-autocommit.js +2 -0
  179. package/dist/plugins/hooks/environment-doctor.js +1 -0
  180. package/dist/plugins/hooks/environment-startup-scan.js +2 -0
  181. package/dist/plugins/hooks/execution-tracker.js +2 -0
  182. package/dist/plugins/hooks/frozen-zone-guard.js +2 -0
  183. package/dist/plugins/hooks/layer1-validator.js +2 -0
  184. package/dist/plugins/hooks/lib/artifact-evaluator.js +1 -0
  185. package/dist/plugins/hooks/lib/assets/asset-decision-store.js +1 -0
  186. package/dist/plugins/hooks/lib/assets/asset-graph.js +1 -0
  187. package/dist/plugins/hooks/lib/assets/asset-hydrator.js +1 -0
  188. package/dist/plugins/hooks/lib/assets/asset-outcome-store.js +1 -0
  189. package/dist/plugins/hooks/lib/assets/asset-projection-compiler.js +1 -0
  190. package/dist/plugins/hooks/lib/assets/asset-registry.js +1 -0
  191. package/dist/plugins/hooks/lib/assets/asset-selector.js +1 -0
  192. package/dist/plugins/hooks/lib/assets/index.js +1 -0
  193. package/dist/plugins/hooks/lib/assets/paths.js +1 -0
  194. package/dist/plugins/hooks/lib/assets/projection-targets/claude-code.js +1 -0
  195. package/dist/plugins/hooks/lib/assets/projection-targets/codex.js +1 -0
  196. package/dist/plugins/hooks/lib/auto-fix-loop.js +1 -0
  197. package/dist/plugins/hooks/lib/benchmarks/change-detector.js +1 -0
  198. package/dist/plugins/hooks/lib/benchmarks/evaluator.js +1 -0
  199. package/dist/plugins/hooks/lib/benchmarks/integration-example.js +1 -0
  200. package/dist/plugins/hooks/lib/cognitive/adaptive-matcher.js +1 -0
  201. package/dist/plugins/hooks/lib/cognitive/base-store.js +1 -0
  202. package/dist/plugins/hooks/lib/cognitive/causal-engine.js +1 -0
  203. package/dist/plugins/hooks/lib/cognitive/cognitive-config.js +1 -0
  204. package/dist/plugins/hooks/lib/cognitive/cognitive-fingerprint.js +1 -0
  205. package/dist/plugins/hooks/lib/cognitive/collective-sync.js +1 -0
  206. package/dist/plugins/hooks/lib/cognitive/confidence-engine.js +1 -0
  207. package/dist/plugins/hooks/lib/cognitive/dream-engine.js +1 -0
  208. package/dist/plugins/hooks/lib/cognitive/episodic-store.js +1 -0
  209. package/dist/plugins/hooks/lib/cognitive/index.js +1 -0
  210. package/dist/plugins/hooks/lib/cognitive/kernel.js +1 -0
  211. package/dist/plugins/hooks/lib/cognitive/knowledge-distiller.js +1 -0
  212. package/dist/plugins/hooks/lib/cognitive/memory-transport.js +1 -0
  213. package/dist/plugins/hooks/lib/cognitive/persistence-manager.js +1 -0
  214. package/dist/plugins/hooks/lib/cognitive/priority-store.js +1 -0
  215. package/dist/plugins/hooks/lib/cognitive/procedural-store.js +1 -0
  216. package/dist/plugins/hooks/lib/cognitive/semantic-store.js +1 -0
  217. package/dist/plugins/hooks/lib/cognitive/skill-forge-candidate-loader.js +1 -0
  218. package/dist/plugins/hooks/lib/cognitive/skill-forge-draft.js +1 -0
  219. package/dist/plugins/hooks/lib/cognitive/skill-forge-proposal.js +1 -0
  220. package/dist/plugins/hooks/lib/cognitive/skill-forge-queue.js +1 -0
  221. package/dist/plugins/hooks/lib/cognitive/skill-tuner.js +1 -0
  222. package/dist/plugins/hooks/lib/cognitive/wiki-materializer.js +1 -0
  223. package/dist/plugins/hooks/lib/detection-pattern-loader.js +1 -0
  224. package/dist/plugins/hooks/lib/directory-discovery.js +1 -0
  225. package/dist/plugins/hooks/lib/environment-capability-package.js +1 -0
  226. package/dist/plugins/hooks/lib/environment-capability-probe.js +1 -0
  227. package/dist/plugins/hooks/lib/environment-config-loader.js +1 -0
  228. package/dist/plugins/hooks/lib/environment-executor.js +1 -0
  229. package/dist/plugins/hooks/lib/environment-feedback.js +1 -0
  230. package/dist/plugins/hooks/lib/environment-health-monitor.js +1 -0
  231. package/dist/plugins/hooks/lib/environment-knowledge-synthesizer.js +1 -0
  232. package/dist/plugins/hooks/lib/environment-knowledge-validator.js +1 -0
  233. package/dist/plugins/hooks/lib/environment-learning-discoverer.js +1 -0
  234. package/dist/plugins/hooks/lib/environment-learning-engine.js +1 -0
  235. package/dist/plugins/hooks/lib/environment-module-repository.js +1 -0
  236. package/dist/plugins/hooks/lib/environment-planner.js +1 -0
  237. package/dist/plugins/hooks/lib/environment-plugin-registry.js +1 -0
  238. package/dist/plugins/hooks/lib/environment-readiness.js +1 -0
  239. package/dist/plugins/hooks/lib/environment-route-ranking.js +1 -0
  240. package/dist/plugins/hooks/lib/environment-strategy-overlay.js +1 -0
  241. package/dist/plugins/hooks/lib/execution-path.js +1 -0
  242. package/dist/plugins/hooks/lib/external-mount-adapter.js +1 -0
  243. package/dist/plugins/hooks/lib/external-scanner.js +1 -0
  244. package/dist/plugins/hooks/lib/hook-error-recorder.js +1 -0
  245. package/dist/plugins/hooks/lib/hook-logger.js +1 -0
  246. package/dist/plugins/hooks/lib/hook-runner.js +2 -0
  247. package/dist/plugins/hooks/lib/hook-state-manager.js +1 -0
  248. package/dist/plugins/hooks/lib/memory-extractor.js +1 -0
  249. package/dist/plugins/hooks/lib/memory-manager.js +1 -0
  250. package/dist/plugins/hooks/lib/metrics-analyzer.js +1 -0
  251. package/dist/plugins/hooks/lib/mount-manager.js +1 -0
  252. package/dist/plugins/hooks/lib/plugin-activation-registry.js +1 -0
  253. package/dist/plugins/hooks/lib/plugin-selector.js +1 -0
  254. package/dist/plugins/hooks/lib/plugin-source-registry.js +1 -0
  255. package/dist/plugins/hooks/lib/plugin-workspace-registry.js +1 -0
  256. package/dist/plugins/hooks/lib/project-evolution/auto-fixer.js +1 -0
  257. package/dist/plugins/hooks/lib/project-evolution/memory-manager.js +1 -0
  258. package/dist/plugins/hooks/lib/project-evolution/pattern-detector.js +1 -0
  259. package/dist/plugins/hooks/lib/project-evolution/semantic-indexer.js +1 -0
  260. package/dist/plugins/hooks/lib/rollback-tracker.js +1 -0
  261. package/dist/plugins/hooks/lib/source-code-scanner.js +1 -0
  262. package/dist/plugins/hooks/lib/technology-stack-detector.js +1 -0
  263. package/dist/plugins/hooks/lib/test-failure-analyzer.js +1 -0
  264. package/dist/plugins/hooks/lib/test-failure-fixer.js +1 -0
  265. package/dist/plugins/hooks/lib/trace-context.js +1 -0
  266. package/dist/plugins/hooks/lib/validation-patterns.js +1 -0
  267. package/dist/plugins/hooks/memory-sync.js +1 -0
  268. package/dist/plugins/hooks/pipeline-observer.js +2 -0
  269. package/dist/plugins/hooks/retry-limit-guard.js +2 -0
  270. package/dist/plugins/hooks/scope-sentinel.js +2 -0
  271. package/dist/plugins/hooks/secret-scanner.js +2 -0
  272. package/dist/plugins/hooks/stop-evolve-prompt.js +1 -0
  273. package/dist/plugins/hooks/trace-initialization.js +2 -0
  274. package/dist/plugins/hooks/version-checker.js +2 -0
  275. package/dist/plugins/memory/templates/code-quality.yaml.enc +6 -0
  276. package/dist/plugins/memory/templates/multi-system.yaml.enc +6 -0
  277. package/dist/plugins/memory/templates/team-habits.yaml.enc +6 -0
  278. package/dist/plugins/memory/templates/testing.yaml.enc +6 -0
  279. package/dist/plugins/skills/README.md.enc +6 -0
  280. package/dist/plugins/skills/ab-test-executor/SKILL.md.enc +6 -0
  281. package/dist/plugins/skills/benchmark-executor/SKILL.md.enc +6 -0
  282. package/dist/plugins/skills/benchmark-generator/SKILL.md.enc +6 -0
  283. package/dist/plugins/skills/content-prompts/SKILL.md.enc +6 -0
  284. package/dist/plugins/skills/delivery-stage/SKILL.md.enc +6 -0
  285. package/dist/plugins/skills/design-stage/SKILL.md.enc +6 -0
  286. package/dist/plugins/skills/environment-learning/SKILL.md.enc +6 -0
  287. package/dist/plugins/skills/environment-resilience/build-failure-doctor.md.enc +6 -0
  288. package/dist/plugins/skills/environment-resilience/environment-repair.md.enc +6 -0
  289. package/dist/plugins/skills/environment-resilience/pre-flight-check.md.enc +6 -0
  290. package/dist/plugins/skills/experiment-evaluator/SKILL.md.enc +6 -0
  291. package/dist/plugins/skills/exploration-phase/SKILL.md.enc +6 -0
  292. package/dist/plugins/skills/field-evolve-analyzer/SKILL.md.enc +6 -0
  293. package/dist/plugins/skills/field-evolve-distiller/SKILL.md.enc +6 -0
  294. package/dist/plugins/skills/field-evolve-executor/SKILL.md.enc +6 -0
  295. package/dist/plugins/skills/field-evolve-executor/executor.js +2 -0
  296. package/dist/plugins/skills/field-evolve-fixer/SKILL.md.enc +6 -0
  297. package/dist/plugins/skills/field-evolve-learner/SKILL.md.enc +6 -0
  298. package/dist/plugins/skills/field-evolve-scanner/SKILL.md.enc +6 -0
  299. package/dist/plugins/skills/field-evolve-scanner/scripts/fallback-scanner.js +2 -0
  300. package/dist/plugins/skills/field-evolve-verifier/SKILL.md.enc +6 -0
  301. package/dist/plugins/skills/heartbeat-monitor/SKILL.md.enc +6 -0
  302. package/dist/plugins/skills/implementation-stage/SKILL.md.enc +6 -0
  303. package/dist/plugins/skills/layer1-validation/SKILL.md.enc +6 -0
  304. package/dist/plugins/skills/multi-role-orchestration/SKILL.md.enc +6 -0
  305. package/dist/plugins/skills/ops-content-marketing/SKILL.md.enc +6 -0
  306. package/dist/plugins/skills/ops-conversion/SKILL.md.enc +6 -0
  307. package/dist/plugins/skills/ops-data-driven/SKILL.md.enc +6 -0
  308. package/dist/plugins/skills/ops-growth-strategies/SKILL.md.enc +6 -0
  309. package/dist/plugins/skills/ops-private-domain/SKILL.md.enc +6 -0
  310. package/dist/plugins/skills/ops-social-commerce/SKILL.md.enc +6 -0
  311. package/dist/plugins/skills/ops-user-growth/SKILL.md.enc +6 -0
  312. package/dist/plugins/skills/pending-dashboard/SKILL.md.enc +6 -0
  313. package/dist/plugins/skills/project-evolve-analyzer/SKILL.md.enc +6 -0
  314. package/dist/plugins/skills/project-evolve-fixer/SKILL.md.enc +6 -0
  315. package/dist/plugins/skills/project-evolve-generator/SKILL.md.enc +6 -0
  316. package/dist/plugins/skills/project-evolve-learner/SKILL.md.enc +6 -0
  317. package/dist/plugins/skills/project-evolve-reviewer/SKILL.md.enc +6 -0
  318. package/dist/plugins/skills/project-evolve-scanner/SKILL.md.enc +6 -0
  319. package/dist/plugins/skills/project-evolve-scanner/scripts/dependency-reuse-checker.js +2 -0
  320. package/dist/plugins/skills/project-evolve-scanner/scripts/subsystem-coverage.js +2 -0
  321. package/dist/plugins/skills/project-evolve-verifier/SKILL.md.enc +6 -0
  322. package/dist/plugins/skills/requirement-stage/SKILL.md.enc +6 -0
  323. package/dist/plugins/skills/secret-scanner/SKILL.md.enc +6 -0
  324. package/dist/plugins/skills/skill-forge/SKILL.md.enc +6 -0
  325. package/dist/plugins/skills/skill-forge/references/description-guide.md.enc +6 -0
  326. package/dist/plugins/skills/skill-forge/references/quality-rubric.md.enc +6 -0
  327. package/dist/plugins/skills/skill-forge/references/skill-template.md.enc +6 -0
  328. package/dist/plugins/skills/startup-guard/SKILL.md.enc +6 -0
  329. package/dist/plugins/skills/tdd-workflow/SKILL.md.enc +6 -0
  330. package/dist/plugins/skills/testing-stage/SKILL.md.enc +6 -0
  331. package/dist/plugins/skills/tracking-validator/SKILL.md.enc +6 -0
  332. package/dist/scripts/build-crypto.js +2 -0
  333. package/dist/scripts/cli/assets.js +1 -0
  334. package/dist/scripts/cli/contribute.js +1 -0
  335. package/dist/scripts/cli/dashboard.js +1 -0
  336. package/dist/scripts/cli/env.js +1 -0
  337. package/dist/scripts/cli/global-init.js +1 -0
  338. package/dist/scripts/cli/global.js +1 -0
  339. package/dist/scripts/cli/index.js +1 -0
  340. package/dist/scripts/cli/init.js +1 -0
  341. package/dist/scripts/cli/list.js +1 -0
  342. package/dist/scripts/cli/memory.js +1 -0
  343. package/dist/scripts/cli/org.js +1 -0
  344. package/dist/scripts/cli/plugin.js +1 -0
  345. package/dist/scripts/cli/practice-report.js +1 -0
  346. package/dist/scripts/cli/runtime-governance.js +1 -0
  347. package/dist/scripts/cli/system.js +1 -0
  348. package/dist/scripts/cli/update.js +1 -0
  349. package/dist/scripts/commands/catalog.js +1 -0
  350. package/dist/scripts/commands/slash-command-docs.js +1 -0
  351. package/dist/scripts/config/external-mounts.config.js +2 -0
  352. package/dist/scripts/heartbeat/check.js +2 -0
  353. package/dist/scripts/heartbeat/setup-cron.js +2 -0
  354. package/dist/scripts/install/adapters.js +1 -0
  355. package/dist/scripts/install/constants.js +1 -0
  356. package/dist/scripts/install/file-reader.js +1 -0
  357. package/dist/scripts/install/index.js +1 -0
  358. package/dist/scripts/install/shards/constants-shard.js +1 -0
  359. package/dist/scripts/install/shards/crypto-config-shard.js +1 -0
  360. package/dist/scripts/install/shards/error-messages-shard.js +1 -0
  361. package/dist/scripts/install/shards/reassemble.js +1 -0
  362. package/dist/scripts/install/shards/utils-shard.js +1 -0
  363. package/dist/scripts/install/shards/version-info-shard.js +1 -0
  364. package/dist/scripts/postinstall.js +1 -0
  365. package/dist/scripts/state.js +1 -0
  366. package/package.json +22 -21
  367. package/README.en.md +0 -598
  368. package/bin/autospec.js +0 -3
  369. package/knowledge/01-principles/00-principles-hierarchy.md +0 -247
  370. package/knowledge/01-principles/01-first-principles.md +0 -241
  371. package/knowledge/01-principles/02-strategic-principles.md +0 -286
  372. package/knowledge/01-principles/03-tactical-principles.md +0 -385
  373. package/knowledge/01-principles/04-operational-principles.md +0 -275
  374. package/knowledge/01-principles/05-domain-principles.md +0 -539
  375. package/knowledge/01-principles/06-methodology-principles.md +0 -281
  376. package/knowledge/01-principles/07-cognitive-principles.md +0 -277
  377. package/knowledge/01-principles/08-auto-fix-principles.md +0 -320
  378. package/knowledge/01-principles/09-constitution.md +0 -220
  379. package/knowledge/01-principles/10-evolution-mechanism.md +0 -699
  380. package/knowledge/01-principles/README.en.md +0 -385
  381. package/knowledge/01-principles/README.md +0 -385
  382. package/knowledge/02-process/00-overview.md +0 -404
  383. package/knowledge/02-process/01-requirement.md +0 -113
  384. package/knowledge/02-process/02-design.md +0 -123
  385. package/knowledge/02-process/03-implementation.md +0 -90
  386. package/knowledge/02-process/04-review.md +0 -80
  387. package/knowledge/02-process/05-testing.md +0 -90
  388. package/knowledge/02-process/06-delivery.md +0 -88
  389. package/knowledge/02-process/README.en.md +0 -143
  390. package/knowledge/02-process/README.md +0 -186
  391. package/knowledge/03-guides/00-pipeline-protocol.md +0 -438
  392. package/knowledge/03-guides/01-team-orchestrator.md +0 -368
  393. package/knowledge/03-guides/02-analyze-requirement.md +0 -195
  394. package/knowledge/03-guides/03-design-solution.md +0 -401
  395. package/knowledge/03-guides/04-implement-code.md +0 -205
  396. package/knowledge/03-guides/05-plan-testing.md +0 -183
  397. package/knowledge/03-guides/06-generate-tests.md +0 -241
  398. package/knowledge/03-guides/07-check-release.md +0 -205
  399. package/knowledge/03-guides/08-evaluate-ai-effect.md +0 -100
  400. package/knowledge/03-guides/09-review-requirement.md +0 -83
  401. package/knowledge/03-guides/10-review-design.md +0 -83
  402. package/knowledge/03-guides/11-review-code.md +0 -111
  403. package/knowledge/03-guides/12-review-testing.md +0 -76
  404. package/knowledge/03-guides/13-audit-security.md +0 -89
  405. package/knowledge/03-guides/14-check-consistency.md +0 -177
  406. package/knowledge/03-guides/15-run-unit-tests.md +0 -83
  407. package/knowledge/03-guides/16-run-integration-tests.md +0 -105
  408. package/knowledge/03-guides/17-analyze-test-context.md +0 -250
  409. package/knowledge/03-guides/18-log-practice.md +0 -359
  410. package/knowledge/03-guides/19-distill-skill.md +0 -91
  411. package/knowledge/03-guides/20-update-skill.md +0 -45
  412. package/knowledge/03-guides/21-validate-skill.md +0 -72
  413. package/knowledge/03-guides/22-extract-methodology.md +0 -55
  414. package/knowledge/03-guides/23-infer-scope.md +0 -174
  415. package/knowledge/03-guides/24-assess-complexity.md +0 -270
  416. package/knowledge/03-guides/25-discover-component.md +0 -183
  417. package/knowledge/03-guides/26-analyze-tech-stack.md +0 -139
  418. package/knowledge/03-guides/27-scan-environment.md +0 -207
  419. package/knowledge/03-guides/28-validate-environment.md +0 -207
  420. package/knowledge/03-guides/29-generate-knowledge.md +0 -234
  421. package/knowledge/03-guides/30-analyze-ai-capability.md +0 -193
  422. package/knowledge/03-guides/31-analyze-ai-component.md +0 -169
  423. package/knowledge/03-guides/32-analyze-ai-agent.md +0 -362
  424. package/knowledge/03-guides/33-analyze-ai-rag.md +0 -339
  425. package/knowledge/03-guides/34-assess-ai-task.md +0 -418
  426. package/knowledge/03-guides/35-evaluate-ai-pipeline.md +0 -219
  427. package/knowledge/03-guides/36-evaluate-ai-artifact.md +0 -192
  428. package/knowledge/03-guides/37-plan-ai-evaluation.md +0 -374
  429. package/knowledge/03-guides/38-evaluate-ai-path.md +0 -274
  430. package/knowledge/03-guides/39-validate-ai-data.md +0 -276
  431. package/knowledge/03-guides/40-detect-ai-anomaly.md +0 -213
  432. package/knowledge/03-guides/41-diagnose-ai-test.md +0 -133
  433. package/knowledge/03-guides/42-apply-ddd.md +0 -345
  434. package/knowledge/03-guides/43-run-ai-sdlc.md +0 -475
  435. package/knowledge/03-guides/44-manage-knowledge.md +0 -369
  436. package/knowledge/03-guides/45-test-runner.md +0 -254
  437. package/knowledge/03-guides/README.en.md +0 -212
  438. package/knowledge/03-guides/README.md +0 -212
  439. package/knowledge/04-checklists/00-requirement.md +0 -169
  440. package/knowledge/04-checklists/01-design.md +0 -196
  441. package/knowledge/04-checklists/02-code.md +0 -197
  442. package/knowledge/04-checklists/03-test.md +0 -46
  443. package/knowledge/04-checklists/04-release.md +0 -70
  444. package/knowledge/04-checklists/README.en.md +0 -119
  445. package/knowledge/04-checklists/README.md +0 -123
  446. package/knowledge/05-config/00-validation-patterns.yaml +0 -137
  447. package/knowledge/05-config/01-team-stage.yaml +0 -95
  448. package/knowledge/05-config/02-team-tasks.yaml +0 -139
  449. package/knowledge/05-config/03-role-composition.yaml +0 -346
  450. package/knowledge/05-config/04-role-extensions.yaml +0 -140
  451. package/knowledge/05-config/05-skill-compositions.yaml +0 -142
  452. package/knowledge/05-config/README.en.md +0 -54
  453. package/knowledge/05-config/README.md +0 -132
  454. package/knowledge/06-environment/00-template-registry.md +0 -310
  455. package/knowledge/06-environment/01-detection-patterns.yaml +0 -1692
  456. package/knowledge/06-environment/README.en.md +0 -40
  457. package/knowledge/06-environment/README.md +0 -128
  458. package/knowledge/07-standards/00-coding-style.md +0 -1059
  459. package/knowledge/07-standards/01-code-review.md +0 -876
  460. package/knowledge/07-standards/02-data-consistency.md +0 -1085
  461. package/knowledge/07-standards/03-document-versioning.md +0 -210
  462. package/knowledge/07-standards/04-risk-detection.md +0 -186
  463. package/knowledge/07-standards/README.en.md +0 -119
  464. package/knowledge/07-standards/README.md +0 -123
  465. package/knowledge/08-organization/00-vision-mission.md +0 -113
  466. package/knowledge/08-organization/01-ai-native-culture.md +0 -318
  467. package/knowledge/08-organization/02-team-metrics.md +0 -228
  468. package/knowledge/08-organization/03-committee-structure.md +0 -54
  469. package/knowledge/08-organization/04-governance-metrics.md +0 -55
  470. package/knowledge/08-organization/05-improvement-process.md +0 -71
  471. package/knowledge/08-organization/README.en.md +0 -165
  472. package/knowledge/08-organization/README.md +0 -165
  473. package/knowledge/09-templates/00-requirement-proposal.md +0 -344
  474. package/knowledge/09-templates/01-architecture-design.md +0 -494
  475. package/knowledge/09-templates/02-api-design.md +0 -408
  476. package/knowledge/09-templates/03-database-design.md +0 -313
  477. package/knowledge/09-templates/04-product-design.md +0 -237
  478. package/knowledge/09-templates/05-domain-business.md +0 -388
  479. package/knowledge/09-templates/06-test-design.md +0 -268
  480. package/knowledge/09-templates/07-evaluation-design.md +0 -372
  481. package/knowledge/09-templates/08-component-knowledge.md +0 -272
  482. package/knowledge/09-templates/09-best-practices.md +0 -218
  483. package/knowledge/09-templates/10-middleware-knowledge.md +0 -342
  484. package/knowledge/09-templates/README.en.md +0 -222
  485. package/knowledge/09-templates/README.md +0 -216
  486. package/knowledge/README.en.md +0 -372
  487. package/knowledge/README.md +0 -399
  488. package/plugins/agents/roles/ai-engineer.md +0 -129
  489. package/plugins/agents/roles/backend-engineer.md +0 -165
  490. package/plugins/agents/roles/ceo.md +0 -94
  491. package/plugins/agents/roles/data-engineer.md +0 -135
  492. package/plugins/agents/roles/devops-engineer.md +0 -181
  493. package/plugins/agents/roles/frontend-engineer.md +0 -129
  494. package/plugins/agents/roles/product-owner.md +0 -98
  495. package/plugins/agents/roles/quality-engineer.md +0 -129
  496. package/plugins/agents/roles/security-engineer.md +0 -180
  497. package/plugins/agents/roles/tech-lead.md +0 -97
  498. package/plugins/agents/support/blind-comparator.md +0 -88
  499. package/plugins/agents/support/consistency-checker.md +0 -136
  500. package/plugins/agents/support/failure-diagnostician.md +0 -141
  501. package/plugins/agents/support/independent-reviewer.md +0 -80
  502. package/plugins/agents/support/monitoring-agent.md +0 -215
  503. package/plugins/agents/support/safety-auditor.md +0 -121
  504. package/plugins/agents/support/skill-benchmarker.md +0 -86
  505. package/plugins/agents/support/skill-forger.md +0 -105
  506. package/plugins/agents/support/stage-gate-evaluator.md +0 -205
  507. package/plugins/agents/support/test-coverage-reviewer.md +0 -73
  508. package/plugins/benchmarks/templates/README.md +0 -196
  509. package/plugins/benchmarks/templates/commands/apply-template.yaml +0 -108
  510. package/plugins/benchmarks/templates/commands/archive-template.yaml +0 -65
  511. package/plugins/benchmarks/templates/commands/env-export-template.yaml +0 -64
  512. package/plugins/benchmarks/templates/commands/env-sync-template.yaml +0 -104
  513. package/plugins/benchmarks/templates/commands/env-template-template.yaml +0 -96
  514. package/plugins/benchmarks/templates/commands/env-template.yaml +0 -58
  515. package/plugins/benchmarks/templates/commands/env-update-template.yaml +0 -110
  516. package/plugins/benchmarks/templates/commands/env-validate-template.yaml +0 -95
  517. package/plugins/benchmarks/templates/commands/explore-template.yaml +0 -48
  518. package/plugins/benchmarks/templates/commands/field-evolve-template.yaml +0 -104
  519. package/plugins/benchmarks/templates/commands/project-evolve-template.yaml +0 -104
  520. package/plugins/benchmarks/templates/commands/propose-template.yaml +0 -88
  521. package/plugins/benchmarks/templates/commands/review-template.yaml +0 -124
  522. package/plugins/benchmarks/templates/commands/run-template.yaml +0 -127
  523. package/plugins/benchmarks/templates/commands/test-template.yaml +0 -149
  524. package/plugins/benchmarks/templates/pipeline/agile-template.yaml +0 -84
  525. package/plugins/benchmarks/templates/pipeline/experiment-template.yaml +0 -92
  526. package/plugins/benchmarks/templates/pipeline/hotfix-template.yaml +0 -81
  527. package/plugins/benchmarks/templates/pipeline/waterfall-template.yaml +0 -106
  528. package/plugins/benchmarks/templates/skills/agile-iteration-template.yaml +0 -78
  529. package/plugins/benchmarks/templates/skills/benchmark-executor-template.yaml +0 -114
  530. package/plugins/benchmarks/templates/skills/benchmark-generator-template.yaml +0 -52
  531. package/plugins/benchmarks/templates/skills/delivery-stage-template.yaml +0 -130
  532. package/plugins/benchmarks/templates/skills/design-stage-template.yaml +0 -131
  533. package/plugins/benchmarks/templates/skills/experiment-iteration-template.yaml +0 -60
  534. package/plugins/benchmarks/templates/skills/exploration-phase-template.yaml +0 -114
  535. package/plugins/benchmarks/templates/skills/field-evolve-analyzer-template.yaml +0 -51
  536. package/plugins/benchmarks/templates/skills/field-evolve-distiller-template.yaml +0 -34
  537. package/plugins/benchmarks/templates/skills/field-evolve-executor-template.yaml +0 -50
  538. package/plugins/benchmarks/templates/skills/field-evolve-fixer-template.yaml +0 -52
  539. package/plugins/benchmarks/templates/skills/field-evolve-learner-template.yaml +0 -33
  540. package/plugins/benchmarks/templates/skills/field-evolve-scanner-template.yaml +0 -74
  541. package/plugins/benchmarks/templates/skills/field-evolve-template.yaml +0 -71
  542. package/plugins/benchmarks/templates/skills/field-evolve-verifier-template.yaml +0 -51
  543. package/plugins/benchmarks/templates/skills/hotfix-iteration-template.yaml +0 -54
  544. package/plugins/benchmarks/templates/skills/implementation-stage-template.yaml +0 -127
  545. package/plugins/benchmarks/templates/skills/layer1-validation-template.yaml +0 -121
  546. package/plugins/benchmarks/templates/skills/project-evolve-analyzer-template.yaml +0 -51
  547. package/plugins/benchmarks/templates/skills/project-evolve-fixer-template.yaml +0 -52
  548. package/plugins/benchmarks/templates/skills/project-evolve-generator-template.yaml +0 -34
  549. package/plugins/benchmarks/templates/skills/project-evolve-learner-template.yaml +0 -50
  550. package/plugins/benchmarks/templates/skills/project-evolve-reviewer-template.yaml +0 -50
  551. package/plugins/benchmarks/templates/skills/project-evolve-scanner-template.yaml +0 -75
  552. package/plugins/benchmarks/templates/skills/project-evolve-template.yaml +0 -72
  553. package/plugins/benchmarks/templates/skills/project-evolve-verifier-template.yaml +0 -51
  554. package/plugins/benchmarks/templates/skills/requirement-analyzer-template.yaml +0 -48
  555. package/plugins/benchmarks/templates/skills/skill-forge-template.yaml +0 -117
  556. package/plugins/benchmarks/templates/skills/startup-guard-template.yaml +0 -103
  557. package/plugins/benchmarks/templates/skills/testing-stage-template.yaml +0 -146
  558. package/plugins/benchmarks/templates/skills/waterfall-iteration-template.yaml +0 -55
  559. package/plugins/commands/README.en.md +0 -96
  560. package/plugins/commands/README.md +0 -96
  561. package/plugins/commands/apply.md +0 -277
  562. package/plugins/commands/archive.md +0 -132
  563. package/plugins/commands/env-export.md +0 -79
  564. package/plugins/commands/env-sync.md +0 -1281
  565. package/plugins/commands/env-template.md +0 -99
  566. package/plugins/commands/env-update.md +0 -264
  567. package/plugins/commands/env-validate.md +0 -176
  568. package/plugins/commands/env.md +0 -79
  569. package/plugins/commands/explore.md +0 -193
  570. package/plugins/commands/field-evolve.md +0 -412
  571. package/plugins/commands/memory.md +0 -249
  572. package/plugins/commands/project-evolve.md +0 -920
  573. package/plugins/commands/propose.md +0 -184
  574. package/plugins/commands/review.md +0 -140
  575. package/plugins/commands/run.md +0 -1052
  576. package/plugins/commands/status.md +0 -183
  577. package/plugins/commands/test.md +0 -389
  578. package/plugins/hooks/README.en.md +0 -56
  579. package/plugins/hooks/README.md +0 -56
  580. package/plugins/hooks/ai-project-guard.js +0 -329
  581. package/plugins/hooks/artifact-evaluation-hook.js +0 -237
  582. package/plugins/hooks/constitution-guard.js +0 -211
  583. package/plugins/hooks/environment-autocommit.js +0 -606
  584. package/plugins/hooks/environment-manager.js +0 -779
  585. package/plugins/hooks/execution-tracker.js +0 -459
  586. package/plugins/hooks/frozen-zone-guard.js +0 -140
  587. package/plugins/hooks/layer1-validator.js +0 -539
  588. package/plugins/hooks/lib/artifact-evaluator.js +0 -414
  589. package/plugins/hooks/lib/auto-fix-loop.js +0 -605
  590. package/plugins/hooks/lib/benchmarks/change-detector.js +0 -390
  591. package/plugins/hooks/lib/benchmarks/evaluator.js +0 -605
  592. package/plugins/hooks/lib/benchmarks/integration-example.js +0 -169
  593. package/plugins/hooks/lib/data-and-ai-detector.js +0 -275
  594. package/plugins/hooks/lib/detection-pattern-loader.js +0 -865
  595. package/plugins/hooks/lib/directory-discovery.js +0 -395
  596. package/plugins/hooks/lib/environment-config-loader.js +0 -345
  597. package/plugins/hooks/lib/environment-detector.js +0 -553
  598. package/plugins/hooks/lib/environment-evolver.js +0 -564
  599. package/plugins/hooks/lib/environment-registry.js +0 -813
  600. package/plugins/hooks/lib/execution-path.js +0 -427
  601. package/plugins/hooks/lib/hook-error-recorder.js +0 -245
  602. package/plugins/hooks/lib/hook-logger.js +0 -538
  603. package/plugins/hooks/lib/hook-runner.js +0 -97
  604. package/plugins/hooks/lib/hook-state-manager.js +0 -578
  605. package/plugins/hooks/lib/memory-extractor.js +0 -399
  606. package/plugins/hooks/lib/memory-manager.js +0 -673
  607. package/plugins/hooks/lib/metrics-analyzer.js +0 -489
  608. package/plugins/hooks/lib/project-evolution/auto-fixer.js +0 -511
  609. package/plugins/hooks/lib/project-evolution/memory-manager.js +0 -346
  610. package/plugins/hooks/lib/project-evolution/pattern-detector.js +0 -476
  611. package/plugins/hooks/lib/project-evolution/semantic-indexer.js +0 -480
  612. package/plugins/hooks/lib/project-structure-detector.js +0 -326
  613. package/plugins/hooks/lib/rollback-tracker.js +0 -346
  614. package/plugins/hooks/lib/source-code-scanner.js +0 -596
  615. package/plugins/hooks/lib/technology-stack-detector.js +0 -374
  616. package/plugins/hooks/lib/test-auto-fix.test.js +0 -194
  617. package/plugins/hooks/lib/test-failure-analyzer.js +0 -375
  618. package/plugins/hooks/lib/test-failure-fixer.js +0 -268
  619. package/plugins/hooks/lib/trace-context.js +0 -277
  620. package/plugins/hooks/lib/validation-patterns.js +0 -415
  621. package/plugins/hooks/memory-sync.js +0 -171
  622. package/plugins/hooks/monitoring-trigger.js +0 -467
  623. package/plugins/hooks/pipeline-observer.js +0 -413
  624. package/plugins/hooks/scope-sentinel.js +0 -204
  625. package/plugins/hooks/trace-initialization.js +0 -169
  626. package/plugins/memory/templates/code-quality.yaml +0 -149
  627. package/plugins/memory/templates/multi-system.yaml +0 -155
  628. package/plugins/memory/templates/team-habits.yaml +0 -119
  629. package/plugins/memory/templates/testing.yaml +0 -121
  630. package/plugins/skills/README.en.md +0 -59
  631. package/plugins/skills/README.md +0 -114
  632. package/plugins/skills/agile-iteration/SKILL.md +0 -187
  633. package/plugins/skills/benchmark-executor/SKILL.md +0 -647
  634. package/plugins/skills/benchmark-generator/SKILL.md +0 -349
  635. package/plugins/skills/delivery-stage/SKILL.md +0 -324
  636. package/plugins/skills/design-stage/SKILL.md +0 -307
  637. package/plugins/skills/experiment-evaluator/SKILL.md +0 -271
  638. package/plugins/skills/experiment-iteration/SKILL.md +0 -154
  639. package/plugins/skills/exploration-phase/SKILL.md +0 -216
  640. package/plugins/skills/field-evolve-analyzer/SKILL.md +0 -65
  641. package/plugins/skills/field-evolve-distiller/SKILL.md +0 -66
  642. package/plugins/skills/field-evolve-executor/SKILL.md +0 -94
  643. package/plugins/skills/field-evolve-executor/executor.js +0 -342
  644. package/plugins/skills/field-evolve-fixer/SKILL.md +0 -69
  645. package/plugins/skills/field-evolve-learner/SKILL.md +0 -65
  646. package/plugins/skills/field-evolve-scanner/SKILL.md +0 -87
  647. package/plugins/skills/field-evolve-scanner/scripts/fallback-scanner.js +0 -288
  648. package/plugins/skills/field-evolve-verifier/SKILL.md +0 -64
  649. package/plugins/skills/hotfix-iteration/SKILL.md +0 -279
  650. package/plugins/skills/implementation-stage/SKILL.md +0 -320
  651. package/plugins/skills/layer1-validation/SKILL.md +0 -79
  652. package/plugins/skills/pending-dashboard/SKILL.md +0 -110
  653. package/plugins/skills/project-evolve-analyzer/SKILL.md +0 -95
  654. package/plugins/skills/project-evolve-fixer/SKILL.md +0 -99
  655. package/plugins/skills/project-evolve-generator/SKILL.md +0 -149
  656. package/plugins/skills/project-evolve-learner/SKILL.md +0 -103
  657. package/plugins/skills/project-evolve-reviewer/SKILL.md +0 -104
  658. package/plugins/skills/project-evolve-scanner/SKILL.md +0 -95
  659. package/plugins/skills/project-evolve-scanner/scripts/dependency-reuse-checker.js +0 -395
  660. package/plugins/skills/project-evolve-scanner/scripts/subsystem-coverage.js +0 -315
  661. package/plugins/skills/project-evolve-verifier/SKILL.md +0 -105
  662. package/plugins/skills/requirement-stage/SKILL.md +0 -217
  663. package/plugins/skills/skill-forge/SKILL.md +0 -223
  664. package/plugins/skills/skill-forge/references/description-guide.md +0 -92
  665. package/plugins/skills/skill-forge/references/quality-rubric.md +0 -104
  666. package/plugins/skills/skill-forge/references/skill-template.md +0 -106
  667. package/plugins/skills/startup-guard/SKILL.md +0 -38
  668. package/plugins/skills/testing-stage/SKILL.md +0 -770
  669. package/plugins/skills/waterfall-iteration/SKILL.md +0 -115
  670. package/scripts/cli/global-init.js +0 -288
  671. package/scripts/cli/global.js +0 -324
  672. package/scripts/cli/index.js +0 -55
  673. package/scripts/cli/init.js +0 -408
  674. package/scripts/cli/list.js +0 -70
  675. package/scripts/cli/org.js +0 -340
  676. package/scripts/cli/update.js +0 -44
  677. package/scripts/config/commands.config.js +0 -145
  678. package/scripts/config/hooks.config.js +0 -197
  679. package/scripts/install/agents.js +0 -106
  680. package/scripts/install/commands.js +0 -133
  681. package/scripts/install/constants.js +0 -463
  682. package/scripts/install/hook-logger.js +0 -536
  683. package/scripts/install/hooks.js +0 -110
  684. package/scripts/install/index.js +0 -39
  685. package/scripts/install/skills.js +0 -95
  686. package/scripts/postinstall.js +0 -25
  687. package/scripts/state.js +0 -585
  688. /package/{plugins → dist/plugins}/hooks/lib/hook-runner.sh +0 -0
@@ -1,362 +0,0 @@
1
- ---
2
- name: agent-analyzer
3
- description: 当检测到Agent框架依赖时,分析Agent的能力、工具和架构。用于理解AI智能体系统的结构。
4
- type: ai
5
- ---
6
-
7
- ## 定位
8
-
9
- AI专用技能。分析Agent的能力、可用工具、决策逻辑和协作关系。
10
-
11
- ## 输入
12
-
13
- - 必须输入:Agent代码路径或项目目录
14
- - 可选输入:框架类型(langchain/crewai/autogen等)
15
-
16
- ## 输出
17
-
18
- ```json
19
- {
20
- "framework": "langchain",
21
- "agents": [
22
- {
23
- "name": "ResearchAgent",
24
- "role": "信息收集",
25
- "description": "负责从网络和文档中收集信息",
26
- "tools": [
27
- {"name": "web_search", "description": "网络搜索"},
28
- {"name": "document_reader", "description": "文档读取"}
29
- ],
30
- "decisionLogic": "ReAct",
31
- "llmConfig": {
32
- "model": "gpt-4",
33
- "temperature": 0.7
34
- },
35
- "collaborators": ["WriterAgent"]
36
- },
37
- {
38
- "name": "WriterAgent",
39
- "role": "内容生成",
40
- "description": "负责根据收集的信息生成内容",
41
- "tools": [
42
- {"name": "write_file", "description": "写入文件"}
43
- ],
44
- "decisionLogic": "Plan-Execute",
45
- "collaborators": ["ResearchAgent"]
46
- }
47
- ],
48
- "orchestration": {
49
- "type": "sequential",
50
- "description": "Agent按顺序执行:ResearchAgent → WriterAgent"
51
- },
52
- "evaluationNeeds": {
53
- "dimensions": ["任务完成率", "响应质量", "工具使用正确性"],
54
- "suggestions": [
55
- "建议测试Agent能否正确使用工具",
56
- "建议测试多Agent协作是否正常"
57
- ]
58
- }
59
- }
60
- ```
61
-
62
- ## 执行步骤
63
-
64
- ### Step 1: 识别框架(确定性)
65
-
66
- 基于依赖和代码特征识别Agent框架:
67
-
68
- ```
69
- 框架识别规则:
70
- - langchain: 依赖langchain,代码中有 Agent, Tool, Chain
71
- - crewai: 依赖crewai,代码中有 Agent, Crew, Task
72
- - autogen: 依赖autogen,代码中有 AssistantAgent, UserProxyAgent
73
- - semantic-kernel: 依赖semantic-kernel,代码中有 Kernel, Plugin
74
- ```
75
-
76
- ### Step 2: Grep获取Agent定义(高效)
77
-
78
- 搜索Agent定义模式:
79
-
80
- ```bash
81
- # LangChain风格
82
- grep -r -n -A 10 "Agent\|create_agent\|initialize_agent" --include="*.py" .
83
-
84
- # CrewAI风格
85
- grep -r -n -A 10 "@agent\|class.*Agent\|Agent(" --include="*.py" .
86
-
87
- # AutoGen风格
88
- grep -r -n -A 10 "AssistantAgent\|UserProxyAgent" --include="*.py" .
89
- ```
90
-
91
- ### Step 3: 分析Agent能力(模型)
92
-
93
- 基于代码上下文分析Agent:
94
-
95
- ```
96
- 模型输入:
97
- {
98
- "framework": "langchain",
99
- "codeContexts": "
100
- # agent.py
101
- research_agent = Agent(
102
- role='Researcher',
103
- tools=[web_search, document_reader],
104
- ...
105
- )
106
- ",
107
- "task": "分析Agent的能力、工具、决策逻辑,输出JSON格式"
108
- }
109
- ```
110
-
111
- ### Step 4: 分析协作关系(模型)
112
-
113
- 分析Agent之间的协作:
114
-
115
- ```
116
- 关注点:
117
- - Agent之间如何通信
118
- - 执行顺序(顺序/并行/条件)
119
- - 共享状态如何管理
120
- ```
121
-
122
- ### Step 5: 输出结果
123
-
124
- 汇总Agent分析结果,包括评测建议。
125
-
126
- ## 工作流模式
127
-
128
- 根据业界最佳实践,识别以下工作流模式:
129
-
130
- ### 工作流 vs Agent
131
-
132
- | 类型 | 说明 | 适用场景 |
133
- |------|------|----------|
134
- | **Workflow** | 预定义代码路径编排LLM和工具 | 确定性任务、可预测 |
135
- | **Agent** | LLM动态指导自己的流程和工具使用 | 开放性问题、需要灵活性 |
136
-
137
- ### 工作流模式(从简单到复杂)
138
-
139
- | 模式 | 说明 | 适用场景 | 识别特征 |
140
- |------|------|----------|----------|
141
- | **Prompt Chaining** | 提示链,将任务分解为顺序步骤 | 任务可分解为固定子任务 | 多步骤LLM调用链 |
142
- | **Routing** | 路由,将输入分类到专用处理流程 | 复杂任务有明确分类 | 分类器+条件分支 |
143
- | **Parallelization** | 并行化,同时处理多个子任务 | 独立子任务可并行 | 多LLM调用+聚合 |
144
- | **Orchestrator-workers** | 编排器-工作者,中心LLM动态分配任务 | 复杂任务无法预知子任务 | 中心调度+动态分发 |
145
- | **Evaluator-optimizer** | 评估器-优化器,循环优化 | 有明确评估标准 | 生成-评估循环 |
146
-
147
- ### Agent模式
148
-
149
- 当LLM具备以下能力时使用Agent:
150
- - 理解复杂输入
151
- - 推理和规划
152
- - 可靠使用工具
153
- - 从错误中恢复
154
-
155
- Agent关键特征:
156
- - 从环境获取"ground truth"(工具调用结果、代码执行结果)
157
- - 在检查点暂停等待人类反馈
158
- - 包含停止条件(如最大迭代次数)
159
-
160
- ## 工具设计原则
161
-
162
- 工具设计应遵循以下原则(Agent-Computer Interface, ACI):
163
-
164
- ### 工具设计原则
165
-
166
- 1. **给模型足够token思考**:避免模型在思考过程中被截断
167
- 2. **格式接近自然文本**:让模型容易理解和生成
168
- 3. **无格式化开销**:避免需要精确计数的格式
169
- 4. **像对待HCI一样对待ACI**:投入同样多的精力设计工具接口
170
-
171
- ### 工具设计检查清单
172
-
173
- ```
174
- - [ ] 工具描述清晰,包含示例用法
175
- - [ ] 参数名称和描述直观
176
- - [ ] 边界情况有说明
177
- - [ ] 输入格式要求明确
178
- - [ ] 与其他工具边界清晰
179
- - [ ] 测试模型使用工具的错误模式
180
- - [ ] 使用绝对路径(避免相对路径错误)
181
- ```
182
-
183
- ## 决策逻辑类型
184
-
185
- | 类型 | 说明 | 特点 |
186
- |------|------|------|
187
- | **ReAct** | 推理-行动循环 | 每步思考后执行 |
188
- | **Plan-Execute** | 规划-执行 | 先规划全流程再执行 |
189
- | **Reflexion** | 反思改进 | 执行后反思优化 |
190
- | **MRKL** | 模块化推理 | 组合多个专家模块 |
191
- | **Evaluator-optimizer** | 评估-优化循环 | 基于反馈迭代改进 |
192
-
193
- ## Agent可靠性设计检查
194
-
195
- 根据最佳实践,检查Agent设计可靠性:
196
-
197
- ### 必须检查项
198
-
199
- 1. **停止条件**
200
- - 是否有最大迭代次数限制?
201
- - 是否有超时机制?
202
- - 是否定义了明确的完成条件?
203
-
204
- 2. **错误处理**
205
- - 工具调用失败如何处理?
206
- - 是否有重试机制?
207
- - 错误是否可恢复?
208
-
209
- 3. **检查点机制**
210
- - 是否在关键步骤暂停等待确认?
211
- - 是否有人类反馈回路?
212
- - 是否记录决策点?
213
-
214
- 4. **透明度**
215
- - 是否显示Agent的规划步骤?
216
- - 是否可追溯决策过程?
217
- - 是否有日志记录?
218
-
219
- ### 建议检查项
220
-
221
- 1. **安全性**
222
- - 是否有输入验证?
223
- - 是否有输出过滤?
224
- - 是否有访问控制?
225
-
226
- 2. **可观测性**
227
- - 是否记录每步的输入输出?
228
- - 是否有性能指标?
229
- - 是否有错误统计?
230
-
231
- ## 增强的评估建议
232
-
233
- 根据长时运行Agent测试的最佳实践:
234
-
235
- ### 评估维度扩展
236
-
237
- | 维度 | 指标 | 方法 | 优先级 |
238
- |------|------|------|--------|
239
- | **任务完成率** | success_rate, completion_rate | 自动验证 | 高 |
240
- | **工具使用可靠性** | tool_call_success_rate, error_recovery_rate | 日志分析 | 高 |
241
- | **决策质量** | reasoning_quality, planning_accuracy | LLM评估 | 高 |
242
- | **透明度** | decision_traceability, human_oversight | 审计日志 | 中 |
243
- | **效率** | latency, token_usage, iteration_count | 自动统计 | 中 |
244
- | **安全性** | guardrail_pass_rate, input_validation | 红队测试 | 高 |
245
-
246
- ### 长时运行Agent测试
247
-
248
- 根据harness设计原则:
249
-
250
- 1. **状态管理测试**
251
- - Agent能否正确维护状态?
252
- - 状态在长时间运行后是否一致?
253
- - 状态恢复机制是否有效?
254
-
255
- 2. **错误恢复测试**
256
- - 工具调用失败后能否恢复?
257
- - 是否有优雅降级机制?
258
- - 错误累积是否导致失败?
259
-
260
- 3. **资源管理测试**
261
- - 内存使用是否可控?
262
- - 是否有资源清理机制?
263
- - 长时间运行是否性能下降?
264
-
265
- ### AI-Resistant评估设计
266
-
267
- 根据AI-Resistant评估设计原则:
268
-
269
- 1. **防止评估数据泄露**
270
- - 使用未见过的测试用例
271
- - 动态生成评估数据
272
- - 分离训练和评估数据
273
-
274
- 2. **防止提示注入**
275
- - 评估输入多样化
276
- - 边界情况测试
277
- - 对抗性测试
278
-
279
- 3. **真实能力测试**
280
- - 开放式任务评估
281
- - 多步骤推理测试
282
- - 实际场景模拟
283
-
284
- ## 调用时机
285
-
286
- - 检测到Agent框架依赖时
287
- - AI功能开发前的设计阶段
288
- - 需要理解现有Agent系统时
289
- - 需要评估Agent可靠性时
290
-
291
- ## 示例
292
-
293
- **输入**:
294
- ```
295
- 项目目录:/project
296
- 框架:crewai(已检测到依赖)
297
- ```
298
-
299
- **Grep搜索**:
300
- ```
301
- 找到文件:agents/researcher.py, agents/writer.py, main.py
302
- ```
303
-
304
- **代码上下文**:
305
- ```python
306
- # agents/researcher.py
307
- research_agent = Agent(
308
- role="Researcher",
309
- goal="收集相关信息",
310
- tools=[WebSearchTool(), DocumentReaderTool()],
311
- verbose=True
312
- )
313
-
314
- # agents/writer.py
315
- writer_agent = Agent(
316
- role="Writer",
317
- goal="生成内容",
318
- tools=[FileWriterTool()],
319
- verbose=True
320
- )
321
-
322
- # main.py
323
- crew = Crew(
324
- agents=[research_agent, writer_agent],
325
- tasks=[research_task, write_task],
326
- process=Process.sequential
327
- )
328
- ```
329
-
330
- **输出**:
331
- ```json
332
- {
333
- "framework": "crewai",
334
- "agents": [
335
- {
336
- "name": "research_agent",
337
- "role": "Researcher",
338
- "tools": [
339
- {"name": "WebSearchTool", "description": "网络搜索"},
340
- {"name": "DocumentReaderTool", "description": "文档读取"}
341
- ],
342
- "decisionLogic": "ReAct"
343
- },
344
- {
345
- "name": "writer_agent",
346
- "role": "Writer",
347
- "tools": [
348
- {"name": "FileWriterTool", "description": "文件写入"}
349
- ],
350
- "decisionLogic": "ReAct"
351
- }
352
- ],
353
- "orchestration": {
354
- "type": "sequential",
355
- "description": "顺序执行"
356
- },
357
- "evaluationNeeds": {
358
- "dimensions": ["任务完成率", "工具使用正确性"],
359
- "suggestions": ["测试Agent能否正确调用工具"]
360
- }
361
- }
362
- ```
@@ -1,339 +0,0 @@
1
- ---
2
- name: rag-analyzer
3
- description: 当检测到RAG应用组件时,分析RAG架构的检索策略、向量存储、文档处理流程。用于理解检索增强生成系统的结构。
4
- type: ai
5
- ---
6
-
7
- ## 定位
8
-
9
- AI专用技能。分析RAG应用的架构、检索策略、向量存储配置和文档处理流程。
10
-
11
- ## 输入
12
-
13
- - 必须输入:RAG代码路径或项目目录
14
- - 可选输入:向量存储类型(已检测到的组件)
15
-
16
- ## 输出
17
-
18
- ```json
19
- {
20
- "architecture": {
21
- "type": "standard-rag",
22
- "description": "标准RAG架构:文档加载 → 分块 → 向量化 → 存储 → 检索 → 生成"
23
- },
24
- "components": {
25
- "documentLoader": {
26
- "type": "PDFLoader",
27
- "sources": ["local", "s3"],
28
- "formats": ["pdf", "txt", "md"]
29
- },
30
- "textSplitter": {
31
- "type": "RecursiveCharacterTextSplitter",
32
- "chunkSize": 500,
33
- "chunkOverlap": 50
34
- },
35
- "embeddings": {
36
- "type": "OpenAIEmbeddings",
37
- "model": "text-embedding-3-small",
38
- "dimension": 1536
39
- },
40
- "vectorStore": {
41
- "type": "ChromaDB",
42
- "collection": "documents",
43
- "persistDirectory": "./chroma_db"
44
- },
45
- "retriever": {
46
- "type": "similarity",
47
- "k": 4,
48
- "scoreThreshold": 0.7
49
- },
50
- "llm": {
51
- "type": "ChatOpenAI",
52
- "model": "gpt-4",
53
- "temperature": 0.1
54
- }
55
- },
56
- "retrievalStrategy": {
57
- "type": "similarity",
58
- "enhancements": [],
59
- "description": "基础相似度检索"
60
- },
61
- "generationConfig": {
62
- "promptTemplate": "基于以下上下文回答问题:\n{context}\n\n问题:{question}",
63
- "maxTokens": 1000
64
- },
65
- "evaluationNeeds": {
66
- "dimensions": ["检索准确率", "回答相关性", "上下文利用率", "幻觉率"],
67
- "suggestions": [
68
- "建议测试检索召回率(Recall@K)",
69
- "建议测试生成回答的准确性",
70
- "建议测试不同查询类型的表现"
71
- ]
72
- }
73
- }
74
- ```
75
-
76
- ## 执行步骤
77
-
78
- ### Step 1: 识别RAG框架(确定性)
79
-
80
- 基于依赖和代码特征识别RAG框架:
81
-
82
- ```
83
- 框架识别规则:
84
- - langchain: 依赖langchain,代码中有 VectorStore, Retriever, Document
85
- - llamaindex: 依赖llama-index(导入名llama_index),代码中有 Index, QueryEngine, Node
86
- - haystack: 依赖haystack,代码中有 Pipeline, DocumentStore
87
- - custom: 自定义RAG实现
88
- ```
89
-
90
- ### Step 2: Grep获取组件定义(高效)
91
-
92
- 搜索RAG组件模式:
93
-
94
- ```bash
95
- # LangChain风格
96
- grep -r -n -A 5 "VectorStore\|Retriever\|Document\|Embeddings" --include="*.py" .
97
-
98
- # LlamaIndex风格
99
- grep -r -n -A 5 "VectorStoreIndex\|QueryEngine\|NodeParser" --include="*.py" .
100
-
101
- # 文档加载
102
- grep -r -n -A 5 "Loader\|Document\|load\|split" --include="*.py" .
103
- ```
104
-
105
- ### Step 3: 分析组件配置(模型)
106
-
107
- 基于代码上下文分析RAG组件:
108
-
109
- ```
110
- 模型输入:
111
- {
112
- "framework": "langchain",
113
- "codeContexts": "
114
- # rag.py
115
- vectorstore = Chroma.from_documents(
116
- documents=splits,
117
- embedding=OpenAIEmbeddings(),
118
- persist_directory='./chroma_db'
119
- )
120
- retriever = vectorstore.as_retriever(
121
- search_type='similarity',
122
- search_kwargs={'k': 4}
123
- )
124
- ",
125
- "task": "分析RAG组件配置,输出JSON格式"
126
- }
127
- ```
128
-
129
- ### Step 4: 分析检索策略(模型)
130
-
131
- 分析检索增强策略:
132
-
133
- ```
134
- 关注点:
135
- - 基础检索:相似度、MMR、混合检索
136
- - 增强策略:重排序、查询改写、多查询
137
- - 过滤条件:元数据过滤、时间范围
138
- ```
139
-
140
- ### Step 5: 输出结果
141
-
142
- 汇总RAG分析结果,包括评测建议。
143
-
144
- ## Contextual Retrieval
145
-
146
- 根据业界最佳实践,Contextual Retrieval技术:
147
-
148
- ### 问题背景
149
-
150
- 传统RAG在分块和编码时会丢失每个chunk所在文档的上下文,导致系统常常无法从知识库中检索到相关信息。
151
-
152
- ### 解决方案:Contextual Retrieval
153
-
154
- 使用两种子技术:
155
- 1. **Contextual Embeddings**:上下文嵌入,在向量化之前为每个chunk添加说明其所在文档上下文的前缀
156
- 2. **Contextual BM25**:上下文BM25,对添加了上下文前缀的chunk建立BM25关键词索引
157
-
158
- **效果**:显著提升检索质量。
159
-
160
- ### 何时使用
161
-
162
- - 知识库小于200,000 tokens(约500页)时无需检索:直接将整个知识库放入长prompt
163
- - 长prompt方案可配合prompt caching降低成本;知识库超过该规模时再采用Contextual Retrieval
164
-
165
- ### 检索策略类型
166
-
167
- | 类型 | 说明 | 适用场景 |
168
- |------|------|----------|
169
- | **similarity** | 相似度检索 | 简单问答 |
170
- | **mmr** | 最大边际相关性 | 多样性需求 |
171
- | **similarity_score_threshold** | 带阈值过滤 | 高精度需求 |
172
- | **hybrid** | 向量+关键词混合 | 精确匹配需求 |
173
- | **multi_query** | 多查询扩展 | 复杂问题 |
174
- | **rerank** | 重排序 | 高质量需求 |
175
- | **contextual** | 上下文增强检索 | 复杂文档检索 |
176
-
177
- ## 分块策略优化
178
-
179
- 根据内容类型选择分块大小,并结合下列技术优化分块效果:
180
-
181
- ### 分块大小选择
182
-
183
- | 场景 | 建议chunk size | 理由 |
184
- |------|---------------|------|
185
- | 代码 | 100-200 tokens | 保持函数/类完整 |
186
- | 短文档 | 300-500 tokens | 保持语义完整 |
187
- | 长文档 | 500-1000 tokens | 平衡精度和覆盖 |
188
- | 复杂结构 | 可变大小 | 按章节/段落 |
189
-
190
- ### 分块优化技术
191
-
192
- 1. **重叠**:chunk_overlap建议为chunk_size的10-20%
193
- 2. **父子索引**:小chunk用于检索,大chunk用于生成
194
- 3. **元数据**:添加来源、标题、摘要等元数据
195
- 4. **上下文前缀**:为每个chunk添加文档上下文
196
-
197
- ## 向量存储选型原则
198
-
199
- | 场景 | 推荐选择 | 理由 |
200
- |------|----------|------|
201
- | 本地开发、轻量级 | 轻量级向量库 | 易于集成、无需额外服务 |
202
- | 生产环境、需要扩展 | 云端向量数据库 | 托管服务、自动扩展 |
203
- | 需要复杂过滤 | 高性能向量库 | 过滤能力强 |
204
- | 大规模数据 | 分布式方案 | 水平扩展能力 |
205
-
206
- ## RAG评估维度
207
-
208
- 扩展评估维度:
209
-
210
- ### 检索质量评估
211
-
212
- | 指标 | 说明 | 测量方法 |
213
- |------|------|----------|
214
- | **Precision@K** | Top-K结果中相关文档比例 | 标注数据 |
215
- | **Recall@K** | 相关文档被召回的比例 | 标注数据 |
216
- | **MRR** | 第一个相关文档的排名倒数 | 自动计算 |
217
- | **NDCG** | 归一化折损累计增益 | 标注数据 |
218
-
219
- ### 生成质量评估
220
-
221
- | 指标 | 说明 | 测量方法 |
222
- |------|------|----------|
223
- | **Context Relevance** | 检索内容与问题的相关程度 | LLM评估 |
224
- | **Answer Faithfulness** | 回答与检索内容的一致性 | LLM评估 |
225
- | **Answer Relevance** | 回答与问题的相关程度 | LLM评估 |
226
- | **Hallucination Rate** | 幻觉内容比例 | 事实核查 |
227
-
228
- ### 上下文优化评估
229
-
230
- | 指标 | 说明 | 测量方法 |
231
- |------|------|----------|
232
- | **Context Utilization** | 模型利用检索内容的程度 | 日志分析 |
233
- | **Chunk Quality** | 分块是否保留完整语义 | 人工评估 |
234
- | **Retrieval Latency** | 检索延迟 | 自动统计 |
235
-
236
- ## 调用时机
237
-
238
- - 检测到RAG应用组件时
239
- - AI功能开发前的设计阶段
240
- - 需要理解现有RAG系统时
241
-
242
- ## 示例
243
-
244
- **输入**:
245
- ```
246
- 项目目录:/project
247
- 向量存储:ChromaDB(已检测)
248
- LLM:OpenAI(已检测)
249
- ```
250
-
251
- **Grep搜索**:
252
- ```
253
- 找到文件:rag/pipeline.py, rag/embeddings.py, rag/retriever.py
254
- ```
255
-
256
- **代码上下文**:
257
- ```python
258
- # rag/pipeline.py
259
- from langchain.document_loaders import PyPDFLoader
260
- from langchain.text_splitter import RecursiveCharacterTextSplitter
261
- from langchain.embeddings import OpenAIEmbeddings
262
- from langchain.vectorstores import Chroma
263
- from langchain.chains import RetrievalQA
264
-
265
- loader = PyPDFLoader("docs.pdf")
266
- documents = loader.load()
267
-
268
- text_splitter = RecursiveCharacterTextSplitter(
269
- chunk_size=500,
270
- chunk_overlap=50
271
- )
272
- splits = text_splitter.split_documents(documents)
273
-
274
- vectorstore = Chroma.from_documents(
275
- documents=splits,
276
- embedding=OpenAIEmbeddings(),
277
- persist_directory="./chroma_db"
278
- )
279
-
280
- retriever = vectorstore.as_retriever(
281
- search_type="similarity",
282
- search_kwargs={"k": 4}
283
- )
284
-
285
- qa_chain = RetrievalQA.from_chain_type(
286
- llm=ChatOpenAI(model="gpt-4"),
287
- retriever=retriever,
288
- return_source_documents=True
289
- )
290
- ```
291
-
292
- **输出**:
293
- ```json
294
- {
295
- "architecture": {
296
- "type": "standard-rag",
297
- "description": "标准RAG:PDF加载 → 分块 → 向量化 → Chroma存储 → 相似度检索 → GPT-4生成"
298
- },
299
- "components": {
300
- "documentLoader": {
301
- "type": "PyPDFLoader",
302
- "formats": ["pdf"]
303
- },
304
- "textSplitter": {
305
- "type": "RecursiveCharacterTextSplitter",
306
- "chunkSize": 500,
307
- "chunkOverlap": 50
308
- },
309
- "embeddings": {
310
- "type": "OpenAIEmbeddings"
311
- },
312
- "vectorStore": {
313
- "type": "Chroma",
314
- "persistDirectory": "./chroma_db"
315
- },
316
- "retriever": {
317
- "type": "similarity",
318
- "k": 4
319
- },
320
- "llm": {
321
- "type": "ChatOpenAI",
322
- "model": "gpt-4"
323
- }
324
- },
325
- "retrievalStrategy": {
326
- "type": "similarity",
327
- "enhancements": [],
328
- "description": "基础相似度检索,返回top-4文档"
329
- },
330
- "evaluationNeeds": {
331
- "dimensions": ["检索准确率", "回答相关性", "来源引用准确性"],
332
- "suggestions": [
333
- "测试PDF文档的解析质量",
334
- "测试不同chunk大小对检索效果的影响",
335
- "测试问答准确性"
336
- ]
337
- }
338
- }
339
- ```