@shakudo/kaji-setup-external 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (411) hide show
  1. package/README.md +155 -0
  2. package/assets/skills/ci-cd/.claude-plugin/plugin.json +8 -0
  3. package/assets/skills/ci-cd/SKILL.md +573 -0
  4. package/assets/skills/ci-cd/assets/templates/github-actions/docker-build.yml +164 -0
  5. package/assets/skills/ci-cd/assets/templates/github-actions/go-ci.yml +420 -0
  6. package/assets/skills/ci-cd/assets/templates/github-actions/node-ci.yml +313 -0
  7. package/assets/skills/ci-cd/assets/templates/github-actions/python-ci.yml +388 -0
  8. package/assets/skills/ci-cd/assets/templates/github-actions/security-scan.yml +416 -0
  9. package/assets/skills/ci-cd/assets/templates/gitlab-ci/docker-build.yml +298 -0
  10. package/assets/skills/ci-cd/assets/templates/gitlab-ci/go-ci.yml +548 -0
  11. package/assets/skills/ci-cd/assets/templates/gitlab-ci/node-ci.yml +334 -0
  12. package/assets/skills/ci-cd/assets/templates/gitlab-ci/python-ci.yml +472 -0
  13. package/assets/skills/ci-cd/assets/templates/gitlab-ci/security-scan.yml +479 -0
  14. package/assets/skills/ci-cd/references/best_practices.md +675 -0
  15. package/assets/skills/ci-cd/references/devsecops.md +862 -0
  16. package/assets/skills/ci-cd/references/optimization.md +651 -0
  17. package/assets/skills/ci-cd/references/security.md +611 -0
  18. package/assets/skills/ci-cd/references/troubleshooting.md +656 -0
  19. package/assets/skills/ci-cd/scripts/ci_health.py +301 -0
  20. package/assets/skills/ci-cd/scripts/pipeline_analyzer.py +440 -0
  21. package/assets/skills/context-optimization/CONTRIBUTING.md +78 -0
  22. package/assets/skills/context-optimization/LICENSE +22 -0
  23. package/assets/skills/context-optimization/README.md +228 -0
  24. package/assets/skills/context-optimization/SKILL.md +104 -0
  25. package/assets/skills/context-optimization/docs/agentskills.md +1264 -0
  26. package/assets/skills/context-optimization/docs/blogs.md +1230 -0
  27. package/assets/skills/context-optimization/docs/claude_research.md +85 -0
  28. package/assets/skills/context-optimization/docs/compression.md +298 -0
  29. package/assets/skills/context-optimization/docs/gemini_research.md +22 -0
  30. package/assets/skills/context-optimization/docs/hncapsule.md +92 -0
  31. package/assets/skills/context-optimization/docs/netflix_context.md +10 -0
  32. package/assets/skills/context-optimization/docs/vercel_tool.md +140 -0
  33. package/assets/skills/context-optimization/examples/book-sft-pipeline/README.md +78 -0
  34. package/assets/skills/context-optimization/examples/book-sft-pipeline/SKILL.md +380 -0
  35. package/assets/skills/context-optimization/examples/book-sft-pipeline/examples/gertrude-stein/README.md +168 -0
  36. package/assets/skills/context-optimization/examples/book-sft-pipeline/examples/gertrude-stein/dataset_sample.jsonl +5 -0
  37. package/assets/skills/context-optimization/examples/book-sft-pipeline/examples/gertrude-stein/pangram/Screenshot 2025-12-27 at 3.05.04 AM.png +0 -0
  38. package/assets/skills/context-optimization/examples/book-sft-pipeline/examples/gertrude-stein/pangram/Screenshot 2025-12-27 at 3.05.36 AM.png +0 -0
  39. package/assets/skills/context-optimization/examples/book-sft-pipeline/examples/gertrude-stein/pangram/Screenshot 2025-12-27 at 3.07.18 AM.png +0 -0
  40. package/assets/skills/context-optimization/examples/book-sft-pipeline/examples/gertrude-stein/sample_outputs.md +63 -0
  41. package/assets/skills/context-optimization/examples/book-sft-pipeline/examples/gertrude-stein/training_config.json +80 -0
  42. package/assets/skills/context-optimization/examples/book-sft-pipeline/references/segmentation-strategies.md +324 -0
  43. package/assets/skills/context-optimization/examples/book-sft-pipeline/references/tinker-format.md +211 -0
  44. package/assets/skills/context-optimization/examples/book-sft-pipeline/references/tinker.txt +3176 -0
  45. package/assets/skills/context-optimization/examples/book-sft-pipeline/scripts/pipeline_example.py +187 -0
  46. package/assets/skills/context-optimization/examples/digital-brain-skill/AGENT.md +35 -0
  47. package/assets/skills/context-optimization/examples/digital-brain-skill/HOW-SKILLS-BUILT-THIS.md +407 -0
  48. package/assets/skills/context-optimization/examples/digital-brain-skill/README.md +209 -0
  49. package/assets/skills/context-optimization/examples/digital-brain-skill/SKILL.md +203 -0
  50. package/assets/skills/context-optimization/examples/digital-brain-skill/SKILLS-MAPPING.md +219 -0
  51. package/assets/skills/context-optimization/examples/digital-brain-skill/agents/AGENTS.md +82 -0
  52. package/assets/skills/context-optimization/examples/digital-brain-skill/agents/scripts/content_ideas.py +132 -0
  53. package/assets/skills/context-optimization/examples/digital-brain-skill/agents/scripts/idea_to_draft.py +181 -0
  54. package/assets/skills/context-optimization/examples/digital-brain-skill/agents/scripts/stale_contacts.py +139 -0
  55. package/assets/skills/context-optimization/examples/digital-brain-skill/agents/scripts/weekly_review.py +121 -0
  56. package/assets/skills/context-optimization/examples/digital-brain-skill/content/CONTENT.md +88 -0
  57. package/assets/skills/context-optimization/examples/digital-brain-skill/content/calendar.md +108 -0
  58. package/assets/skills/context-optimization/examples/digital-brain-skill/content/engagement.jsonl +2 -0
  59. package/assets/skills/context-optimization/examples/digital-brain-skill/content/ideas.jsonl +2 -0
  60. package/assets/skills/context-optimization/examples/digital-brain-skill/content/posts.jsonl +2 -0
  61. package/assets/skills/context-optimization/examples/digital-brain-skill/content/templates/linkedin-post.md +102 -0
  62. package/assets/skills/context-optimization/examples/digital-brain-skill/content/templates/newsletter.md +92 -0
  63. package/assets/skills/context-optimization/examples/digital-brain-skill/content/templates/thread.md +73 -0
  64. package/assets/skills/context-optimization/examples/digital-brain-skill/examples/content-workflow.md +204 -0
  65. package/assets/skills/context-optimization/examples/digital-brain-skill/examples/meeting-prep.md +243 -0
  66. package/assets/skills/context-optimization/examples/digital-brain-skill/identity/IDENTITY.md +46 -0
  67. package/assets/skills/context-optimization/examples/digital-brain-skill/identity/bio-variants.md +101 -0
  68. package/assets/skills/context-optimization/examples/digital-brain-skill/identity/brand.md +165 -0
  69. package/assets/skills/context-optimization/examples/digital-brain-skill/identity/prompts/content-generation.xml +46 -0
  70. package/assets/skills/context-optimization/examples/digital-brain-skill/identity/prompts/reply-generator.xml +40 -0
  71. package/assets/skills/context-optimization/examples/digital-brain-skill/identity/values.yaml +60 -0
  72. package/assets/skills/context-optimization/examples/digital-brain-skill/identity/voice.md +165 -0
  73. package/assets/skills/context-optimization/examples/digital-brain-skill/knowledge/KNOWLEDGE.md +85 -0
  74. package/assets/skills/context-optimization/examples/digital-brain-skill/knowledge/bookmarks.jsonl +2 -0
  75. package/assets/skills/context-optimization/examples/digital-brain-skill/knowledge/competitors.md +117 -0
  76. package/assets/skills/context-optimization/examples/digital-brain-skill/knowledge/learning.yaml +74 -0
  77. package/assets/skills/context-optimization/examples/digital-brain-skill/knowledge/research/_template.md +79 -0
  78. package/assets/skills/context-optimization/examples/digital-brain-skill/network/NETWORK.md +110 -0
  79. package/assets/skills/context-optimization/examples/digital-brain-skill/network/circles.yaml +80 -0
  80. package/assets/skills/context-optimization/examples/digital-brain-skill/network/contacts.jsonl +2 -0
  81. package/assets/skills/context-optimization/examples/digital-brain-skill/network/interactions.jsonl +2 -0
  82. package/assets/skills/context-optimization/examples/digital-brain-skill/network/intros.md +92 -0
  83. package/assets/skills/context-optimization/examples/digital-brain-skill/operations/OPERATIONS.md +75 -0
  84. package/assets/skills/context-optimization/examples/digital-brain-skill/operations/goals.yaml +83 -0
  85. package/assets/skills/context-optimization/examples/digital-brain-skill/operations/meetings.jsonl +2 -0
  86. package/assets/skills/context-optimization/examples/digital-brain-skill/operations/metrics.jsonl +2 -0
  87. package/assets/skills/context-optimization/examples/digital-brain-skill/operations/reviews/_weekly_template.md +114 -0
  88. package/assets/skills/context-optimization/examples/digital-brain-skill/operations/todos.md +76 -0
  89. package/assets/skills/context-optimization/examples/digital-brain-skill/package.json +41 -0
  90. package/assets/skills/context-optimization/examples/digital-brain-skill/references/file-formats.md +386 -0
  91. package/assets/skills/context-optimization/examples/digital-brain-skill/scripts/install.sh +79 -0
  92. package/assets/skills/context-optimization/examples/interleaved_thinking/README.md +620 -0
  93. package/assets/skills/context-optimization/examples/interleaved_thinking/SKILL.md +221 -0
  94. package/assets/skills/context-optimization/examples/interleaved_thinking/docs/agentthinking.md +63 -0
  95. package/assets/skills/context-optimization/examples/interleaved_thinking/docs/interleavedthinking.md +610 -0
  96. package/assets/skills/context-optimization/examples/interleaved_thinking/docs/m2-1.md +224 -0
  97. package/assets/skills/context-optimization/examples/interleaved_thinking/examples/01_basic_capture.py +76 -0
  98. package/assets/skills/context-optimization/examples/interleaved_thinking/examples/02_tool_usage.py +187 -0
  99. package/assets/skills/context-optimization/examples/interleaved_thinking/examples/03_full_optimization.py +1222 -0
  100. package/assets/skills/context-optimization/examples/interleaved_thinking/generated_skills/comprehensive-research-agent/SKILL.md +90 -0
  101. package/assets/skills/context-optimization/examples/interleaved_thinking/generated_skills/comprehensive-research-agent/references/optimization_summary.json +9 -0
  102. package/assets/skills/context-optimization/examples/interleaved_thinking/generated_skills/comprehensive-research-agent/references/optimized_prompt.txt +1 -0
  103. package/assets/skills/context-optimization/examples/interleaved_thinking/generated_skills/comprehensive-research-agent/references/patterns_found.json +205 -0
  104. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/final_prompt.txt +67 -0
  105. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_1/analysis.txt +48 -0
  106. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_1/optimization.txt +15 -0
  107. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_1/optimized_prompt.txt +1 -0
  108. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_1/trace.txt +178 -0
  109. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_10/analysis.txt +47 -0
  110. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_10/trace.txt +162 -0
  111. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_2/analysis.txt +48 -0
  112. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_2/optimization.txt +130 -0
  113. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_2/optimized_prompt.txt +72 -0
  114. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_2/trace.txt +156 -0
  115. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_3/analysis.txt +46 -0
  116. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_3/optimization.txt +147 -0
  117. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_3/optimized_prompt.txt +84 -0
  118. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_3/trace.txt +159 -0
  119. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_4/analysis.txt +46 -0
  120. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_4/optimization.txt +134 -0
  121. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_4/optimized_prompt.txt +67 -0
  122. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_4/trace.txt +165 -0
  123. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_5/analysis.txt +50 -0
  124. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_5/optimization.txt +135 -0
  125. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_5/optimized_prompt.txt +71 -0
  126. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_5/trace.txt +146 -0
  127. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_6/analysis.txt +15 -0
  128. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_6/optimization.txt +15 -0
  129. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_6/optimized_prompt.txt +1 -0
  130. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_6/trace.txt +147 -0
  131. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_7/analysis.txt +46 -0
  132. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_7/optimization.txt +103 -0
  133. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_7/optimized_prompt.txt +45 -0
  134. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_7/trace.txt +134 -0
  135. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_8/analysis.txt +47 -0
  136. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_8/optimization.txt +114 -0
  137. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_8/optimized_prompt.txt +60 -0
  138. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_8/trace.txt +135 -0
  139. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_9/analysis.txt +44 -0
  140. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_9/optimization.txt +106 -0
  141. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_9/optimized_prompt.txt +51 -0
  142. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/iteration_9/trace.txt +170 -0
  143. package/assets/skills/context-optimization/examples/interleaved_thinking/optimization_artifacts/summary.json +11 -0
  144. package/assets/skills/context-optimization/examples/interleaved_thinking/pyproject.toml +70 -0
  145. package/assets/skills/context-optimization/examples/interleaved_thinking/reasoning_trace_optimizer/__init__.py +53 -0
  146. package/assets/skills/context-optimization/examples/interleaved_thinking/reasoning_trace_optimizer/analyzer.py +465 -0
  147. package/assets/skills/context-optimization/examples/interleaved_thinking/reasoning_trace_optimizer/capture.py +417 -0
  148. package/assets/skills/context-optimization/examples/interleaved_thinking/reasoning_trace_optimizer/cli.py +271 -0
  149. package/assets/skills/context-optimization/examples/interleaved_thinking/reasoning_trace_optimizer/loop.py +468 -0
  150. package/assets/skills/context-optimization/examples/interleaved_thinking/reasoning_trace_optimizer/models.py +193 -0
  151. package/assets/skills/context-optimization/examples/interleaved_thinking/reasoning_trace_optimizer/optimizer.py +449 -0
  152. package/assets/skills/context-optimization/examples/interleaved_thinking/reasoning_trace_optimizer/skill_generator.py +502 -0
  153. package/assets/skills/context-optimization/examples/interleaved_thinking/tests/__init__.py +1 -0
  154. package/assets/skills/context-optimization/examples/interleaved_thinking/tests/test_models.py +144 -0
  155. package/assets/skills/context-optimization/examples/llm-as-judge-skills/.prettierrc +8 -0
  156. package/assets/skills/context-optimization/examples/llm-as-judge-skills/CONTRIBUTING.md +78 -0
  157. package/assets/skills/context-optimization/examples/llm-as-judge-skills/LICENSE +21 -0
  158. package/assets/skills/context-optimization/examples/llm-as-judge-skills/README.md +659 -0
  159. package/assets/skills/context-optimization/examples/llm-as-judge-skills/agents/evaluator-agent/evaluator-agent.md +177 -0
  160. package/assets/skills/context-optimization/examples/llm-as-judge-skills/agents/index.md +114 -0
  161. package/assets/skills/context-optimization/examples/llm-as-judge-skills/agents/orchestrator-agent/orchestrator-agent.md +205 -0
  162. package/assets/skills/context-optimization/examples/llm-as-judge-skills/agents/research-agent/research-agent.md +183 -0
  163. package/assets/skills/context-optimization/examples/llm-as-judge-skills/env.example +6 -0
  164. package/assets/skills/context-optimization/examples/llm-as-judge-skills/eslint.config.js +18 -0
  165. package/assets/skills/context-optimization/examples/llm-as-judge-skills/examples/basic-evaluation.ts +89 -0
  166. package/assets/skills/context-optimization/examples/llm-as-judge-skills/examples/full-evaluation-workflow.ts +136 -0
  167. package/assets/skills/context-optimization/examples/llm-as-judge-skills/examples/generate-rubric.ts +67 -0
  168. package/assets/skills/context-optimization/examples/llm-as-judge-skills/examples/pairwise-comparison.ts +97 -0
  169. package/assets/skills/context-optimization/examples/llm-as-judge-skills/package.json +79 -0
  170. package/assets/skills/context-optimization/examples/llm-as-judge-skills/prompts/agent-system/orchestrator-prompt.md +197 -0
  171. package/assets/skills/context-optimization/examples/llm-as-judge-skills/prompts/evaluation/direct-scoring-prompt.md +153 -0
  172. package/assets/skills/context-optimization/examples/llm-as-judge-skills/prompts/evaluation/pairwise-comparison-prompt.md +200 -0
  173. package/assets/skills/context-optimization/examples/llm-as-judge-skills/prompts/index.md +138 -0
  174. package/assets/skills/context-optimization/examples/llm-as-judge-skills/prompts/research/research-synthesis-prompt.md +171 -0
  175. package/assets/skills/context-optimization/examples/llm-as-judge-skills/skills/context-fundamentals/context-fundamentals.md +114 -0
  176. package/assets/skills/context-optimization/examples/llm-as-judge-skills/skills/index.md +79 -0
  177. package/assets/skills/context-optimization/examples/llm-as-judge-skills/skills/llm-evaluator/llm-evaluator.md +77 -0
  178. package/assets/skills/context-optimization/examples/llm-as-judge-skills/skills/tool-design/tool-design.md +198 -0
  179. package/assets/skills/context-optimization/examples/llm-as-judge-skills/src/agents/evaluator.ts +112 -0
  180. package/assets/skills/context-optimization/examples/llm-as-judge-skills/src/agents/index.ts +3 -0
  181. package/assets/skills/context-optimization/examples/llm-as-judge-skills/src/config/index.ts +18 -0
  182. package/assets/skills/context-optimization/examples/llm-as-judge-skills/src/index.ts +19 -0
  183. package/assets/skills/context-optimization/examples/llm-as-judge-skills/src/tools/evaluation/direct-score.ts +164 -0
  184. package/assets/skills/context-optimization/examples/llm-as-judge-skills/src/tools/evaluation/generate-rubric.ts +161 -0
  185. package/assets/skills/context-optimization/examples/llm-as-judge-skills/src/tools/evaluation/index.ts +9 -0
  186. package/assets/skills/context-optimization/examples/llm-as-judge-skills/src/tools/evaluation/pairwise-compare.ts +255 -0
  187. package/assets/skills/context-optimization/examples/llm-as-judge-skills/tests/evaluation.test.ts +233 -0
  188. package/assets/skills/context-optimization/examples/llm-as-judge-skills/tests/setup.ts +27 -0
  189. package/assets/skills/context-optimization/examples/llm-as-judge-skills/tests/skills.test.ts +213 -0
  190. package/assets/skills/context-optimization/examples/llm-as-judge-skills/tools/evaluation/direct-score.md +159 -0
  191. package/assets/skills/context-optimization/examples/llm-as-judge-skills/tools/evaluation/generate-rubric.md +189 -0
  192. package/assets/skills/context-optimization/examples/llm-as-judge-skills/tools/evaluation/pairwise-compare.md +182 -0
  193. package/assets/skills/context-optimization/examples/llm-as-judge-skills/tools/index.md +141 -0
  194. package/assets/skills/context-optimization/examples/llm-as-judge-skills/tools/orchestration/delegate-to-agent.md +171 -0
  195. package/assets/skills/context-optimization/examples/llm-as-judge-skills/tools/research/read-url.md +162 -0
  196. package/assets/skills/context-optimization/examples/llm-as-judge-skills/tools/research/web-search.md +128 -0
  197. package/assets/skills/context-optimization/examples/llm-as-judge-skills/tsconfig.json +26 -0
  198. package/assets/skills/context-optimization/examples/llm-as-judge-skills/vitest.config.ts +20 -0
  199. package/assets/skills/context-optimization/examples/x-to-book-system/PRD.md +644 -0
  200. package/assets/skills/context-optimization/examples/x-to-book-system/README.md +181 -0
  201. package/assets/skills/context-optimization/examples/x-to-book-system/SKILLS-MAPPING.md +187 -0
  202. package/assets/skills/context-optimization/researcher/example_output.md +75 -0
  203. package/assets/skills/context-optimization/researcher/llm-as-a-judge.md +362 -0
  204. package/assets/skills/context-optimization/skills/advanced-evaluation/SKILL.md +454 -0
  205. package/assets/skills/context-optimization/skills/advanced-evaluation/references/bias-mitigation.md +288 -0
  206. package/assets/skills/context-optimization/skills/advanced-evaluation/references/implementation-patterns.md +315 -0
  207. package/assets/skills/context-optimization/skills/advanced-evaluation/references/metrics-guide.md +331 -0
  208. package/assets/skills/context-optimization/skills/advanced-evaluation/scripts/evaluation_example.py +337 -0
  209. package/assets/skills/context-optimization/skills/bdi-mental-states/SKILL.md +295 -0
  210. package/assets/skills/context-optimization/skills/bdi-mental-states/references/bdi-ontology-core.md +207 -0
  211. package/assets/skills/context-optimization/skills/bdi-mental-states/references/framework-integration.md +582 -0
  212. package/assets/skills/context-optimization/skills/bdi-mental-states/references/rdf-examples.md +315 -0
  213. package/assets/skills/context-optimization/skills/bdi-mental-states/references/sparql-competency.md +420 -0
  214. package/assets/skills/context-optimization/skills/context-compression/SKILL.md +265 -0
  215. package/assets/skills/context-optimization/skills/context-compression/references/evaluation-framework.md +213 -0
  216. package/assets/skills/context-optimization/skills/context-compression/scripts/compression_evaluator.py +658 -0
  217. package/assets/skills/context-optimization/skills/context-degradation/SKILL.md +231 -0
  218. package/assets/skills/context-optimization/skills/context-degradation/references/patterns.md +314 -0
  219. package/assets/skills/context-optimization/skills/context-degradation/scripts/degradation_detector.py +419 -0
  220. package/assets/skills/context-optimization/skills/context-fundamentals/SKILL.md +185 -0
  221. package/assets/skills/context-optimization/skills/context-fundamentals/references/context-components.md +283 -0
  222. package/assets/skills/context-optimization/skills/context-fundamentals/scripts/context_manager.py +370 -0
  223. package/assets/skills/context-optimization/skills/context-optimization/SKILL.md +179 -0
  224. package/assets/skills/context-optimization/skills/context-optimization/references/optimization_techniques.md +272 -0
  225. package/assets/skills/context-optimization/skills/context-optimization/scripts/compaction.py +379 -0
  226. package/assets/skills/context-optimization/skills/evaluation/SKILL.md +231 -0
  227. package/assets/skills/context-optimization/skills/evaluation/references/metrics.md +339 -0
  228. package/assets/skills/context-optimization/skills/evaluation/scripts/evaluator.py +474 -0
  229. package/assets/skills/context-optimization/skills/filesystem-context/SKILL.md +321 -0
  230. package/assets/skills/context-optimization/skills/filesystem-context/references/implementation-patterns.md +549 -0
  231. package/assets/skills/context-optimization/skills/filesystem-context/scripts/filesystem_context.py +353 -0
  232. package/assets/skills/context-optimization/skills/hosted-agents/SKILL.md +279 -0
  233. package/assets/skills/context-optimization/skills/hosted-agents/references/infrastructure-patterns.md +700 -0
  234. package/assets/skills/context-optimization/skills/hosted-agents/scripts/sandbox_manager.py +495 -0
  235. package/assets/skills/context-optimization/skills/memory-systems/SKILL.md +221 -0
  236. package/assets/skills/context-optimization/skills/memory-systems/references/implementation.md +458 -0
  237. package/assets/skills/context-optimization/skills/memory-systems/scripts/memory_store.py +396 -0
  238. package/assets/skills/context-optimization/skills/multi-agent-patterns/SKILL.md +255 -0
  239. package/assets/skills/context-optimization/skills/multi-agent-patterns/references/frameworks.md +433 -0
  240. package/assets/skills/context-optimization/skills/multi-agent-patterns/scripts/coordination.py +439 -0
  241. package/assets/skills/context-optimization/skills/project-development/SKILL.md +342 -0
  242. package/assets/skills/context-optimization/skills/project-development/references/case-studies.md +388 -0
  243. package/assets/skills/context-optimization/skills/project-development/references/pipeline-patterns.md +610 -0
  244. package/assets/skills/context-optimization/skills/project-development/scripts/pipeline_template.py +677 -0
  245. package/assets/skills/context-optimization/skills/tool-design/SKILL.md +311 -0
  246. package/assets/skills/context-optimization/skills/tool-design/references/architectural_reduction.md +210 -0
  247. package/assets/skills/context-optimization/skills/tool-design/references/best_practices.md +176 -0
  248. package/assets/skills/context-optimization/skills/tool-design/scripts/description_generator.py +237 -0
  249. package/assets/skills/context-optimization/template/SKILL.md +98 -0
  250. package/assets/skills/dremio-analytics/SKILL.md +287 -0
  251. package/assets/skills/elevenlabs-voice/SKILL.md +269 -0
  252. package/assets/skills/git-workflow/SKILL.md +266 -0
  253. package/assets/skills/gitops-workflows/.claude-plugin/plugin.json +8 -0
  254. package/assets/skills/gitops-workflows/SKILL.md +568 -0
  255. package/assets/skills/gitops-workflows/assets/applicationsets/cluster-generator.yaml +32 -0
  256. package/assets/skills/gitops-workflows/assets/argocd/install-argocd-3.x.yaml +92 -0
  257. package/assets/skills/gitops-workflows/assets/flux/flux-bootstrap-github.sh +49 -0
  258. package/assets/skills/gitops-workflows/assets/flux/oci-helmrelease.yaml +38 -0
  259. package/assets/skills/gitops-workflows/assets/progressive-delivery/argo-rollouts-canary.yaml +62 -0
  260. package/assets/skills/gitops-workflows/assets/secrets/sops-age-config.yaml +33 -0
  261. package/assets/skills/gitops-workflows/references/argocd_vs_flux.md +243 -0
  262. package/assets/skills/gitops-workflows/references/best_practices.md +160 -0
  263. package/assets/skills/gitops-workflows/references/multi_cluster.md +80 -0
  264. package/assets/skills/gitops-workflows/references/oci_artifacts.md +290 -0
  265. package/assets/skills/gitops-workflows/references/progressive_delivery.md +94 -0
  266. package/assets/skills/gitops-workflows/references/repo_patterns.md +184 -0
  267. package/assets/skills/gitops-workflows/references/secret_management.md +213 -0
  268. package/assets/skills/gitops-workflows/references/troubleshooting.md +134 -0
  269. package/assets/skills/gitops-workflows/scripts/applicationset_generator.py +156 -0
  270. package/assets/skills/gitops-workflows/scripts/check_argocd_health.py +275 -0
  271. package/assets/skills/gitops-workflows/scripts/check_flux_health.py +418 -0
  272. package/assets/skills/gitops-workflows/scripts/oci_artifact_checker.py +150 -0
  273. package/assets/skills/gitops-workflows/scripts/promotion_validator.py +88 -0
  274. package/assets/skills/gitops-workflows/scripts/secret_audit.py +178 -0
  275. package/assets/skills/gitops-workflows/scripts/sync_drift_detector.py +144 -0
  276. package/assets/skills/gitops-workflows/scripts/validate_gitops_repo.py +299 -0
  277. package/assets/skills/iac-terraform/.claude-plugin/plugin.json +8 -0
  278. package/assets/skills/iac-terraform/SKILL.md +653 -0
  279. package/assets/skills/iac-terraform/assets/templates/MODULE_TEMPLATE.md +386 -0
  280. package/assets/skills/iac-terraform/assets/workflows/github-actions-terraform.yml +224 -0
  281. package/assets/skills/iac-terraform/assets/workflows/github-actions-terragrunt.yml +236 -0
  282. package/assets/skills/iac-terraform/assets/workflows/gitlab-ci-terraform.yml +184 -0
  283. package/assets/skills/iac-terraform/references/best_practices.md +709 -0
  284. package/assets/skills/iac-terraform/references/cost_optimization.md +665 -0
  285. package/assets/skills/iac-terraform/references/troubleshooting.md +635 -0
  286. package/assets/skills/iac-terraform/scripts/init_module.py +319 -0
  287. package/assets/skills/iac-terraform/scripts/inspect_state.py +232 -0
  288. package/assets/skills/iac-terraform/scripts/validate_module.py +227 -0
  289. package/assets/skills/k8s-troubleshooter/.claude-plugin/plugin.json +8 -0
  290. package/assets/skills/k8s-troubleshooter/SKILL.md +336 -0
  291. package/assets/skills/k8s-troubleshooter/references/common_issues.md +582 -0
  292. package/assets/skills/k8s-troubleshooter/references/helm_troubleshooting.md +708 -0
  293. package/assets/skills/k8s-troubleshooter/references/incident_response.md +466 -0
  294. package/assets/skills/k8s-troubleshooter/references/performance_troubleshooting.md +687 -0
  295. package/assets/skills/k8s-troubleshooter/scripts/check_namespace.py +500 -0
  296. package/assets/skills/k8s-troubleshooter/scripts/cluster_health.py +223 -0
  297. package/assets/skills/k8s-troubleshooter/scripts/diagnose_pod.py +157 -0
  298. package/assets/skills/mattermost-notify/SKILL.md +248 -0
  299. package/assets/skills/monitoring-observability/SKILL.md +869 -0
  300. package/assets/skills/monitoring-observability/assets/templates/otel-config/collector-config.yaml +227 -0
  301. package/assets/skills/monitoring-observability/assets/templates/prometheus-alerts/kubernetes-alerts.yml +293 -0
  302. package/assets/skills/monitoring-observability/assets/templates/prometheus-alerts/webapp-alerts.yml +243 -0
  303. package/assets/skills/monitoring-observability/assets/templates/runbooks/incident-runbook-template.md +409 -0
  304. package/assets/skills/monitoring-observability/monitoring-observability.skill +0 -0
  305. package/assets/skills/monitoring-observability/references/alerting_best_practices.md +609 -0
  306. package/assets/skills/monitoring-observability/references/datadog_migration.md +649 -0
  307. package/assets/skills/monitoring-observability/references/dql_promql_translation.md +756 -0
  308. package/assets/skills/monitoring-observability/references/logging_guide.md +775 -0
  309. package/assets/skills/monitoring-observability/references/metrics_design.md +406 -0
  310. package/assets/skills/monitoring-observability/references/slo_sla_guide.md +652 -0
  311. package/assets/skills/monitoring-observability/references/tool_comparison.md +697 -0
  312. package/assets/skills/monitoring-observability/references/tracing_guide.md +663 -0
  313. package/assets/skills/monitoring-observability/scripts/alert_quality_checker.py +315 -0
  314. package/assets/skills/monitoring-observability/scripts/analyze_metrics.py +279 -0
  315. package/assets/skills/monitoring-observability/scripts/dashboard_generator.py +395 -0
  316. package/assets/skills/monitoring-observability/scripts/datadog_cost_analyzer.py +477 -0
  317. package/assets/skills/monitoring-observability/scripts/health_check_validator.py +297 -0
  318. package/assets/skills/monitoring-observability/scripts/log_analyzer.py +321 -0
  319. package/assets/skills/monitoring-observability/scripts/slo_calculator.py +365 -0
  320. package/assets/skills/neo4j-graph-rag/SKILL.md +258 -0
  321. package/assets/skills/pagerduty-ops/SKILL.md +380 -0
  322. package/assets/skills/playwright/API_REFERENCE.md +653 -0
  323. package/assets/skills/playwright/SKILL.md +453 -0
  324. package/assets/skills/playwright/lib/helpers.js +441 -0
  325. package/assets/skills/playwright/package.json +26 -0
  326. package/assets/skills/playwright/run.js +228 -0
  327. package/assets/skills/project-memory/README.md +687 -0
  328. package/assets/skills/project-memory/SKILL.md +298 -0
  329. package/assets/skills/project-memory/references/bugs_template.md +41 -0
  330. package/assets/skills/project-memory/references/decisions_template.md +92 -0
  331. package/assets/skills/project-memory/references/issues_template.md +76 -0
  332. package/assets/skills/project-memory/references/key_facts_template.md +158 -0
  333. package/assets/skills/recruit-workflow/SKILL.md +276 -0
  334. package/assets/skills/recruit-workflow/references/email-templates.md +347 -0
  335. package/assets/skills/recruit-workflow/references/workflow-stages.md +395 -0
  336. package/assets/skills/recruit-workflow/scripts/clay_client.py +188 -0
  337. package/assets/skills/recruit-workflow/scripts/lever_client.py +197 -0
  338. package/assets/skills/recruit-workflow/scripts/mailgun_client.py +245 -0
  339. package/assets/skills/recruit-workflow/scripts/minio_client.py +426 -0
  340. package/assets/skills/shakudo-microservice/SKILL.md +215 -0
  341. package/assets/skills/tmux/SKILL.md +631 -0
  342. package/assets/skills/tmux/references/direct-socket-control.md +108 -0
  343. package/assets/skills/tmux/references/session-lifecycle.md +503 -0
  344. package/assets/skills/tmux/references/session-registry.md +1484 -0
  345. package/assets/skills/tmux/tools/cleanup-sessions.sh +263 -0
  346. package/assets/skills/tmux/tools/create-session.sh +224 -0
  347. package/assets/skills/tmux/tools/find-sessions.sh +262 -0
  348. package/assets/skills/tmux/tools/kill-session.sh +308 -0
  349. package/assets/skills/tmux/tools/lib/registry.sh +437 -0
  350. package/assets/skills/tmux/tools/lib/time_utils.sh +54 -0
  351. package/assets/skills/tmux/tools/list-sessions.sh +255 -0
  352. package/assets/skills/tmux/tools/pane-health.sh +424 -0
  353. package/assets/skills/tmux/tools/safe-send.sh +503 -0
  354. package/assets/skills/tmux/tools/wait-for-text.sh +260 -0
  355. package/assets/skills/twilio-sms/SKILL.md +508 -0
  356. package/assets/skills/zellij/SKILL.md +274 -0
  357. package/assets/skills/zellij/references/actions.md +558 -0
  358. package/assets/skills/zellij/references/layouts.md +424 -0
  359. package/bin/cli.ts +46 -0
  360. package/package.json +43 -0
  361. package/src/alias.ts +108 -0
  362. package/src/backup.ts +51 -0
  363. package/src/config.ts +115 -0
  364. package/src/dependencies.ts +163 -0
  365. package/src/errors.ts +77 -0
  366. package/src/index.ts +207 -0
  367. package/src/prompts.ts +142 -0
  368. package/src/schemas.ts +21 -0
  369. package/src/skills.ts +45 -0
  370. package/src/speckit.ts +116 -0
  371. package/src/types.ts +106 -0
  372. package/src/utils.ts +110 -0
  373. package/src/vibe-git.ts +50 -0
  374. package/templates/.specify/memory/constitution.md +109 -0
  375. package/templates/.specify/scripts/bash/check-prerequisites.sh +262 -0
  376. package/templates/.specify/scripts/bash/common.sh +670 -0
  377. package/templates/.specify/scripts/bash/create-new-feature.sh +594 -0
  378. package/templates/.specify/scripts/bash/create-worktree-feature.sh +401 -0
  379. package/templates/.specify/scripts/bash/init-workspace.sh +433 -0
  380. package/templates/.specify/scripts/bash/list-spec-worktrees.sh +198 -0
  381. package/templates/.specify/scripts/bash/setup-plan.sh +105 -0
  382. package/templates/.specify/scripts/bash/test-workspace-rollup.sh +175 -0
  383. package/templates/.specify/scripts/bash/update-agent-context.sh +799 -0
  384. package/templates/.specify/templates/agent-file-template.md +28 -0
  385. package/templates/.specify/templates/checklist-template.md +40 -0
  386. package/templates/.specify/templates/commands/analyze.md +197 -0
  387. package/templates/.specify/templates/commands/checklist.md +306 -0
  388. package/templates/.specify/templates/commands/clarify.md +194 -0
  389. package/templates/.specify/templates/commands/constitution.md +97 -0
  390. package/templates/.specify/templates/commands/implement.md +149 -0
  391. package/templates/.specify/templates/commands/plan.md +123 -0
  392. package/templates/.specify/templates/commands/projects.md +48 -0
  393. package/templates/.specify/templates/commands/rollup.md +66 -0
  394. package/templates/.specify/templates/commands/specify.md +275 -0
  395. package/templates/.specify/templates/commands/specs.md +71 -0
  396. package/templates/.specify/templates/commands/tasks.md +151 -0
  397. package/templates/.specify/templates/commands/taskstoissues.md +35 -0
  398. package/templates/.specify/templates/commands/workspace.md +128 -0
  399. package/templates/.specify/templates/plan-template.md +104 -0
  400. package/templates/.specify/templates/spec-template.md +115 -0
  401. package/templates/.specify/templates/tasks-template.md +251 -0
  402. package/templates/.specify/templates/workspace.yaml +110 -0
  403. package/templates/.specify/workspace.yaml +95 -0
  404. package/templates/AGENTS.md +460 -0
  405. package/templates/oh-my-opencode.json +27 -0
  406. package/templates/opencode.json +383 -0
  407. package/templates/package.json +10 -0
  408. package/templates/project-memory/bugs.md +16 -0
  409. package/templates/project-memory/decisions.md +22 -0
  410. package/templates/project-memory/issues.md +15 -0
  411. package/templates/project-memory/key_facts.md +26 -0
@@ -0,0 +1,177 @@
1
+ # Evaluator Agent
2
+
3
+ ## Purpose
4
+
5
+ The Evaluator Agent assesses the quality of LLM-generated responses using configurable evaluation criteria. It implements the LLM-as-a-Judge pattern with support for both direct scoring and pairwise comparison.
6
+
7
+ ## Agent Definition
8
+
9
+ ```typescript
10
+ import { ToolLoopAgent } from "ai";
11
+ import { anthropic } from "@ai-sdk/anthropic";
12
+ import { evaluationTools } from "../tools";
13
+
14
+ export const evaluatorAgent = new ToolLoopAgent({
15
+ name: "evaluator",
16
+ model: anthropic("claude-sonnet-4-20250514"),
17
+ instructions: `You are an expert evaluator of LLM-generated content.
18
+
19
+ Your role is to:
20
+ 1. Assess response quality against specific criteria
21
+ 2. Provide structured scores with justifications
22
+ 3. Identify specific issues and strengths
23
+ 4. Compare responses when asked for pairwise evaluation
24
+
25
+ Evaluation Guidelines:
26
+ - Be objective and consistent in your assessments
27
+ - Ground evaluations in specific evidence from the response
28
+ - Consider the context and requirements of the original task
29
+ - Avoid position bias - evaluate content not placement
30
+ - Do not favor verbose responses unless verbosity adds value
31
+
32
+ Always provide:
33
+ - Numerical scores for each criterion
34
+ - Specific examples supporting your assessment
35
+ - Actionable feedback for improvement`,
36
+
37
+ tools: {
38
+ directScore: evaluationTools.directScore,
39
+ pairwiseCompare: evaluationTools.pairwiseCompare,
40
+ extractCriteria: evaluationTools.extractCriteria,
41
+ generateRubric: evaluationTools.generateRubric
42
+ }
43
+ });
44
+ ```
45
+
46
+ ## Capabilities
47
+
48
+ ### Direct Scoring
49
+ Evaluate a single response against defined criteria and rubric.
50
+
51
+ **Input:**
52
+ - Response to evaluate
53
+ - Original prompt/context
54
+ - Evaluation criteria
55
+ - Scoring rubric
56
+
57
+ **Output:**
58
+ - Score per criterion (1-5)
59
+ - Overall score
60
+ - Detailed justification
61
+ - Identified issues and strengths
62
+
63
+ ### Pairwise Comparison
64
+ Compare two responses and select the better one.
65
+
66
+ **Input:**
67
+ - Response A
68
+ - Response B
69
+ - Original prompt/context
70
+ - Comparison criteria
71
+
72
+ **Output:**
73
+ - Winner selection (A, B, or Tie)
74
+ - Confidence score
75
+ - Comparative analysis
76
+ - Specific differentiators
77
+
78
+ ### Criteria Extraction
79
+ Automatically extract evaluation criteria from a task description.
80
+
81
+ **Input:**
82
+ - Task description
83
+ - Domain context
84
+ - Quality expectations
85
+
86
+ **Output:**
87
+ - List of relevant criteria
88
+ - Criterion descriptions
89
+ - Suggested weights
90
+
91
+ ### Rubric Generation
92
+ Generate a scoring rubric for specific criteria.
93
+
94
+ **Input:**
95
+ - Criterion name
96
+ - Quality dimensions
97
+ - Scale (default 1-5)
98
+
99
+ **Output:**
100
+ - Rubric with score descriptions
101
+ - Examples for each level
102
+ - Edge case guidance
103
+
104
+ ## Configuration
105
+
106
+ ```typescript
107
+ interface EvaluatorConfig {
108
+ // Scoring configuration
109
+ scoringMode: "direct" | "pairwise";
110
+ useChainOfThought: boolean;
111
+ nShotExamples: number;
112
+
113
+ // Bias mitigation
114
+ swapPositionsForPairwise: boolean;
115
+ normalizeForLength: boolean;
116
+
117
+ // Output configuration
118
+ includeJustification: boolean;
119
+ includeExamples: boolean;
120
+ outputFormat: "structured" | "prose";
121
+ }
122
+
123
+ const defaultConfig: EvaluatorConfig = {
124
+ scoringMode: "direct",
125
+ useChainOfThought: true,
126
+ nShotExamples: 2,
127
+ swapPositionsForPairwise: true,
128
+ normalizeForLength: false,
129
+ includeJustification: true,
130
+ includeExamples: true,
131
+ outputFormat: "structured"
132
+ };
133
+ ```
134
+
135
+ ## Usage Example
136
+
137
+ ```typescript
138
+ import { evaluatorAgent } from "./agents/evaluator-agent";
139
+
140
+ // Direct scoring
141
+ const evaluation = await evaluatorAgent.generate({
142
+ prompt: `Evaluate the following response:
143
+
144
+ Original Question: "Explain quantum entanglement to a high school student"
145
+
146
+ Response: "${generatedResponse}"
147
+
148
+ Criteria:
149
+ 1. Accuracy - Scientific correctness
150
+ 2. Clarity - Understandable for target audience
151
+ 3. Engagement - Interesting and memorable
152
+ 4. Completeness - Covers key concepts
153
+
154
+ Provide scores and detailed feedback.`
155
+ });
156
+
157
+ // Pairwise comparison
158
+ const comparison = await evaluatorAgent.generate({
159
+ prompt: `Compare these two responses to the same question.
160
+
161
+ Question: "What are the benefits of exercise?"
162
+
163
+ Response A: "${responseA}"
164
+
165
+ Response B: "${responseB}"
166
+
167
+ Which response is better? Explain your reasoning.`
168
+ });
169
+ ```
170
+
171
+ ## Integration Points
172
+
173
+ - **Content Generation Pipeline**: Evaluate outputs before delivery
174
+ - **Model Comparison**: Compare responses from different models
175
+ - **Quality Monitoring**: Track response quality over time
176
+ - **Fine-tuning Data**: Generate preference data for RLHF
177
+
@@ -0,0 +1,114 @@
1
+ # Agents Index
2
+
3
+ Agents are reusable AI components with defined capabilities, tools, and instructions.
4
+
5
+ ## Available Agents
6
+
7
+ ### Evaluator Agent
8
+ **Path**: `agents/evaluator-agent/evaluator-agent.md`
9
+ **Purpose**: Assess the quality of LLM-generated responses
10
+
11
+ **Capabilities**:
12
+ - Direct scoring against rubrics
13
+ - Pairwise comparison of responses
14
+ - Criteria extraction from task descriptions
15
+ - Rubric generation for evaluation
16
+
17
+ **Tools Used**:
18
+ - `directScore`
19
+ - `pairwiseCompare`
20
+ - `extractCriteria`
21
+ - `generateRubric`
22
+
23
+ **Best For**:
24
+ - Quality gates in content pipelines
25
+ - Model comparison studies
26
+ - RLHF preference data generation
27
+ - Output validation before delivery
28
+
29
+ ---
30
+
31
+ ### Research Agent
32
+ **Path**: `agents/research-agent/research-agent.md`
33
+ **Purpose**: Gather, verify, and synthesize information from multiple sources
34
+
35
+ **Capabilities**:
36
+ - Web search and result analysis
37
+ - URL content extraction
38
+ - Claim extraction and verification
39
+ - Research synthesis
40
+
41
+ **Tools Used**:
42
+ - `webSearch`
43
+ - `readUrl`
44
+ - `extractClaims`
45
+ - `verifyClaim`
46
+ - `synthesize`
47
+
48
+ **Best For**:
49
+ - Knowledge base building
50
+ - Fact checking
51
+ - Market research
52
+ - Technical documentation
53
+
54
+ ---
55
+
56
+ ### Orchestrator Agent
57
+ **Path**: `agents/orchestrator-agent/orchestrator-agent.md`
58
+ **Purpose**: Coordinate multi-agent workflows for complex tasks
59
+
60
+ **Capabilities**:
61
+ - Task decomposition and assignment
62
+ - Parallel task execution
63
+ - Result synthesis
64
+ - Error handling and recovery
65
+
66
+ **Tools Used**:
67
+ - `delegateToAgent`
68
+ - `parallelExecution`
69
+ - `waitForCompletion`
70
+ - `synthesizeResults`
71
+ - `handleError`
72
+
73
+ **Best For**:
74
+ - Complex multi-step tasks
75
+ - Cross-capability workflows
76
+ - Quality-assured pipelines
77
+ - Long-running operations
78
+
79
+ ## Agent Interaction Patterns
80
+
81
+ ### Sequential Pipeline
82
+ ```
83
+ Input → Agent A → Agent B → Agent C → Output
84
+ ```
85
+ Use when each step depends on the previous.
86
+
87
+ ### Parallel Fan-Out
88
+ ```
89
+         ┌→ Agent A ──┐
90
+ Input ──┼→ Agent B ──┼→ Synthesis → Output
91
+         └→ Agent C ──┘
92
+ ```
93
+ Use for independent subtasks that can run concurrently.
94
+
95
+ ### Iterative Refinement
96
+ ```
97
+ Input → Agent → Evaluator ─┬→ Output (if pass)
98
+                            └→ Agent (if fail, with feedback)
99
+ ```
100
+ Use for quality-critical outputs.
101
+
102
+ ## Adding New Agents
103
+
104
+ 1. Create agent directory: `agents/<agent-name>/`
105
+ 2. Create main file: `agents/<agent-name>/<agent-name>.md`
106
+ 3. Define:
107
+ - Purpose and role
108
+ - System instructions
109
+ - Tool assignments
110
+ - Configuration options
111
+ - Usage examples
112
+ 4. Update this index
113
+ 5. Register with orchestrator if applicable
114
+
@@ -0,0 +1,205 @@
1
+ # Orchestrator Agent
2
+
3
+ ## Purpose
4
+
5
+ The Orchestrator Agent manages complex workflows by delegating tasks to specialized agents, coordinating their outputs, and ensuring coherent end-to-end execution. It serves as the primary interface for multi-agent operations.
6
+
7
+ ## Agent Definition
8
+
9
+ ```typescript
10
+ import { ToolLoopAgent } from "ai";
11
+ import { anthropic } from "@ai-sdk/anthropic";
12
+ import { orchestrationTools } from "../tools";
13
+
14
+ export const orchestratorAgent = new ToolLoopAgent({
15
+ name: "orchestrator",
16
+ model: anthropic("claude-sonnet-4-20250514"),
17
+ instructions: `You are a workflow orchestration expert.
18
+
19
+ Your role is to:
20
+ 1. Analyze complex tasks and break them into subtasks
21
+ 2. Assign subtasks to appropriate specialized agents
22
+ 3. Coordinate agent outputs and handle dependencies
23
+ 4. Synthesize results into coherent final outputs
24
+ 5. Handle errors and retries gracefully
25
+
26
+ Orchestration Principles:
27
+ - Decompose tasks by capability requirements
28
+ - Parallelize independent operations when possible
29
+ - Maintain context continuity across agent handoffs
30
+ - Validate intermediate outputs before proceeding
31
+ - Provide clear status updates during long operations
32
+
33
+ Available Agents:
34
+ - evaluator: Assesses quality of LLM outputs
35
+ - researcher: Gathers and synthesizes information
36
+ - writer: Generates and refines content
37
+ - analyst: Performs data analysis and insights
38
+
39
+ When delegating:
40
+ - Provide complete context the agent needs
41
+ - Specify expected output format
42
+ - Set clear success criteria`,
43
+
44
+ tools: {
45
+ delegateToAgent: orchestrationTools.delegateToAgent,
46
+ parallelExecution: orchestrationTools.parallelExecution,
47
+ waitForCompletion: orchestrationTools.waitForCompletion,
48
+ synthesizeResults: orchestrationTools.synthesizeResults,
49
+ handleError: orchestrationTools.handleError
50
+ }
51
+ });
52
+ ```
53
+
54
+ ## Capabilities
55
+
56
+ ### Task Delegation
57
+ Route a task to a specialized agent.
58
+
59
+ **Input:**
60
+ - Agent name
61
+ - Task description
62
+ - Context/dependencies
63
+ - Expected output format
64
+
65
+ **Output:**
66
+ - Agent response
67
+ - Execution metadata
68
+ - Status
69
+
70
+ ### Parallel Execution
71
+ Execute multiple independent tasks simultaneously.
72
+
73
+ **Input:**
74
+ - List of (agent, task) pairs
75
+ - Timeout configuration
76
+
77
+ **Output:**
78
+ - Results array
79
+ - Completion status per task
80
+ - Any errors encountered
81
+
82
+ ### Result Synthesis
83
+ Combine outputs from multiple agents into a coherent result.
84
+
85
+ **Input:**
86
+ - Agent outputs
87
+ - Synthesis instructions
88
+ - Target format
89
+
90
+ **Output:**
91
+ - Synthesized result
92
+ - Source attribution
93
+ - Confidence assessment
94
+
95
+ ### Error Handling
96
+ Manage failures and implement retry logic.
97
+
98
+ **Input:**
99
+ - Failed task
100
+ - Error details
101
+ - Retry policy
102
+
103
+ **Output:**
104
+ - Retry result or
105
+ - Graceful degradation or
106
+ - Error escalation
107
+
108
+ ## Configuration
109
+
110
+ ```typescript
111
+ interface OrchestratorConfig {
112
+ // Execution settings
113
+ maxParallelTasks: number;
114
+ defaultTimeout: number; // ms
115
+ retryPolicy: RetryPolicy;
116
+
117
+ // Quality settings
118
+ validateIntermediateOutputs: boolean;
119
+ evaluateBeforeDelivery: boolean;
120
+
121
+ // Reporting
122
+ enableProgressUpdates: boolean;
123
+ updateFrequency: number; // ms
124
+ }
125
+
126
+ interface RetryPolicy {
127
+ maxRetries: number;
128
+ backoffMultiplier: number;
129
+ retryableErrors: string[];
130
+ }
131
+
132
+ const defaultConfig: OrchestratorConfig = {
133
+ maxParallelTasks: 5,
134
+ defaultTimeout: 60000,
135
+ retryPolicy: {
136
+ maxRetries: 3,
137
+ backoffMultiplier: 2,
138
+ retryableErrors: ["RATE_LIMIT", "TIMEOUT", "TEMPORARY_ERROR"]
139
+ },
140
+ validateIntermediateOutputs: true,
141
+ evaluateBeforeDelivery: false,
142
+ enableProgressUpdates: true,
143
+ updateFrequency: 5000
144
+ };
145
+ ```
146
+
147
+ ## Usage Example
148
+
149
+ ```typescript
150
+ import { orchestratorAgent } from "./agents/orchestrator-agent";
151
+
152
+ const result = await orchestratorAgent.generate({
153
+ prompt: `Complete the following research and analysis task:
154
+
155
+ 1. Research current best practices for LLM evaluation
156
+ 2. Analyze the trade-offs between different evaluation methods
157
+ 3. Generate a recommendation report
158
+ 4. Evaluate the quality of the report
159
+
160
+ Ensure the final output is comprehensive but accessible to technical leaders.`
161
+ });
162
+ ```
163
+
164
+ ## Orchestration Patterns
165
+
166
+ ### Sequential Pipeline
167
+ ```mermaid
168
+ graph LR
169
+ A[Task] --> B[Research Agent]
170
+ B --> C[Analyst Agent]
171
+ C --> D[Writer Agent]
172
+ D --> E[Evaluator Agent]
173
+ E --> F[Final Output]
174
+ ```
175
+
176
+ ### Parallel with Aggregation
177
+ ```mermaid
178
+ graph TD
179
+ A[Task] --> B[Parallel Dispatch]
180
+ B --> C[Agent 1]
181
+ B --> D[Agent 2]
182
+ B --> E[Agent 3]
183
+ C --> F[Aggregation]
184
+ D --> F
185
+ E --> F
186
+ F --> G[Synthesis]
187
+ ```
188
+
189
+ ### Iterative Refinement
190
+ ```mermaid
191
+ graph TD
192
+ A[Draft] --> B[Evaluator]
193
+ B --> C{Score OK?}
194
+ C -->|No| D[Refine]
195
+ D --> A
196
+ C -->|Yes| E[Final Output]
197
+ ```
198
+
199
+ ## Integration Points
200
+
201
+ - **API Gateway**: Primary entry point for complex requests
202
+ - **Job Queue**: Handle long-running orchestrated tasks
203
+ - **Monitoring**: Track multi-agent execution metrics
204
+ - **Audit Log**: Record all delegations and decisions
205
+
@@ -0,0 +1,183 @@
1
+ # Research Agent
2
+
3
+ ## Purpose
4
+
5
+ The Research Agent gathers, synthesizes, and summarizes information from multiple sources to answer complex research questions. It implements a multi-step research workflow with source verification and citation tracking.
6
+
7
+ ## Agent Definition
8
+
9
+ ```typescript
10
+ import { ToolLoopAgent } from "ai";
11
+ import { openai } from "@ai-sdk/openai";
12
+ import { researchTools } from "../tools";
13
+
14
+ export const researchAgent = new ToolLoopAgent({
15
+ name: "researcher",
16
+ model: openai("gpt-4o"),
17
+ instructions: `You are an expert research analyst.
18
+
19
+ Your role is to:
20
+ 1. Break down complex research questions into searchable queries
21
+ 2. Gather information from multiple sources
22
+ 3. Verify and cross-reference claims
23
+ 4. Synthesize findings into coherent summaries
24
+ 5. Provide proper citations for all claims
25
+
26
+ Research Methodology:
27
+ - Start with broad searches to understand the landscape
28
+ - Narrow down to specific sources for detailed information
29
+ - Always verify facts from multiple sources when possible
30
+ - Distinguish between facts, claims, and opinions
31
+ - Note the recency and authority of sources
32
+
33
+ Quality Standards:
34
+ - Never fabricate information or sources
35
+ - Clearly indicate when information is uncertain
36
+ - Provide direct quotes when precision matters
37
+ - Include source URLs/references for verification`,
38
+
39
+ tools: {
40
+ webSearch: researchTools.webSearch,
41
+ readUrl: researchTools.readUrl,
42
+ extractClaims: researchTools.extractClaims,
43
+ verifyClaim: researchTools.verifyClaim,
44
+ synthesize: researchTools.synthesize
45
+ }
46
+ });
47
+ ```
48
+
49
+ ## Capabilities
50
+
51
+ ### Web Search
52
+ Search the web for relevant information.
53
+
54
+ **Input:**
55
+ - Search query
56
+ - Optional filters (date, source type)
57
+
58
+ **Output:**
59
+ - List of relevant results
60
+ - Snippets and URLs
61
+ - Source metadata
62
+
63
+ ### URL Reading
64
+ Extract content from a specific URL.
65
+
66
+ **Input:**
67
+ - URL to read
68
+ - Content type (article, paper, documentation)
69
+
70
+ **Output:**
71
+ - Extracted text content
72
+ - Key sections identified
73
+ - Publication metadata
74
+
75
+ ### Claim Extraction
76
+ Identify distinct claims from a source.
77
+
78
+ **Input:**
79
+ - Source text
80
+ - Claim types to extract
81
+
82
+ **Output:**
83
+ - List of claims
84
+ - Confidence level
85
+ - Supporting context
86
+
87
+ ### Claim Verification
88
+ Cross-reference a claim against other sources.
89
+
90
+ **Input:**
91
+ - Claim to verify
92
+ - Original source
93
+
94
+ **Output:**
95
+ - Verification status
96
+ - Supporting/contradicting sources
97
+ - Confidence assessment
98
+
99
+ ### Synthesis
100
+ Combine findings into a coherent summary.
101
+
102
+ **Input:**
103
+ - Research findings
104
+ - Target format
105
+ - Key questions to answer
106
+
107
+ **Output:**
108
+ - Synthesized summary
109
+ - Key insights
110
+ - Source citations
111
+
112
+ ## Configuration
113
+
114
+ ```typescript
115
+ interface ResearchConfig {
116
+ // Search configuration
117
+ maxSearchResults: number;
118
+ preferredSources: string[];
119
+ excludedDomains: string[];
120
+
121
+ // Verification settings
122
+ minSourcesForVerification: number;
123
+ requireRecentSources: boolean;
124
+ maxSourceAge: "1month" | "6months" | "1year" | "any";
125
+
126
+ // Output configuration
127
+ citationStyle: "inline" | "footnote" | "endnote";
128
+ summaryLength: "brief" | "standard" | "comprehensive";
129
+ includeSourceQuality: boolean;
130
+ }
131
+
132
+ const defaultConfig: ResearchConfig = {
133
+ maxSearchResults: 10,
134
+ preferredSources: [],
135
+ excludedDomains: [],
136
+ minSourcesForVerification: 2,
137
+ requireRecentSources: false,
138
+ maxSourceAge: "any",
139
+ citationStyle: "inline",
140
+ summaryLength: "standard",
141
+ includeSourceQuality: true
142
+ };
143
+ ```
144
+
145
+ ## Usage Example
146
+
147
+ ```typescript
148
+ import { researchAgent } from "./agents/research-agent";
149
+
150
+ const research = await researchAgent.generate({
151
+ prompt: `Research the current state of LLM evaluation methods.
152
+
153
+ I need to understand:
154
+ 1. What are the main approaches to evaluating LLM outputs?
155
+ 2. What are the limitations of human evaluation?
156
+ 3. How reliable are LLM-based evaluators compared to humans?
157
+ 4. What are best practices for implementing LLM-as-a-Judge?
158
+
159
+ Provide a comprehensive summary with citations.`
160
+ });
161
+ ```
162
+
163
+ ## Research Workflow
164
+
165
+ ```mermaid
166
+ graph TD
167
+ A[Research Question] --> B[Query Decomposition]
168
+ B --> C[Initial Search]
169
+ C --> D[Source Selection]
170
+ D --> E[Deep Reading]
171
+ E --> F[Claim Extraction]
172
+ F --> G[Cross-Verification]
173
+ G --> H[Synthesis]
174
+ H --> I[Final Report]
175
+ ```
176
+
177
+ ## Integration Points
178
+
179
+ - **Knowledge Base Building**: Populate internal knowledge stores
180
+ - **Fact Checking**: Verify claims in generated content
181
+ - **Market Research**: Gather competitive intelligence
182
+ - **Technical Documentation**: Research implementation approaches
183
+
@@ -0,0 +1,6 @@
1
+ # OpenAI Configuration
2
+ OPENAI_API_KEY=your_openai_api_key_here
3
+ OPENAI_MODEL=gpt-4o
4
+
5
+ # Optional: Anthropic for alternative models
6
+ # ANTHROPIC_API_KEY=your_anthropic_api_key_here
@@ -0,0 +1,18 @@
1
+ import eslint from '@eslint/js';
2
+ import tseslint from 'typescript-eslint';
3
+
4
+ export default tseslint.config(
5
+ eslint.configs.recommended,
6
+ ...tseslint.configs.recommended,
7
+ {
8
+ ignores: ['dist/', 'node_modules/', 'coverage/']
9
+ },
10
+ {
11
+ rules: {
12
+ '@typescript-eslint/no-unused-vars': ['error', { argsIgnorePattern: '^_' }],
13
+ '@typescript-eslint/explicit-function-return-type': 'off',
14
+ '@typescript-eslint/no-explicit-any': 'warn'
15
+ }
16
+ }
17
+ );
18
+