@trieungoctam/vibekit 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (352) hide show
  1. package/LICENSE +21 -0
  2. package/README.md +85 -0
  3. package/agents/debugger.md +158 -0
  4. package/agents/docs-manager.md +220 -0
  5. package/agents/planner.md +129 -0
  6. package/agents/researcher.md +58 -0
  7. package/agents/reviewer.md +152 -0
  8. package/agents/tester.md +126 -0
  9. package/bin/vibekit.js +18 -0
  10. package/hooks/lib/ck-config-utils.cjs +831 -0
  11. package/hooks/lib/colors.cjs +95 -0
  12. package/hooks/lib/config-counter.cjs +103 -0
  13. package/hooks/lib/context-builder.cjs +616 -0
  14. package/hooks/lib/git-info-cache.cjs +143 -0
  15. package/hooks/lib/hook-logger.cjs +92 -0
  16. package/hooks/lib/privacy-checker.cjs +297 -0
  17. package/hooks/lib/project-detector.cjs +474 -0
  18. package/hooks/lib/scout-checker.cjs +263 -0
  19. package/hooks/lib/transcript-parser.cjs +181 -0
  20. package/hooks/post-edit-simplify-reminder.cjs +156 -0
  21. package/hooks/privacy-block.cjs +166 -0
  22. package/hooks/scout-block.cjs +147 -0
  23. package/hooks/session-init.cjs +360 -0
  24. package/package.json +41 -0
  25. package/rules/development-rules.md +52 -0
  26. package/rules/documentation-management.md +121 -0
  27. package/rules/orchestration-protocol.md +43 -0
  28. package/rules/primary-workflow.md +57 -0
  29. package/rules/team-coordination-rules.md +90 -0
  30. package/skills/ai/agent-browser/SKILL.md +294 -0
  31. package/skills/ai/agent-browser/references/.gitkeep +0 -0
  32. package/skills/ai/agent-browser/references/agent-browser-vs-chrome-devtools.md +112 -0
  33. package/skills/ai/agent-browser/references/browserbase-cloud-setup.md +161 -0
  34. package/skills/ai/ai-artist/SKILL.md +122 -0
  35. package/skills/ai/ai-artist/data/awesome-prompts.csv +3592 -0
  36. package/skills/ai/ai-artist/data/lighting.csv +19 -0
  37. package/skills/ai/ai-artist/data/nano-banana-templates.csv +17 -0
  38. package/skills/ai/ai-artist/data/platforms.csv +11 -0
  39. package/skills/ai/ai-artist/data/styles.csv +26 -0
  40. package/skills/ai/ai-artist/data/techniques.csv +19 -0
  41. package/skills/ai/ai-artist/data/use-cases.csv +16 -0
  42. package/skills/ai/ai-artist/references/advanced-techniques.md +184 -0
  43. package/skills/ai/ai-artist/references/awesome-nano-banana-pro-prompts.md +8575 -0
  44. package/skills/ai/ai-artist/references/domain-code.md +66 -0
  45. package/skills/ai/ai-artist/references/domain-data.md +72 -0
  46. package/skills/ai/ai-artist/references/domain-marketing.md +66 -0
  47. package/skills/ai/ai-artist/references/domain-patterns.md +33 -0
  48. package/skills/ai/ai-artist/references/domain-writing.md +68 -0
  49. package/skills/ai/ai-artist/references/image-prompting.md +141 -0
  50. package/skills/ai/ai-artist/references/llm-prompting.md +165 -0
  51. package/skills/ai/ai-artist/references/nano-banana.md +136 -0
  52. package/skills/ai/ai-artist/references/reasoning-techniques.md +201 -0
  53. package/skills/ai/ai-artist/references/validation-workflow.md +117 -0
  54. package/skills/ai/ai-artist/scripts/core.py +197 -0
  55. package/skills/ai/ai-artist/scripts/extract_prompts.py +102 -0
  56. package/skills/ai/ai-artist/scripts/generate.py +370 -0
  57. package/skills/ai/ai-artist/scripts/search.py +147 -0
  58. package/skills/ai/ai-multimodal/.env.example +204 -0
  59. package/skills/ai/ai-multimodal/SKILL.md +110 -0
  60. package/skills/ai/ai-multimodal/references/audio-processing.md +387 -0
  61. package/skills/ai/ai-multimodal/references/image-generation.md +939 -0
  62. package/skills/ai/ai-multimodal/references/music-generation.md +311 -0
  63. package/skills/ai/ai-multimodal/references/video-analysis.md +515 -0
  64. package/skills/ai/ai-multimodal/references/video-generation.md +457 -0
  65. package/skills/ai/ai-multimodal/references/vision-understanding.md +492 -0
  66. package/skills/ai/ai-multimodal/scripts/.coverage +0 -0
  67. package/skills/ai/ai-multimodal/scripts/check_setup.py +315 -0
  68. package/skills/ai/ai-multimodal/scripts/document_converter.py +395 -0
  69. package/skills/ai/ai-multimodal/scripts/gemini_batch_process.py +1185 -0
  70. package/skills/ai/ai-multimodal/scripts/media_optimizer.py +506 -0
  71. package/skills/ai/ai-multimodal/scripts/requirements.txt +26 -0
  72. package/skills/ai/ai-multimodal/scripts/tests/.coverage +0 -0
  73. package/skills/ai/ai-multimodal/scripts/tests/requirements.txt +20 -0
  74. package/skills/ai/ai-multimodal/scripts/tests/test_document_converter.py +74 -0
  75. package/skills/ai/ai-multimodal/scripts/tests/test_gemini_batch_process.py +362 -0
  76. package/skills/ai/ai-multimodal/scripts/tests/test_media_optimizer.py +373 -0
  77. package/skills/ai/mcp-management/README.md +219 -0
  78. package/skills/ai/mcp-management/SKILL.md +210 -0
  79. package/skills/ai/mcp-management/assets/tools.json +3146 -0
  80. package/skills/ai/mcp-management/references/configuration.md +114 -0
  81. package/skills/ai/mcp-management/references/gemini-cli-integration.md +221 -0
  82. package/skills/ai/mcp-management/references/mcp-protocol.md +116 -0
  83. package/skills/ai/mcp-management/scripts/.env.example +10 -0
  84. package/skills/ai/mcp-management/scripts/cli.ts +195 -0
  85. package/skills/ai/mcp-management/scripts/dist/analyze-tools.js +70 -0
  86. package/skills/ai/mcp-management/scripts/dist/cli.js +160 -0
  87. package/skills/ai/mcp-management/scripts/dist/mcp-client.js +183 -0
  88. package/skills/ai/mcp-management/scripts/mcp-client.ts +230 -0
  89. package/skills/ai/mcp-management/scripts/package.json +20 -0
  90. package/skills/ai/mcp-management/scripts/tsconfig.json +15 -0
  91. package/skills/core/brainstorm/SKILL.md +164 -0
  92. package/skills/core/brainstorm/scripts/frame-template.html +214 -0
  93. package/skills/core/brainstorm/scripts/helper.js +88 -0
  94. package/skills/core/brainstorm/scripts/server.cjs +338 -0
  95. package/skills/core/brainstorm/scripts/start-server.sh +153 -0
  96. package/skills/core/brainstorm/scripts/stop-server.sh +55 -0
  97. package/skills/core/brainstorm/spec-document-reviewer-prompt.md +49 -0
  98. package/skills/core/brainstorm/visual-companion.md +286 -0
  99. package/skills/core/code-review/SKILL.md +147 -0
  100. package/skills/core/code-review/references/code-review-reception.md +113 -0
  101. package/skills/core/code-review/references/codebase-scan-workflow.md +29 -0
  102. package/skills/core/code-review/references/edge-case-scouting.md +119 -0
  103. package/skills/core/code-review/references/parallel-review-workflow.md +69 -0
  104. package/skills/core/code-review/references/requesting-code-review.md +116 -0
  105. package/skills/core/code-review/references/task-management-reviews.md +140 -0
  106. package/skills/core/code-review/references/verification-before-completion.md +139 -0
  107. package/skills/core/cook/README.md +86 -0
  108. package/skills/core/cook/SKILL.md +113 -0
  109. package/skills/core/cook/references/intent-detection.md +101 -0
  110. package/skills/core/cook/references/review-cycle.md +75 -0
  111. package/skills/core/cook/references/subagent-patterns.md +75 -0
  112. package/skills/core/cook/references/workflow-steps.md +172 -0
  113. package/skills/core/debug/SKILL.md +121 -0
  114. package/skills/core/debug/references/defense-in-depth.md +124 -0
  115. package/skills/core/debug/references/frontend-verification.md +103 -0
  116. package/skills/core/debug/references/investigation-methodology.md +101 -0
  117. package/skills/core/debug/references/log-and-ci-analysis.md +97 -0
  118. package/skills/core/debug/references/performance-diagnostics.md +113 -0
  119. package/skills/core/debug/references/reporting-standards.md +122 -0
  120. package/skills/core/debug/references/root-cause-tracing.md +122 -0
  121. package/skills/core/debug/references/systematic-debugging.md +102 -0
  122. package/skills/core/debug/references/task-management-debugging.md +155 -0
  123. package/skills/core/debug/references/verification.md +123 -0
  124. package/skills/core/debug/scripts/find-polluter.sh +63 -0
  125. package/skills/core/debug/scripts/find-polluter.test.md +102 -0
  126. package/skills/core/execute/SKILL.md +70 -0
  127. package/skills/core/fix/SKILL.md +111 -0
  128. package/skills/core/fix/references/complexity-assessment.md +72 -0
  129. package/skills/core/fix/references/mode-selection.md +46 -0
  130. package/skills/core/fix/references/parallel-exploration.md +100 -0
  131. package/skills/core/fix/references/review-cycle.md +77 -0
  132. package/skills/core/fix/references/skill-activation-matrix.md +78 -0
  133. package/skills/core/fix/references/task-orchestration.md +103 -0
  134. package/skills/core/fix/references/workflow-ci.md +28 -0
  135. package/skills/core/fix/references/workflow-deep.md +122 -0
  136. package/skills/core/fix/references/workflow-logs.md +72 -0
  137. package/skills/core/fix/references/workflow-quick.md +59 -0
  138. package/skills/core/fix/references/workflow-standard.md +111 -0
  139. package/skills/core/fix/references/workflow-test.md +75 -0
  140. package/skills/core/fix/references/workflow-types.md +33 -0
  141. package/skills/core/fix/references/workflow-ui.md +75 -0
  142. package/skills/core/plan/SKILL.md +145 -0
  143. package/skills/core/plan/plan-document-reviewer-prompt.md +49 -0
  144. package/skills/core/subagent-dev/SKILL.md +277 -0
  145. package/skills/core/subagent-dev/code-quality-reviewer-prompt.md +26 -0
  146. package/skills/core/subagent-dev/implementer-prompt.md +113 -0
  147. package/skills/core/subagent-dev/spec-reviewer-prompt.md +61 -0
  148. package/skills/core/tdd/SKILL.md +371 -0
  149. package/skills/core/tdd/testing-anti-patterns.md +299 -0
  150. package/skills/core/test/SKILL.md +109 -0
  151. package/skills/core/test/references/report-format.md +58 -0
  152. package/skills/core/test/references/test-execution-workflow.md +103 -0
  153. package/skills/core/test/references/ui-testing-workflow.md +65 -0
  154. package/skills/core/verify/SKILL.md +139 -0
  155. package/skills/dev/backend-dev/SKILL.md +96 -0
  156. package/skills/dev/backend-dev/references/backend-api-design.md +495 -0
  157. package/skills/dev/backend-dev/references/backend-architecture.md +454 -0
  158. package/skills/dev/backend-dev/references/backend-authentication.md +338 -0
  159. package/skills/dev/backend-dev/references/backend-code-quality.md +659 -0
  160. package/skills/dev/backend-dev/references/backend-debugging.md +904 -0
  161. package/skills/dev/backend-dev/references/backend-devops.md +494 -0
  162. package/skills/dev/backend-dev/references/backend-mindset.md +387 -0
  163. package/skills/dev/backend-dev/references/backend-performance.md +397 -0
  164. package/skills/dev/backend-dev/references/backend-security.md +290 -0
  165. package/skills/dev/backend-dev/references/backend-technologies.md +256 -0
  166. package/skills/dev/backend-dev/references/backend-testing.md +429 -0
  167. package/skills/dev/context-engineering/SKILL.md +108 -0
  168. package/skills/dev/context-engineering/references/context-compression.md +84 -0
  169. package/skills/dev/context-engineering/references/context-degradation.md +93 -0
  170. package/skills/dev/context-engineering/references/context-fundamentals.md +75 -0
  171. package/skills/dev/context-engineering/references/context-optimization.md +82 -0
  172. package/skills/dev/context-engineering/references/evaluation.md +89 -0
  173. package/skills/dev/context-engineering/references/memory-systems.md +88 -0
  174. package/skills/dev/context-engineering/references/multi-agent-patterns.md +90 -0
  175. package/skills/dev/context-engineering/references/project-development.md +97 -0
  176. package/skills/dev/context-engineering/references/runtime-awareness.md +202 -0
  177. package/skills/dev/context-engineering/references/tool-design.md +86 -0
  178. package/skills/dev/context-engineering/scripts/compression_evaluator.py +349 -0
  179. package/skills/dev/context-engineering/scripts/context_analyzer.py +317 -0
  180. package/skills/dev/context-engineering/scripts/tests/test_edge_cases.py +246 -0
  181. package/skills/dev/databases/SKILL.md +84 -0
  182. package/skills/dev/databases/analytics.md +198 -0
  183. package/skills/dev/databases/db-design.md +188 -0
  184. package/skills/dev/databases/incremental-etl.md +213 -0
  185. package/skills/dev/databases/references/mongodb-aggregation.md +447 -0
  186. package/skills/dev/databases/references/mongodb-atlas.md +465 -0
  187. package/skills/dev/databases/references/mongodb-crud.md +408 -0
  188. package/skills/dev/databases/references/mongodb-indexing.md +442 -0
  189. package/skills/dev/databases/references/postgresql-administration.md +594 -0
  190. package/skills/dev/databases/references/postgresql-performance.md +527 -0
  191. package/skills/dev/databases/references/postgresql-psql-cli.md +467 -0
  192. package/skills/dev/databases/references/postgresql-queries.md +475 -0
  193. package/skills/dev/databases/scripts/.coverage +0 -0
  194. package/skills/dev/databases/scripts/db_backup.py +502 -0
  195. package/skills/dev/databases/scripts/db_migrate.py +426 -0
  196. package/skills/dev/databases/scripts/db_performance_check.py +457 -0
  197. package/skills/dev/databases/scripts/requirements.txt +20 -0
  198. package/skills/dev/databases/scripts/tests/coverage-db.json +1 -0
  199. package/skills/dev/databases/scripts/tests/requirements.txt +4 -0
  200. package/skills/dev/databases/scripts/tests/test_db_backup.py +340 -0
  201. package/skills/dev/databases/scripts/tests/test_db_migrate.py +277 -0
  202. package/skills/dev/databases/scripts/tests/test_db_performance_check.py +370 -0
  203. package/skills/dev/databases/stacks/bigquery.md +231 -0
  204. package/skills/dev/databases/stacks/d1_cloudflare.md +137 -0
  205. package/skills/dev/databases/stacks/mysql.md +216 -0
  206. package/skills/dev/databases/stacks/postgres.md +235 -0
  207. package/skills/dev/databases/stacks/sqlite.md +244 -0
  208. package/skills/dev/databases/transactional.md +176 -0
  209. package/skills/dev/devops/.env.example +76 -0
  210. package/skills/dev/devops/SKILL.md +97 -0
  211. package/skills/dev/devops/references/browser-rendering.md +305 -0
  212. package/skills/dev/devops/references/cloudflare-d1-kv.md +123 -0
  213. package/skills/dev/devops/references/cloudflare-platform.md +271 -0
  214. package/skills/dev/devops/references/cloudflare-r2-storage.md +280 -0
  215. package/skills/dev/devops/references/cloudflare-workers-advanced.md +312 -0
  216. package/skills/dev/devops/references/cloudflare-workers-apis.md +309 -0
  217. package/skills/dev/devops/references/cloudflare-workers-basics.md +418 -0
  218. package/skills/dev/devops/references/docker-basics.md +297 -0
  219. package/skills/dev/devops/references/docker-compose.md +292 -0
  220. package/skills/dev/devops/references/gcloud-platform.md +297 -0
  221. package/skills/dev/devops/references/gcloud-services.md +304 -0
  222. package/skills/dev/devops/references/kubernetes-basics.md +99 -0
  223. package/skills/dev/devops/references/kubernetes-helm-advanced.md +75 -0
  224. package/skills/dev/devops/references/kubernetes-helm.md +81 -0
  225. package/skills/dev/devops/references/kubernetes-kubectl.md +74 -0
  226. package/skills/dev/devops/references/kubernetes-security-advanced.md +98 -0
  227. package/skills/dev/devops/references/kubernetes-security.md +95 -0
  228. package/skills/dev/devops/references/kubernetes-troubleshooting-advanced.md +74 -0
  229. package/skills/dev/devops/references/kubernetes-troubleshooting.md +49 -0
  230. package/skills/dev/devops/references/kubernetes-workflows-advanced.md +75 -0
  231. package/skills/dev/devops/references/kubernetes-workflows.md +78 -0
  232. package/skills/dev/devops/scripts/cloudflare_deploy.py +269 -0
  233. package/skills/dev/devops/scripts/docker_optimize.py +332 -0
  234. package/skills/dev/devops/scripts/requirements.txt +20 -0
  235. package/skills/dev/devops/scripts/tests/requirements.txt +3 -0
  236. package/skills/dev/devops/scripts/tests/test_cloudflare_deploy.py +285 -0
  237. package/skills/dev/devops/scripts/tests/test_docker_optimize.py +436 -0
  238. package/skills/dev/frontend-design/SKILL.md +78 -0
  239. package/skills/dev/frontend-design/references/ai-multimodal-overview.md +165 -0
  240. package/skills/dev/frontend-design/references/analysis-best-practices.md +80 -0
  241. package/skills/dev/frontend-design/references/analysis-prompts.md +141 -0
  242. package/skills/dev/frontend-design/references/analysis-techniques.md +118 -0
  243. package/skills/dev/frontend-design/references/animejs.md +396 -0
  244. package/skills/dev/frontend-design/references/asset-generation.md +337 -0
  245. package/skills/dev/frontend-design/references/design-extraction-overview.md +71 -0
  246. package/skills/dev/frontend-design/references/extraction-best-practices.md +141 -0
  247. package/skills/dev/frontend-design/references/extraction-output-templates.md +162 -0
  248. package/skills/dev/frontend-design/references/extraction-prompts.md +127 -0
  249. package/skills/dev/frontend-design/references/technical-accessibility.md +119 -0
  250. package/skills/dev/frontend-design/references/technical-best-practices.md +97 -0
  251. package/skills/dev/frontend-design/references/technical-optimization.md +44 -0
  252. package/skills/dev/frontend-design/references/technical-overview.md +90 -0
  253. package/skills/dev/frontend-design/references/technical-workflows.md +150 -0
  254. package/skills/dev/frontend-design/references/visual-analysis-overview.md +95 -0
  255. package/skills/dev/frontend-design/references/workflow-3d.md +102 -0
  256. package/skills/dev/frontend-design/references/workflow-describe.md +87 -0
  257. package/skills/dev/frontend-design/references/workflow-immersive.md +87 -0
  258. package/skills/dev/frontend-design/references/workflow-quick.md +57 -0
  259. package/skills/dev/frontend-design/references/workflow-screenshot.md +63 -0
  260. package/skills/dev/frontend-design/references/workflow-video.md +74 -0
  261. package/skills/dev/frontend-dev/SKILL.md +400 -0
  262. package/skills/dev/frontend-dev/resources/common-patterns.md +331 -0
  263. package/skills/dev/frontend-dev/resources/complete-examples.md +872 -0
  264. package/skills/dev/frontend-dev/resources/component-patterns.md +502 -0
  265. package/skills/dev/frontend-dev/resources/data-fetching.md +767 -0
  266. package/skills/dev/frontend-dev/resources/file-organization.md +502 -0
  267. package/skills/dev/frontend-dev/resources/loading-and-error-states.md +501 -0
  268. package/skills/dev/frontend-dev/resources/performance.md +406 -0
  269. package/skills/dev/frontend-dev/resources/routing-guide.md +364 -0
  270. package/skills/dev/frontend-dev/resources/styling-guide.md +428 -0
  271. package/skills/dev/frontend-dev/resources/typescript-standards.md +418 -0
  272. package/skills/dev/git/SKILL.md +114 -0
  273. package/skills/dev/git/references/branch-management.md +88 -0
  274. package/skills/dev/git/references/commit-standards.md +46 -0
  275. package/skills/dev/git/references/gh-cli-guide.md +109 -0
  276. package/skills/dev/git/references/safety-protocols.md +69 -0
  277. package/skills/dev/git/references/workflow-commit.md +58 -0
  278. package/skills/dev/git/references/workflow-merge.md +48 -0
  279. package/skills/dev/git/references/workflow-pr.md +58 -0
  280. package/skills/dev/git/references/workflow-push.md +52 -0
  281. package/skills/dev/git-worktree/SKILL.md +218 -0
  282. package/skills/utils/ask/SKILL.md +58 -0
  283. package/skills/utils/bootstrap/SKILL.md +101 -0
  284. package/skills/utils/bootstrap/references/shared-phases.md +59 -0
  285. package/skills/utils/bootstrap/references/workflow-auto.md +52 -0
  286. package/skills/utils/bootstrap/references/workflow-fast.md +50 -0
  287. package/skills/utils/bootstrap/references/workflow-full.md +60 -0
  288. package/skills/utils/bootstrap/references/workflow-parallel.md +59 -0
  289. package/skills/utils/ck-help/SKILL.md +102 -0
  290. package/skills/utils/ck-help/scripts/ck-help.py +1321 -0
  291. package/skills/utils/ck-help/scripts/commands_data.yaml +3 -0
  292. package/skills/utils/ck-help/scripts/skills_data.yaml +593 -0
  293. package/skills/utils/copywriting/SKILL.md +94 -0
  294. package/skills/utils/copywriting/references/copy-formulas.md +150 -0
  295. package/skills/utils/copywriting/references/cta-patterns.md +168 -0
  296. package/skills/utils/copywriting/references/email-copy.md +193 -0
  297. package/skills/utils/copywriting/references/headline-templates.md +140 -0
  298. package/skills/utils/copywriting/references/landing-page-copy.md +175 -0
  299. package/skills/utils/copywriting/references/power-words.md +189 -0
  300. package/skills/utils/copywriting/references/social-media-copy.md +222 -0
  301. package/skills/utils/copywriting/references/workflow-cro.md +83 -0
  302. package/skills/utils/copywriting/references/workflow-enhance.md +32 -0
  303. package/skills/utils/copywriting/references/workflow-fast.md +29 -0
  304. package/skills/utils/copywriting/references/workflow-good.md +39 -0
  305. package/skills/utils/copywriting/references/writing-styles.md +247 -0
  306. package/skills/utils/copywriting/scripts/extract-writing-styles.py +308 -0
  307. package/skills/utils/copywriting/templates/copy-brief.md +49 -0
  308. package/skills/utils/docs/SKILL.md +55 -0
  309. package/skills/utils/docs/references/init-workflow.md +32 -0
  310. package/skills/utils/docs/references/summarize-workflow.md +18 -0
  311. package/skills/utils/docs/references/update-workflow.md +59 -0
  312. package/skills/utils/journal/SKILL.md +11 -0
  313. package/skills/utils/kanban/SKILL.md +99 -0
  314. package/skills/utils/preview/SKILL.md +75 -0
  315. package/skills/utils/preview/references/generation-modes.md +95 -0
  316. package/skills/utils/preview/references/view-mode.md +42 -0
  317. package/skills/utils/repomix/SKILL.md +248 -0
  318. package/skills/utils/repomix/references/configuration.md +211 -0
  319. package/skills/utils/repomix/references/usage-patterns.md +232 -0
  320. package/skills/utils/repomix/scripts/.coverage +0 -0
  321. package/skills/utils/repomix/scripts/README.md +179 -0
  322. package/skills/utils/repomix/scripts/repomix_batch.py +455 -0
  323. package/skills/utils/repomix/scripts/repos.example.json +15 -0
  324. package/skills/utils/repomix/scripts/requirements.txt +15 -0
  325. package/skills/utils/repomix/scripts/tests/test_repomix_batch.py +531 -0
  326. package/skills/utils/research/SKILL.md +171 -0
  327. package/skills/utils/scout/SKILL.md +89 -0
  328. package/skills/utils/scout/references/external-scouting.md +140 -0
  329. package/skills/utils/scout/references/internal-scouting.md +119 -0
  330. package/skills/utils/scout/references/task-management-scouting.md +125 -0
  331. package/skills/utils/sequential-thinking/.env.example +8 -0
  332. package/skills/utils/sequential-thinking/README.md +183 -0
  333. package/skills/utils/sequential-thinking/SKILL.md +95 -0
  334. package/skills/utils/sequential-thinking/package.json +31 -0
  335. package/skills/utils/sequential-thinking/references/advanced-strategies.md +79 -0
  336. package/skills/utils/sequential-thinking/references/advanced-techniques.md +76 -0
  337. package/skills/utils/sequential-thinking/references/core-patterns.md +95 -0
  338. package/skills/utils/sequential-thinking/references/examples-api.md +88 -0
  339. package/skills/utils/sequential-thinking/references/examples-architecture.md +94 -0
  340. package/skills/utils/sequential-thinking/references/examples-debug.md +90 -0
  341. package/skills/utils/sequential-thinking/scripts/format-thought.js +159 -0
  342. package/skills/utils/sequential-thinking/scripts/process-thought.js +236 -0
  343. package/skills/utils/sequential-thinking/tests/format-thought.test.js +133 -0
  344. package/skills/utils/sequential-thinking/tests/process-thought.test.js +215 -0
  345. package/skills/utils/write-skill/SKILL.md +655 -0
  346. package/skills/utils/write-skill/anthropic-best-practices.md +1150 -0
  347. package/skills/utils/write-skill/examples/CLAUDE_MD_TESTING.md +189 -0
  348. package/skills/utils/write-skill/graphviz-conventions.dot +172 -0
  349. package/skills/utils/write-skill/persuasion-principles.md +187 -0
  350. package/skills/utils/write-skill/render-graphs.js +168 -0
  351. package/skills/utils/write-skill/testing-skills-with-subagents.md +384 -0
  352. package/src/commands/init.js +238 -0
@@ -0,0 +1,315 @@
1
+ #!/usr/bin/env python3
2
+ """
3
+ Validate ai-multimodal skill setup and configuration.
4
+
5
+ Checks:
6
+ - API key presence and format
7
+ - Python dependencies
8
+ - Centralized resolver availability
9
+ - Directory structure
10
+ """
11
+
12
+ import os
13
+ import sys
14
+ from pathlib import Path
15
+
16
def ensure_utf8_stream(stream):
    """Switch a text stream to UTF-8 output if it uses another encoding.

    Windows consoles often default to cp1252, which cannot encode the
    Unicode symbols (✓, ⚠, ✗) printed by this script.

    Args:
        stream: A text stream such as ``sys.stdout``; may be ``None``
            (e.g. when the interpreter runs without a console).

    Returns:
        True if the stream was reconfigured, False if it was left alone
        (missing, no known encoding, already UTF-8, or no ``reconfigure``
        method, which only exists on Python 3.7+ text wrappers).
    """
    encoding = getattr(stream, "encoding", None)
    if not encoding or encoding.lower().replace("_", "-") in ("utf-8", "utf8"):
        return False
    if not hasattr(stream, "reconfigure"):
        return False
    # errors="replace" keeps output flowing even for unencodable characters.
    stream.reconfigure(encoding="utf-8", errors="replace")
    return True


# Each stream is checked on its own: stderr may need fixing even when
# stdout is already UTF-8 (and vice versa).
ensure_utf8_stream(sys.stdout)
ensure_utf8_stream(sys.stderr)

# Color codes for terminal output (ANSI escape sequences)
GREEN = '\033[92m'
YELLOW = '\033[93m'
RED = '\033[91m'
BLUE = '\033[94m'
RESET = '\033[0m'
BOLD = '\033[1m'
31
+
32
+
33
def print_header(text):
    """Print *text* as a bold blue section title framed by 60-char rules.

    A blank line is emitted before the top rule and after the bottom rule.
    """
    rule = '=' * 60
    accent = f"{BOLD}{BLUE}"
    print(f"\n{accent}{rule}{RESET}")
    print(f"{accent}{text}{RESET}")
    print(f"{accent}{rule}{RESET}\n")
38
+
39
+
40
def print_success(text):
    """Print *text* in green, prefixed with a check mark."""
    message = f"✓ {text}"
    print(f"{GREEN}{message}{RESET}")
43
+
44
+
45
def print_warning(text):
    """Print *text* in yellow, prefixed with a warning sign."""
    message = f"⚠ {text}"
    print(f"{YELLOW}{message}{RESET}")
48
+
49
+
50
def print_error(text):
    """Print *text* in red, prefixed with a cross mark."""
    message = f"✗ {text}"
    print(f"{RED}{message}{RESET}")
53
+
54
+
55
def print_info(text):
    """Print *text* in blue, prefixed with an information symbol."""
    message = f"ℹ {text}"
    print(f"{BLUE}{message}{RESET}")
58
+
59
+
60
def check_dependencies():
    """Report whether each required third-party package can be imported.

    Every package is attempted (no early exit) so the user sees the full
    list of what is missing along with a single ``pip install`` hint.

    Returns:
        True when all packages import, False when at least one is missing.
    """
    print_header("Checking Python Dependencies")

    # (importable module name, name to use with pip)
    required = (
        ('google.genai', 'google-genai'),
        ('dotenv', 'python-dotenv'),
        ('PIL', 'pillow'),
    )

    not_installed = []
    for importable, pip_name in required:
        try:
            __import__(importable)
        except ImportError:
            print_error(f"{pip_name} is NOT installed")
            not_installed.append(pip_name)
        else:
            print_success(f"{pip_name} is installed")

    if not not_installed:
        return True

    print_error("\nMissing dependencies detected!")
    print_info(f"Install with: pip install {' '.join(not_installed)}")
    return False
86
+
87
+
88
def check_centralized_resolver():
    """Check whether ``scripts/resolve_env.py`` exists and can be imported.

    The resolver is looked up four directory levels above this file.
    NOTE(review): that is presumably the ``.claude`` root in the installed
    layout - confirm against the actual install location.

    Returns:
        True when the resolver imports, or when it is absent (the skill
        then relies on fallback resolution). False only when the file is
        present but importing it raises ImportError.
    """
    print_header("Checking Centralized Resolver")

    root_dir = Path(__file__).parent.parent.parent.parent
    resolver_file = root_dir / 'scripts' / 'resolve_env.py'

    if not resolver_file.exists():
        print_warning(f"Centralized resolver not found: {resolver_file}")
        print_info("Skill will use fallback resolution logic")
        return True  # Not critical, fallback works

    print_success(f"Centralized resolver found: {resolver_file}")

    # Make the resolver's directory importable, then try the import itself.
    sys.path.insert(0, str(resolver_file.parent))
    try:
        from resolve_env import resolve_env  # noqa: F401 - import probe only
    except ImportError as exc:
        print_error(f"Centralized resolver exists but cannot be imported: {exc}")
        return False

    print_success("Centralized resolver can be imported")
    return True
111
+
112
+
113
def _mask_api_key(api_key):
    """Return a display-safe preview of *api_key* that hides most of it.

    Keys shorter than 12 characters are masked entirely, because showing
    a prefix and suffix would reveal most or all of the secret. Longer
    keys show only the first and last four characters.
    """
    if len(api_key) < 12:
        return '*' * len(api_key)
    return f"{api_key[:4]}...{api_key[-4:]}"


def find_api_key():
    """Locate GEMINI_API_KEY, preferring the centralized resolver.

    The resolver (``scripts/resolve_env.py`` four directory levels above
    this file) is tried first. If it cannot be imported, the function
    falls back to the ``GEMINI_API_KEY`` environment variable.

    Only a masked preview of the key is printed, so the secret does not
    end up in terminal scrollback or captured logs.

    Returns:
        The API key string, or None when no key was found.
    """
    print_header("Checking API Key Configuration")

    # Try to use centralized resolver
    claude_root = Path(__file__).parent.parent.parent.parent
    sys.path.insert(0, str(claude_root / 'scripts'))
    try:
        from resolve_env import resolve_env
    except ImportError:
        print_warning("Centralized resolver not available, using fallback")

        # Fallback: check environment
        api_key = os.getenv('GEMINI_API_KEY')
        if api_key:
            print_success("API key found in process.env")
            print_info(f"Key preview: {_mask_api_key(api_key)}")
            return api_key

        print_error("API key not found")
        return None

    print_info("Using centralized resolver...")
    api_key = resolve_env('GEMINI_API_KEY', skill='ai-multimodal')

    if not api_key:
        print_error("API key not found in any location")
        return None

    print_success("API key found via centralized resolver")
    print_info(f"Key preview: {_mask_api_key(api_key)}")

    # Point the user at the resolver's verbose mode to see the source.
    print_info("\nTo see where the key was found, run:")
    print_info("python ~/.claude/scripts/resolve_env.py GEMINI_API_KEY --skill ai-multimodal --verbose")

    return api_key
151
+
152
+
153
def validate_api_key_format(api_key):
    """Run a shallow sanity check on the shape of *api_key*.

    Returns:
        False for an empty/None key or a key of 20 characters or fewer
        that lacks the ``AIza`` prefix; True otherwise. An unrecognized
        but long key is accepted with a warning.
    """
    if not api_key:
        return False

    # Google AI Studio keys typically start with 'AIza'
    if api_key.startswith('AIza'):
        print_success("API key format looks valid (Google AI Studio)")
        return True

    if len(api_key) <= 20:
        print_error("API key format looks invalid (too short)")
        return False

    print_warning("API key format not recognized (may be Vertex AI or custom)")
    return True
168
+
169
+
170
def test_api_connection(api_key):
    """Verify *api_key* by listing models through the Gemini client.

    Builds ``genai.Client(api_key=api_key)``, lists the available models
    and prints the names of up to five of them.

    Returns:
        True when the model listing succeeds; False when ``google.genai``
        cannot be imported or any other exception is raised.
    """
    print_header("Testing API Connection")

    try:
        from google import genai

        print_info("Initializing Gemini client...")
        gemini = genai.Client(api_key=api_key)

        print_info("Fetching available models...")
        # A successful listing proves the key is accepted by the API.
        available = list(gemini.models.list())
        total = len(available)

        print_success(f"API connection successful! Found {total} available models")

        # Show a small sample rather than the full catalogue.
        print_info("\nSample available models:")
        sample = available[:5]
        for entry in sample:
            print(f" - {entry.name}")

        return True

    except ImportError:
        print_error("google-genai package not installed")
        return False
    except Exception as exc:
        # Top-level boundary of a diagnostic script: report, don't crash.
        print_error(f"API connection failed: {exc!s}")
        return False
199
+
200
+
201
def check_directory_structure():
    """Check that the files the skill relies on are present on disk.

    ``SKILL.md`` and ``.env.example`` are expected in the parent of this
    script's directory; ``gemini_batch_process.py`` next to this script.
    Every file is checked and reported, even after a miss.

    Returns:
        True when all files exist, False otherwise.
    """
    print_header("Checking Directory Structure")

    scripts_root = Path(__file__).parent
    skill_root = scripts_root.parent

    expected = {
        'SKILL.md': skill_root / 'SKILL.md',
        '.env.example': skill_root / '.env.example',
        'gemini_batch_process.py': scripts_root / 'gemini_batch_process.py',
    }

    complete = True
    for label, location in expected.items():
        if not location.exists():
            print_error(f"{label} NOT found at {location}")
            complete = False
            continue
        print_success(f"{label} exists")

    return complete
224
+
225
+
226
def provide_setup_instructions():
    """Print step-by-step guidance for configuring GEMINI_API_KEY.

    Covers obtaining a key, three ways to configure it, how to re-run
    this checker, and the resolver commands useful for debugging.
    """
    print_header("Setup Instructions")

    this_script = Path(__file__)
    skill_dir = this_script.parent.parent

    print_info("To configure the ai-multimodal skill:")

    steps = (
        "\n1. Get a Gemini API key:",
        " → Visit: https://aistudio.google.com/apikey",
        "\n2. Configure the API key (choose one method):",
        "\n Option A: User global config (recommended)",
        " $ echo 'GEMINI_API_KEY=your-api-key-here' >> ~/.claude/.env",
        "\n Option B: Skill-specific config",
        f" $ cd {skill_dir}",
        " $ cp .env.example .env",
        " $ # Edit .env and add your API key",
        "\n Option C: Runtime environment (temporary)",
        " $ export GEMINI_API_KEY='your-api-key-here'",
        "\n3. Verify setup:",
        f" $ python {this_script}",
        "\n4. Debug if needed:",
        " $ python ~/.claude/scripts/resolve_env.py --show-hierarchy --skill ai-multimodal",
        " $ python ~/.claude/scripts/resolve_env.py GEMINI_API_KEY --skill ai-multimodal --verbose",
    )
    for line in steps:
        print(line)
256
+
257
+
258
def main():
    """Run every setup check in order and exit non-zero on failure.

    Missing dependencies or a missing API key abort immediately (after
    printing setup instructions) because later checks depend on them.
    The resolver check is informational only; its result is not used.
    """
    print(f"\n{BOLD}AI Multimodal Skill - Setup Checker{RESET}")

    # Check directory structure
    structure_ok = check_directory_structure()

    # Check centralized resolver (result intentionally ignored)
    check_centralized_resolver()

    # Check dependencies
    if not check_dependencies():
        provide_setup_instructions()
        sys.exit(1)

    # Check API key
    api_key = find_api_key()
    if not api_key:
        print_error("\n❌ GEMINI_API_KEY not found in any location")
        provide_setup_instructions()
        sys.exit(1)

    # Both remaining checks always run so the user sees every problem.
    format_ok = validate_api_key_format(api_key)
    connection_ok = test_api_connection(api_key)

    # Final summary
    print_header("Setup Summary")

    if not (structure_ok and format_ok and connection_ok):
        print_error("❌ Some checks failed. Please fix the issues above.")
        sys.exit(1)

    print_success("✅ All checks passed! The ai-multimodal skill is ready to use.")
    print_info("\nNext steps:")
    closing_lines = (
        " • Read SKILL.md for usage examples",
        " • Try: python scripts/gemini_batch_process.py --help",
        "\nImage generation models:",
        " • gemini-2.5-flash-image - Nano Banana Flash (DEFAULT - fast)",
        " • imagen-4.0-generate-001 - Imagen 4 (alternative - production)",
        " • gemini-3-pro-image-preview - Nano Banana Pro (4K text, reasoning)",
        "\nExample (uses default model):",
        " python scripts/gemini_batch_process.py --task generate \\",
        " --prompt 'A sunset over mountains' --aspect-ratio 16:9 --size 2K",
    )
    for line in closing_lines:
        print(line)


if __name__ == '__main__':
    main()
@@ -0,0 +1,395 @@
1
+ #!/usr/bin/env python3
2
+ """
3
+ Convert documents to Markdown using Gemini API.
4
+
5
+ Supports all document types:
6
+ - PDF documents (native vision processing)
7
+ - Images (JPEG, PNG, WEBP, HEIC)
8
+ - Office documents (DOCX, XLSX, PPTX)
9
+ - HTML, TXT, and other text formats
10
+
11
+ Features:
12
+ - Converts to clean markdown format
13
+ - Preserves structure, tables, and formatting
14
+ - Extracts text from images and scanned documents
15
+ - Batch conversion support
16
+ - Saves to docs/assets/document-extraction.md by default
17
+ """
18
+
19
+ import argparse
20
+ import os
21
+ import sys
22
+ import time
23
+ from pathlib import Path
24
+ from typing import Optional, List, Dict, Any
25
+
26
+ try:
27
+ from google import genai
28
+ from google.genai import types
29
+ except ImportError:
30
+ print("Error: google-genai package not installed")
31
+ print("Install with: pip install google-genai")
32
+ sys.exit(1)
33
+
34
+ try:
35
+ from dotenv import load_dotenv
36
+ except ImportError:
37
+ load_dotenv = None
38
+
39
+
40
def find_api_key() -> Optional[str]:
    """Resolve GEMINI_API_KEY, preferring the most specific source.

    Lookup order (first non-empty value wins):
        1. The current process environment
        2. .claude/skills/ai-multimodal/.env (skill-specific config)
        3. .claude/skills/.env (shared skills config)
        4. .claude/.env (Claude global config)

    The .env files are consulted only when python-dotenv could be imported.

    Returns:
        The API key, or None when no source provides one.
    """
    env_name = 'GEMINI_API_KEY'

    # A value already present in the environment always wins.
    key = os.getenv(env_name)
    if key:
        return key

    # Without python-dotenv there is nothing further to consult.
    if not load_dotenv:
        return None

    # Walk outwards from this script: skill dir, shared skills dir, .claude dir.
    skill_dir = Path(__file__).parent.parent
    search_dirs = (skill_dir, skill_dir.parent, skill_dir.parent.parent)

    for config_dir in search_dirs:
        dotenv_path = config_dir / '.env'
        if not dotenv_path.exists():
            continue
        load_dotenv(dotenv_path)
        key = os.getenv(env_name)
        if key:
            return key

    return None
87
+
88
+
89
def find_project_root() -> Path:
    """Return the nearest directory holding a .git or .claude entry.

    The search starts at this script's directory and moves up through its
    parents. When no directory qualifies, the script's own directory is
    returned.
    """
    here = Path(__file__).parent
    candidates = (here, *here.parents)
    return next(
        (
            folder
            for folder in candidates
            if (folder / '.git').exists() or (folder / '.claude').exists()
        ),
        here,
    )
99
+
100
+
101
def get_mime_type(file_path: str) -> str:
    """Look up the MIME type for a file based on its extension.

    The extension is matched case-insensitively. Extensions that are not
    in the table map to 'application/octet-stream'.
    """
    document_types = {
        '.pdf': 'application/pdf',
        '.txt': 'text/plain',
        '.html': 'text/html',
        '.htm': 'text/html',
        '.md': 'text/markdown',
        '.csv': 'text/csv',
    }
    image_types = {
        '.jpg': 'image/jpeg',
        '.jpeg': 'image/jpeg',
        '.png': 'image/png',
        '.webp': 'image/webp',
        '.heic': 'image/heic',
        '.heif': 'image/heif',
    }
    # Office formats (need to be uploaded as binary)
    office_types = {
        '.docx': 'application/vnd.openxmlformats-officedocument.wordprocessingml.document',
        '.xlsx': 'application/vnd.openxmlformats-officedocument.spreadsheetml.sheet',
        '.pptx': 'application/vnd.openxmlformats-officedocument.presentationml.presentation',
    }
    known_types = {**document_types, **image_types, **office_types}

    suffix = Path(file_path).suffix.lower()
    try:
        return known_types[suffix]
    except KeyError:
        return 'application/octet-stream'
127
+
128
+
129
def upload_file(client: genai.Client, file_path: str, verbose: bool = False) -> Any:
    """Upload a file through the client's File API and wait for processing.

    The file's state is polled every 2 seconds for at most 300 seconds
    while it reports 'PROCESSING'.

    Args:
        client: Client whose ``files.upload`` / ``files.get`` are used.
        file_path: Path of the file to upload.
        verbose: Print progress messages when True.

    Returns:
        The file object returned by the client once processing is over.

    Raises:
        ValueError: The file ended in the 'FAILED' state.
        TimeoutError: The file was still 'PROCESSING' after the wait limit.
    """
    poll_seconds = 2
    max_wait = 300  # 5 minutes

    if verbose:
        print(f"Uploading {file_path}...")

    uploaded = client.files.upload(file=file_path)

    # `elapsed` counts seconds slept so far (2, 4, ..., max_wait).
    for elapsed in range(poll_seconds, max_wait + 1, poll_seconds):
        if uploaded.state.name != 'PROCESSING':
            break
        time.sleep(poll_seconds)
        uploaded = client.files.get(name=uploaded.name)
        if verbose and elapsed % 10 == 0:
            print(f" Processing... {elapsed}s")

    if uploaded.state.name == 'FAILED':
        raise ValueError(f"File processing failed: {file_path}")

    if uploaded.state.name == 'PROCESSING':
        raise TimeoutError(f"Processing timeout after {max_wait}s: {file_path}")

    if verbose:
        print(f" Uploaded: {uploaded.name}")

    return uploaded
156
+
157
+
158
def convert_to_markdown(
    client: genai.Client,
    file_path: str,
    model: str = 'gemini-2.5-flash',
    custom_prompt: Optional[str] = None,
    verbose: bool = False,
    max_retries: int = 3
) -> Dict[str, Any]:
    """Convert a document to markdown using Gemini.

    Files larger than 20 MB are sent through upload_file(); smaller files
    are read once and sent inline with the MIME type from get_mime_type().
    Failed attempts are retried with exponential back-off (1s, 2s, 4s, ...).

    Args:
        client: Gemini client used for upload and generation.
        file_path: Path of the document to convert.
        model: Model name passed to ``generate_content``.
        custom_prompt: Replaces the default conversion prompt when non-empty.
        verbose: Print retry/progress messages when True.
        max_retries: Maximum number of attempts; values below 1 are treated
            as 1 so a result dict is always returned.

    Returns:
        A dict with keys 'file', 'status' ('success' or 'error') and
        'markdown'; error results additionally carry 'error' (the message)
        and have 'markdown' set to None.
    """

    def _error_result(exc: Exception) -> Dict[str, Any]:
        # Shape of the failure record consumed by batch_convert().
        return {
            'file': str(file_path),
            'status': 'error',
            'error': str(exc),
            'markdown': None
        }

    # Default prompt for markdown conversion
    prompt = custom_prompt or """Convert this document to clean, well-formatted Markdown.

Requirements:
- Preserve all content, structure, and formatting
- Convert tables to markdown table format
- Maintain heading hierarchy (# ## ### etc)
- Preserve lists, code blocks, and quotes
- Extract text from images if present
- Keep formatting consistent and readable

Output only the markdown content without any preamble or explanation."""

    # Local file access is deterministic: a missing or unreadable file will
    # not fix itself, so report it immediately instead of sleeping and
    # retrying.
    try:
        source = Path(file_path)
        use_file_api = source.stat().st_size > 20 * 1024 * 1024  # >20MB
        file_bytes = None if use_file_api else source.read_bytes()
    except Exception as e:
        return _error_result(e)

    # Always make at least one attempt so the function never falls off the
    # end and returns None.
    attempts = max(1, max_retries)
    uploaded = None

    for attempt in range(attempts):
        try:
            if use_file_api:
                # Reuse a successful upload across retries; only a failed
                # upload is attempted again.
                if uploaded is None:
                    uploaded = upload_file(client, str(file_path), verbose)
                content = [prompt, uploaded]
            else:
                content = [
                    prompt,
                    types.Part.from_bytes(
                        data=file_bytes,
                        mime_type=get_mime_type(str(file_path))
                    )
                ]

            # Generate markdown
            response = client.models.generate_content(
                model=model,
                contents=content
            )

            return {
                'file': str(file_path),
                'status': 'success',
                'markdown': getattr(response, 'text', '')
            }

        except Exception as e:
            if attempt == attempts - 1:
                return _error_result(e)

            wait_time = 2 ** attempt
            if verbose:
                print(f" Retry {attempt + 1} after {wait_time}s: {e}")
            time.sleep(wait_time)
231
+
232
+
233
def batch_convert(
    files: List[str],
    output_file: Optional[str] = None,
    auto_name: bool = False,
    model: str = 'gemini-2.5-flash',
    custom_prompt: Optional[str] = None,
    verbose: bool = False
) -> List[Dict[str, Any]]:
    """Convert several files and write one combined markdown report.

    Args:
        files: Paths of the documents to convert.
        output_file: Report destination. When omitted, the report goes to
            <project-root>/docs/assets/, named "<stem>-extraction.md" if
            ``auto_name`` is set and exactly one file is given, otherwise
            "document-extraction.md".
        auto_name: Derive the default report name from the single input.
        model: Gemini model name forwarded to convert_to_markdown().
        custom_prompt: Optional prompt forwarded to convert_to_markdown().
        verbose: Print per-file progress when True.

    Returns:
        The per-file result dicts, in input order.

    Exits the process with status 1 when no API key can be found.
    """
    api_key = find_api_key()
    if not api_key:
        for line in (
            "Error: GEMINI_API_KEY not found",
            "Set via: export GEMINI_API_KEY='your-key'",
            "Or create .env file with: GEMINI_API_KEY=your-key",
        ):
            print(line)
        sys.exit(1)

    client = genai.Client(api_key=api_key)

    # Work out where the report goes when the caller did not say.
    if not output_file:
        default_dir = find_project_root() / 'docs' / 'assets'
        if auto_name and len(files) == 1:
            report_name = f"{Path(files[0]).stem}-extraction.md"
        else:
            report_name = 'document-extraction.md'
        output_file = str(default_dir / report_name)

    output_path = Path(output_file)
    output_path.parent.mkdir(parents=True, exist_ok=True)

    # Convert the inputs one by one, keeping every outcome.
    results = []
    total = len(files)
    for index, file_path in enumerate(files, 1):
        if verbose:
            print(f"\n[{index}/{total}] Converting: {file_path}")

        outcome = convert_to_markdown(
            client=client,
            file_path=file_path,
            model=model,
            custom_prompt=custom_prompt,
            verbose=verbose
        )
        results.append(outcome)

        if verbose:
            print(f" Status: {outcome.get('status', 'unknown')}")

    # Write the combined report: one section per input file.
    with open(output_path, 'w', encoding='utf-8') as report:
        report.write("# Document Extraction Results\n\n")
        report.write(f"Converted {len(files)} document(s) to markdown.\n\n")
        report.write("---\n\n")

        for outcome in results:
            report.write(f"## {Path(outcome['file']).name}\n\n")

            if outcome['status'] != 'success':
                report.write(f"**Error**: {outcome.get('error', 'Unknown error')}\n\n")
            elif outcome.get('markdown'):
                report.write(outcome['markdown'])
                report.write("\n\n")
            else:
                report.write("**Note**: Conversion succeeded but no content was returned.\n\n")

            report.write("---\n\n")

    # The summary is always printed, regardless of `verbose`.
    succeeded = sum(1 for outcome in results if outcome['status'] == 'success')
    failed = sum(1 for outcome in results if outcome['status'] == 'error')
    print(f"\n{'='*50}")
    print(f"Converted: {len(results)} file(s)")
    print(f"Success: {succeeded}")
    print(f"Failed: {failed}")
    print(f"Output saved to: {output_path}")

    return results
315
+
316
+
317
def main():
    """Parse CLI arguments, resolve the input files, and run the conversion.

    Each --input value is used as a literal path when it names an existing
    file; otherwise it is expanded as a glob pattern (matches are sorted so
    the processing order is stable). A value that resolves to no file is
    reported on stderr instead of being dropped silently. Exits with
    status 1 when no input file can be resolved at all.
    """
    # Imported locally: glob is not among this file's top-level imports.
    import glob

    parser = argparse.ArgumentParser(
        description='Convert documents to Markdown using Gemini API',
        formatter_class=argparse.RawDescriptionHelpFormatter,
        epilog="""
Examples:
# Convert single PDF to markdown (default name)
%(prog)s --input document.pdf

# Auto-generate meaningful filename
%(prog)s --input testpdf.pdf --auto-name
# Output: docs/assets/testpdf-extraction.md

# Convert multiple files
%(prog)s --input doc1.pdf doc2.docx image.png

# Specify custom output location
%(prog)s --input document.pdf --output ./output.md

# Use custom prompt
%(prog)s --input document.pdf --prompt "Extract only the tables as markdown"

# Batch convert directory
%(prog)s --input ./documents/*.pdf --verbose

Supported formats:
- PDF documents (up to 1,000 pages)
- Images (JPEG, PNG, WEBP, HEIC)
- Office documents (DOCX, XLSX, PPTX)
- Text formats (TXT, HTML, Markdown, CSV)

Default output: <project-root>/docs/assets/document-extraction.md
"""
    )

    parser.add_argument('--input', '-i', nargs='+', required=True,
                        help='Input file(s) to convert')
    parser.add_argument('--output', '-o',
                        help='Output markdown file (default: docs/assets/document-extraction.md)')
    parser.add_argument('--auto-name', '-a', action='store_true',
                        help='Auto-generate meaningful output filename from input (e.g., document.pdf -> document-extraction.md)')
    parser.add_argument('--model', default='gemini-2.5-flash',
                        help='Gemini model to use (default: gemini-2.5-flash)')
    parser.add_argument('--prompt', '-p',
                        help='Custom prompt for conversion')
    parser.add_argument('--verbose', '-v', action='store_true',
                        help='Verbose output')

    args = parser.parse_args()

    # Validate input files
    files = []
    for file_pattern in args.input:
        if Path(file_pattern).is_file():
            # Keep the original normalisation of literal paths.
            files.append(str(Path(file_pattern)))
            continue

        # Not an existing file: treat the value as a glob pattern.
        matched = sorted(f for f in glob.glob(file_pattern) if Path(f).is_file())
        if not matched:
            print(f"Warning: no files matched input: {file_pattern}", file=sys.stderr)
        files.extend(matched)

    if not files:
        print("Error: No valid input files found")
        sys.exit(1)

    # Convert files
    batch_convert(
        files=files,
        output_file=args.output,
        auto_name=args.auto_name,
        model=args.model,
        custom_prompt=args.prompt,
        verbose=args.verbose
    )
392
+
393
+
394
# Run the converter CLI only when this file is executed as a script.
if __name__ == '__main__':
    main()