skillstore-cli 1.0.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (231) hide show
  1. package/README.md +95 -0
  2. package/data/bundles/devflow-complete.json +19 -0
  3. package/data/free-skills/devflow-agile/manifest.json +19 -0
  4. package/data/free-skills/devflow-agile/plugin/commands/agile/retro.md +23 -0
  5. package/data/free-skills/devflow-agile/plugin/commands/agile/review.md +21 -0
  6. package/data/free-skills/devflow-agile/plugin/commands/agile/sprint.md +30 -0
  7. package/data/free-skills/devflow-agile/plugin/commands/agile/standup.md +20 -0
  8. package/data/free-skills/devflow-agile/plugin/commands/agile.md +35 -0
  9. package/data/free-skills/devflow-agile/plugin/commands/devflow.md +42 -0
  10. package/data/free-skills/devflow-agile/plugin/skills/developer/SKILL.md +93 -0
  11. package/data/free-skills/devflow-agile/plugin/skills/developer/assets/sample-output.md +182 -0
  12. package/data/free-skills/devflow-agile/plugin/skills/developer/references/clean-architecture.md +361 -0
  13. package/data/free-skills/devflow-agile/plugin/skills/developer/references/clean-code-guide.md +207 -0
  14. package/data/free-skills/devflow-agile/plugin/skills/developer/references/debugging-methodology.md +191 -0
  15. package/data/free-skills/devflow-agile/template/agents/agile-coach.md +76 -0
  16. package/data/free-skills/devflow-agile/template/workflows/agile-sprint-workflow.md +81 -0
  17. package/data/free-skills/devflow-bootstrap/manifest.json +8 -0
  18. package/data/free-skills/devflow-bootstrap/plugin/commands/bootstrap/auto.md +31 -0
  19. package/data/free-skills/devflow-bootstrap/plugin/commands/bootstrap.md +38 -0
  20. package/data/free-skills/devflow-bootstrap/plugin/commands/devflow.md +20 -0
  21. package/data/free-skills/devflow-bootstrap/plugin/skills/project-scaffold/SKILL.md +56 -0
  22. package/data/free-skills/devflow-bootstrap/plugin/skills/project-scaffold/assets/sample-output.md +216 -0
  23. package/data/free-skills/devflow-bootstrap/plugin/skills/project-scaffold/references/architecture-decisions.md +254 -0
  24. package/data/free-skills/devflow-bootstrap/plugin/skills/project-scaffold/references/stack-templates.md +400 -0
  25. package/data/free-skills/devflow-bootstrap/template/agents/bootstrap-specialist.md +56 -0
  26. package/data/free-skills/devflow-bootstrap/template/workflows/bootstrap-workflow.md +70 -0
  27. package/data/free-skills/devflow-docs/manifest.json +8 -0
  28. package/data/free-skills/devflow-docs/plugin/commands/devflow.md +20 -0
  29. package/data/free-skills/devflow-docs/plugin/commands/docs/generate.md +17 -0
  30. package/data/free-skills/devflow-docs/plugin/commands/docs/parse.md +19 -0
  31. package/data/free-skills/devflow-docs/plugin/commands/docs.md +26 -0
  32. package/data/free-skills/devflow-docs/plugin/skills/pdf-processor/SKILL.md +59 -0
  33. package/data/free-skills/devflow-docs/plugin/skills/pdf-processor/assets/sample-output.md +114 -0
  34. package/data/free-skills/devflow-docs/plugin/skills/pdf-processor/references/extraction-techniques.md +115 -0
  35. package/data/free-skills/devflow-docs/plugin/skills/pdf-processor/references/ocr-strategies.md +167 -0
  36. package/data/free-skills/devflow-docs/template/agents/docs-specialist.md +35 -0
  37. package/data/free-skills/devflow-docs/template/workflows/docs-workflow.md +70 -0
  38. package/data/free-skills/devflow-postproject/manifest.json +13 -0
  39. package/data/free-skills/devflow-postproject/plugin/commands/devflow.md +34 -0
  40. package/data/free-skills/devflow-postproject/plugin/commands/postproject/handover.md +21 -0
  41. package/data/free-skills/devflow-postproject/plugin/commands/postproject/retro.md +21 -0
  42. package/data/free-skills/devflow-postproject/plugin/commands/postproject/support.md +21 -0
  43. package/data/free-skills/devflow-postproject/plugin/commands/postproject.md +32 -0
  44. package/data/free-skills/devflow-postproject/plugin/skills/retrospective/SKILL.md +70 -0
  45. package/data/free-skills/devflow-postproject/plugin/skills/retrospective/assets/sample-output.md +79 -0
  46. package/data/free-skills/devflow-postproject/plugin/skills/retrospective/references/facilitation-techniques.md +178 -0
  47. package/data/free-skills/devflow-postproject/plugin/skills/retrospective/references/lessons-learned-template.md +118 -0
  48. package/data/free-skills/devflow-postproject/plugin/skills/retrospective/references/retro-techniques.md +100 -0
  49. package/data/free-skills/devflow-postproject/template/agents/transition-manager.md +71 -0
  50. package/data/free-skills/devflow-postproject/template/workflows/transition-workflow.md +72 -0
  51. package/data/free-skills/devflow-presale/manifest.json +15 -0
  52. package/data/free-skills/devflow-presale/plugin/commands/devflow.md +47 -0
  53. package/data/free-skills/devflow-presale/plugin/commands/presale/analyze.md +30 -0
  54. package/data/free-skills/devflow-presale/plugin/commands/presale/estimate.md +30 -0
  55. package/data/free-skills/devflow-presale/plugin/commands/presale/price.md +30 -0
  56. package/data/free-skills/devflow-presale/plugin/commands/presale/propose.md +30 -0
  57. package/data/free-skills/devflow-presale/plugin/commands/presale.md +42 -0
  58. package/data/free-skills/devflow-presale/plugin/skills/requirement-analysis/SKILL.md +63 -0
  59. package/data/free-skills/devflow-presale/plugin/skills/requirement-analysis/assets/sample-output.md +129 -0
  60. package/data/free-skills/devflow-presale/plugin/skills/requirement-analysis/references/extraction-framework.md +140 -0
  61. package/data/free-skills/devflow-presale/plugin/skills/requirement-analysis/references/output-template.md +132 -0
  62. package/data/free-skills/devflow-presale/template/agents/presale-lead.md +83 -0
  63. package/data/free-skills/devflow-presale/template/agents/proposal-reviewer.md +63 -0
  64. package/data/free-skills/devflow-presale/template/workflows/presale-workflow.md +70 -0
  65. package/data/registry/categories.json +7 -0
  66. package/data/registry/packages.json +184 -0
  67. package/data/shared/framework/agents/brainstormer.md +74 -0
  68. package/data/shared/framework/agents/code-reviewer.md +87 -0
  69. package/data/shared/framework/agents/debugger.md +84 -0
  70. package/data/shared/framework/agents/docs-manager.md +55 -0
  71. package/data/shared/framework/agents/git-manager.md +59 -0
  72. package/data/shared/framework/agents/planner.md +68 -0
  73. package/data/shared/framework/agents/researcher.md +66 -0
  74. package/data/shared/framework/agents/tester.md +65 -0
  75. package/data/shared/framework/commands/cook/auto.md +27 -0
  76. package/data/shared/framework/commands/cook.md +45 -0
  77. package/data/shared/framework/commands/fix/ci.md +21 -0
  78. package/data/shared/framework/commands/fix/test.md +26 -0
  79. package/data/shared/framework/commands/fix/types.md +29 -0
  80. package/data/shared/framework/commands/fix.md +26 -0
  81. package/data/shared/framework/commands/git/cm.md +37 -0
  82. package/data/shared/framework/commands/git/pr.md +40 -0
  83. package/data/shared/framework/config/CLAUDE.md.template +26 -0
  84. package/data/shared/framework/config/settings.json +41 -0
  85. package/data/shared/framework/config/skillstore.config.json +29 -0
  86. package/data/shared/framework/hooks/discord-notify.sh +85 -0
  87. package/data/shared/framework/hooks/docs-sync.sh +53 -0
  88. package/data/shared/framework/hooks/modularization-hook.js +103 -0
  89. package/data/shared/framework/hooks/notification.js +94 -0
  90. package/data/shared/framework/hooks/quality-gate.js +109 -0
  91. package/data/shared/framework/hooks/scout-block.js +77 -0
  92. package/data/shared/framework/hooks/telegram-notify.sh +77 -0
  93. package/data/shared/framework/protocols/error-recovery.md +80 -0
  94. package/data/shared/framework/protocols/orchestration-protocol.md +112 -0
  95. package/data/shared/framework/quality/review-protocol.md +76 -0
  96. package/data/shared/framework/quality/verification-protocol.md +66 -0
  97. package/data/shared/framework/rules/development-rules.md +75 -0
  98. package/data/shared/framework/skills/backend-development/SKILL.md +77 -0
  99. package/data/shared/framework/skills/backend-development/assets/sample-output.md +175 -0
  100. package/data/shared/framework/skills/backend-development/references/advanced-patterns.md +180 -0
  101. package/data/shared/framework/skills/backend-development/references/api-design-guide.md +160 -0
  102. package/data/shared/framework/skills/backend-development/references/architecture-patterns.md +183 -0
  103. package/data/shared/framework/skills/backend-development/references/observability-resilience.md +155 -0
  104. package/data/shared/framework/skills/backend-development/references/troubleshooting.md +199 -0
  105. package/data/shared/framework/skills/codebase-analysis/SKILL.md +72 -0
  106. package/data/shared/framework/skills/codebase-analysis/assets/sample-output.md +263 -0
  107. package/data/shared/framework/skills/codebase-analysis/references/analysis-techniques.md +241 -0
  108. package/data/shared/framework/skills/codebase-analysis/references/dependency-mapping.md +280 -0
  109. package/data/shared/framework/skills/codebase-analysis/references/tech-debt-assessment.md +208 -0
  110. package/data/shared/framework/skills/databases/SKILL.md +72 -0
  111. package/data/shared/framework/skills/databases/assets/sample-output.md +212 -0
  112. package/data/shared/framework/skills/databases/references/advanced-data-patterns.md +259 -0
  113. package/data/shared/framework/skills/databases/references/query-optimization.md +214 -0
  114. package/data/shared/framework/skills/databases/references/schema-design.md +159 -0
  115. package/data/shared/framework/skills/databases/references/troubleshooting.md +214 -0
  116. package/data/shared/framework/skills/debugging-investigation/SKILL.md +84 -0
  117. package/data/shared/framework/skills/debugging-investigation/assets/sample-output.md +314 -0
  118. package/data/shared/framework/skills/debugging-investigation/references/systematic-debugging.md +197 -0
  119. package/data/shared/framework/skills/debugging-investigation/references/tool-specific-guides.md +202 -0
  120. package/data/shared/framework/skills/debugging-investigation/references/troubleshooting-patterns.md +196 -0
  121. package/data/shared/framework/skills/frontend-development/SKILL.md +67 -0
  122. package/data/shared/framework/skills/frontend-development/assets/sample-output.md +110 -0
  123. package/data/shared/framework/skills/frontend-development/references/component-patterns.md +112 -0
  124. package/data/shared/framework/skills/frontend-development/references/performance-guide.md +169 -0
  125. package/data/shared/framework/skills/frontend-development/references/routing-forms-realtime.md +374 -0
  126. package/data/shared/framework/skills/frontend-development/references/ssr-rsc-patterns.md +284 -0
  127. package/data/shared/framework/skills/frontend-development/references/troubleshooting.md +154 -0
  128. package/data/shared/framework/skills/mobile-development/SKILL.md +67 -0
  129. package/data/shared/framework/skills/mobile-development/assets/sample-output.md +382 -0
  130. package/data/shared/framework/skills/mobile-development/references/mobile-patterns.md +681 -0
  131. package/data/shared/framework/skills/mobile-development/references/mobile-performance.md +524 -0
  132. package/data/shared/framework/skills/mobile-development/references/troubleshooting.md +158 -0
  133. package/data/shared/framework/skills/security-audit/SKILL.md +83 -0
  134. package/data/shared/framework/skills/security-audit/assets/sample-output.md +451 -0
  135. package/data/shared/framework/skills/security-audit/references/owasp-checklist.md +580 -0
  136. package/data/shared/framework/skills/security-audit/references/secure-coding-patterns.md +433 -0
  137. package/data/shared/framework/skills/security-audit/references/vulnerability-remediation.md +331 -0
  138. package/data/shared/framework/skills/ui-generation/SKILL.md +70 -0
  139. package/data/shared/framework/skills/ui-generation/assets/sample-output.md +139 -0
  140. package/data/shared/framework/skills/ui-generation/references/accessibility-responsive.md +127 -0
  141. package/data/shared/framework/skills/ui-generation/references/compound-components.md +252 -0
  142. package/data/shared/framework/skills/ui-generation/references/generation-patterns.md +110 -0
  143. package/data/shared/framework/skills/ui-generation/references/storybook-design-system.md +278 -0
  144. package/data/shared/framework/skills/ui-generation/references/troubleshooting.md +198 -0
  145. package/data/shared/framework/workflows/documentation-management.md +58 -0
  146. package/data/shared/framework/workflows/primary-workflow.md +88 -0
  147. package/dist/commands/activate.d.ts +3 -0
  148. package/dist/commands/activate.d.ts.map +1 -0
  149. package/dist/commands/activate.js +34 -0
  150. package/dist/commands/activate.js.map +1 -0
  151. package/dist/commands/bundle.d.ts +3 -0
  152. package/dist/commands/bundle.d.ts.map +1 -0
  153. package/dist/commands/bundle.js +64 -0
  154. package/dist/commands/bundle.js.map +1 -0
  155. package/dist/commands/install.d.ts +3 -0
  156. package/dist/commands/install.d.ts.map +1 -0
  157. package/dist/commands/install.js +99 -0
  158. package/dist/commands/install.js.map +1 -0
  159. package/dist/commands/list.d.ts +3 -0
  160. package/dist/commands/list.d.ts.map +1 -0
  161. package/dist/commands/list.js +37 -0
  162. package/dist/commands/list.js.map +1 -0
  163. package/dist/commands/search.d.ts +3 -0
  164. package/dist/commands/search.d.ts.map +1 -0
  165. package/dist/commands/search.js +30 -0
  166. package/dist/commands/search.js.map +1 -0
  167. package/dist/commands/status.d.ts +3 -0
  168. package/dist/commands/status.d.ts.map +1 -0
  169. package/dist/commands/status.js +35 -0
  170. package/dist/commands/status.js.map +1 -0
  171. package/dist/commands/update.d.ts +3 -0
  172. package/dist/commands/update.d.ts.map +1 -0
  173. package/dist/commands/update.js +68 -0
  174. package/dist/commands/update.js.map +1 -0
  175. package/dist/download/cache.d.ts +3 -0
  176. package/dist/download/cache.d.ts.map +1 -0
  177. package/dist/download/cache.js +18 -0
  178. package/dist/download/cache.js.map +1 -0
  179. package/dist/download/client.d.ts +2 -0
  180. package/dist/download/client.d.ts.map +1 -0
  181. package/dist/download/client.js +58 -0
  182. package/dist/download/client.js.map +1 -0
  183. package/dist/index.d.ts +3 -0
  184. package/dist/index.d.ts.map +1 -0
  185. package/dist/index.js +23 -0
  186. package/dist/index.js.map +1 -0
  187. package/dist/installer/file-copier.d.ts +6 -0
  188. package/dist/installer/file-copier.d.ts.map +1 -0
  189. package/dist/installer/file-copier.js +32 -0
  190. package/dist/installer/file-copier.js.map +1 -0
  191. package/dist/installer/plugin-installer.d.ts +12 -0
  192. package/dist/installer/plugin-installer.d.ts.map +1 -0
  193. package/dist/installer/plugin-installer.js +33 -0
  194. package/dist/installer/plugin-installer.js.map +1 -0
  195. package/dist/installer/template-installer.d.ts +12 -0
  196. package/dist/installer/template-installer.d.ts.map +1 -0
  197. package/dist/installer/template-installer.js +45 -0
  198. package/dist/installer/template-installer.js.map +1 -0
  199. package/dist/license/crypto.d.ts +16 -0
  200. package/dist/license/crypto.d.ts.map +1 -0
  201. package/dist/license/crypto.js +50 -0
  202. package/dist/license/crypto.js.map +1 -0
  203. package/dist/license/license-store.d.ts +19 -0
  204. package/dist/license/license-store.d.ts.map +1 -0
  205. package/dist/license/license-store.js +99 -0
  206. package/dist/license/license-store.js.map +1 -0
  207. package/dist/license/validator.d.ts +32 -0
  208. package/dist/license/validator.d.ts.map +1 -0
  209. package/dist/license/validator.js +81 -0
  210. package/dist/license/validator.js.map +1 -0
  211. package/dist/registry/loader.d.ts +30 -0
  212. package/dist/registry/loader.d.ts.map +1 -0
  213. package/dist/registry/loader.js +22 -0
  214. package/dist/registry/loader.js.map +1 -0
  215. package/dist/registry/search-engine.d.ts +9 -0
  216. package/dist/registry/search-engine.d.ts.map +1 -0
  217. package/dist/registry/search-engine.js +30 -0
  218. package/dist/registry/search-engine.js.map +1 -0
  219. package/dist/utils/config.d.ts +14 -0
  220. package/dist/utils/config.d.ts.map +1 -0
  221. package/dist/utils/config.js +28 -0
  222. package/dist/utils/config.js.map +1 -0
  223. package/dist/utils/logger.d.ts +9 -0
  224. package/dist/utils/logger.d.ts.map +1 -0
  225. package/dist/utils/logger.js +22 -0
  226. package/dist/utils/logger.js.map +1 -0
  227. package/dist/utils/paths.d.ts +20 -0
  228. package/dist/utils/paths.d.ts.map +1 -0
  229. package/dist/utils/paths.js +79 -0
  230. package/dist/utils/paths.js.map +1 -0
  231. package/package.json +54 -0
@@ -0,0 +1,114 @@
1
+ # Sample Output: Government IT Modernization RFP
2
+
3
+ **Source**: `GOV-IT-Modernization-RFP-2026.pdf` (42 pages)
4
+ **Extraction Quality**: HIGH (native text PDF)
5
+ **Processed**: 42/42 pages
6
+
7
+ ---
8
+
9
+ ## Document Metadata
10
+
11
+ | Field | Value |
12
+ |-------|-------|
13
+ | Title | Request for Proposal: IT Infrastructure Modernization |
14
+ | Author | Department of Digital Services |
15
+ | Created | 2026-01-15 |
16
+ | Version | 2.1 (Final) |
17
+ | Pages | 42 |
18
+
19
+ ---
20
+
21
+ ## Executive Summary (Pages 1-3)
22
+
23
+ The Department of Digital Services seeks proposals for a comprehensive IT infrastructure modernization program. The program covers migration of 12 legacy systems to cloud-native architecture, implementation of zero-trust security framework, and establishment of a modern DevOps pipeline.
24
+
25
+ **Budget Range**: $8.5M - $12M over 3 years
26
+ **Submission Deadline**: 2026-04-30
27
+ **Contract Duration**: 36 months with 2 optional 12-month extensions
28
+
29
+ ---
30
+
31
+ ## Extracted Requirements Table (Pages 8-15)
32
+
33
+ | Req ID | Category | Description | Priority | Compliance |
34
+ |--------|----------|-------------|----------|------------|
35
+ | REQ-001 | Infrastructure | Migrate all 12 legacy systems to AWS GovCloud | Must Have | Mandatory |
36
+ | REQ-002 | Infrastructure | Achieve 99.95% uptime SLA for Tier 1 systems | Must Have | Mandatory |
37
+ | REQ-003 | Security | Implement zero-trust architecture per NIST 800-207 | Must Have | Mandatory |
38
+ | REQ-004 | Security | FedRAMP High authorization for all cloud services | Must Have | Mandatory |
39
+ | REQ-005 | DevOps | CI/CD pipeline with automated security scanning | Should Have | Scored |
40
+ | REQ-006 | DevOps | Infrastructure as Code for all deployments | Should Have | Scored |
41
+ | REQ-007 | Data | Data lake implementation for analytics workloads | Nice to Have | Scored |
42
+ | REQ-008 | Data | Real-time dashboard for system health monitoring | Should Have | Scored |
43
+ | REQ-009 | Training | Staff training program (min 200 personnel) | Must Have | Mandatory |
44
+ | REQ-010 | Support | 24/7 Tier 3 support during transition period | Must Have | Mandatory |
45
+
46
+ **Total Requirements Extracted**: 47 (10 shown above)
47
+ - Must Have: 23
48
+ - Should Have: 16
49
+ - Nice to Have: 8
50
+
51
+ ---
52
+
53
+ ## Budget Section (Pages 18-22)
54
+
55
+ ### Cost Breakdown by Phase
56
+
57
+ | Phase | Duration | Budget Allocation |
58
+ |-------|----------|-------------------|
59
+ | Phase 1: Assessment & Planning | Months 1-4 | $1.2M |
60
+ | Phase 2: Infrastructure Build | Months 5-14 | $4.5M |
61
+ | Phase 3: Migration & Testing | Months 15-26 | $3.8M |
62
+ | Phase 4: Optimization & Handover | Months 27-36 | $2.5M |
63
+ | **Total** | **36 months** | **$12.0M (max)** |
64
+
65
+ ### Budget Constraints
66
+ - Travel expenses capped at 5% of total contract value
67
+ - Hardware costs must not exceed 30% of Phase 2 budget
68
+ - Training budget: minimum $500K allocated
69
+
70
+ ---
71
+
72
+ ## Timeline (Pages 23-27)
73
+
74
+ ### Key Milestones
75
+
76
+ | Milestone | Target Date | Dependencies |
77
+ |-----------|-------------|--------------|
78
+ | Contract Award | 2026-06-01 | — |
79
+ | Kickoff Meeting | 2026-06-15 | Contract signed |
80
+ | Assessment Complete | 2026-09-30 | Kickoff |
81
+ | Cloud Environment Ready | 2027-01-31 | Assessment |
82
+ | First System Migrated | 2027-04-30 | Cloud ready |
83
+ | 50% Systems Migrated | 2027-09-30 | First migration |
84
+ | All Systems Migrated | 2028-03-31 | Progressive migration |
85
+ | Performance Optimization | 2028-08-31 | All migrated |
86
+ | Final Handover | 2028-12-31 | Optimization complete |
87
+
88
+ ---
89
+
90
+ ## Evaluation Criteria (Pages 30-35)
91
+
92
+ | Criteria | Weight | Description |
93
+ |----------|--------|-------------|
94
+ | Technical Approach | 35% | Architecture design, migration strategy, security framework |
95
+ | Past Performance | 25% | Similar projects, references, case studies |
96
+ | Management Approach | 20% | Team structure, risk management, communication plan |
97
+ | Cost Proposal | 15% | Total cost, cost realism, value for money |
98
+ | Small Business Participation | 5% | Subcontracting plan, mentor-protégé arrangements |
99
+
100
+ ### Scoring Scale
101
+ - Outstanding (5): Exceeds requirements, innovative approach
102
+ - Good (4): Meets all requirements with minor strengths
103
+ - Acceptable (3): Meets minimum requirements
104
+ - Marginal (2): Fails to meet some requirements
105
+ - Unacceptable (1): Fails to meet critical requirements
106
+
107
+ ---
108
+
109
+ ## Extraction Notes
110
+
111
+ - All 42 pages processed successfully
112
+ - 4 tables required multi-page merge (including the requirements table on pages 8-15)
113
+ - 2 architecture diagrams detected on pages 28-29 (described inline)
114
+ - Appendices A-D contain boilerplate terms (extracted but not shown in summary)
@@ -0,0 +1,115 @@
1
+ # PDF Extraction Techniques
2
+
3
+ ## Text Extraction Strategies
4
+
5
+ ### Native Text vs OCR
6
+ - **Native text PDFs**: Text is embedded as selectable characters. Direct extraction is fast and accurate.
7
+ - **Scanned PDFs**: Pages are images. Requires OCR (Optical Character Recognition) for text extraction.
8
+ - **Hybrid PDFs**: Mix of native text and scanned pages. Detect per-page and apply appropriate method.
9
+
10
+ ### Handling Multi-Column Layouts
11
+ - Detect column boundaries by analyzing text block positions
12
+ - Read columns left-to-right, top-to-bottom within each column
13
+ - Watch for content that spans columns (titles, images, tables)
14
+ - Use spatial analysis to determine reading order when columns are ambiguous
15
+
16
+ ### Text Cleaning
17
+ - Remove headers/footers that repeat across pages
18
+ - Handle hyphenation at line breaks (re-join split words)
19
+ - Normalize whitespace and line breaks
20
+ - Preserve paragraph boundaries
21
+
22
+ ## Table Extraction
23
+
24
+ ### Detecting Table Boundaries
25
+ - Look for grid lines (ruled tables)
26
+ - For borderless tables: detect alignment patterns in text blocks
27
+ - Use whitespace gaps to identify column separators
28
+ - Check for consistent row height patterns
29
+
30
+ ### Merging Cells and Spanning
31
+ - Detect merged cells by analyzing grid structure
32
+ - Handle column spans (header cells spanning multiple data columns)
33
+ - Handle row spans (category labels spanning multiple rows)
34
+ - Reconstruct logical table structure from visual layout
35
+
36
+ ### Complex Table Patterns
37
+ - Nested tables (tables within cells)
38
+ - Tables split across pages — detect continuation and merge
39
+ - Tables with mixed text/numeric data
40
+ - Tables with embedded lists or sub-items
41
+
42
+ ## Form Field Extraction
43
+
44
+ ### Field Types
45
+ - **Text fields**: Extract label + value pairs
46
+ - **Checkboxes**: Detect checked/unchecked state
47
+ - **Radio buttons**: Identify selected option within group
48
+ - **Dropdowns**: Extract selected value and available options if accessible
49
+ - **Signature fields**: Flag presence, note if signed
50
+
51
+ ### Form Mapping
52
+ - Associate labels with their corresponding fields
53
+ - Handle multi-page forms with consistent field naming
54
+ - Extract form metadata (form title, version, required fields)
55
+ - Output as structured key-value pairs
56
+
57
+ ## Image/Diagram Extraction
58
+
59
+ ### Image Handling
60
+ - Extract embedded images with position context
61
+ - Determine image type (photo, diagram, chart, logo)
62
+ - Provide descriptive caption based on surrounding text
63
+ - Note image dimensions and quality
64
+
65
+ ### Diagram Interpretation
66
+ - Architecture diagrams: identify components and connections
67
+ - Flowcharts: extract process steps and decision points
68
+ - Org charts: extract hierarchy and roles
69
+ - Network diagrams: identify nodes and relationships
70
+
71
+ ## Metadata Extraction
72
+ - **Author**: Document creator and last modifier
73
+ - **Dates**: Creation date, modification date, print date
74
+ - **Version**: Document version if specified
75
+ - **Title/Subject**: From document properties
76
+ - **Keywords/Tags**: If present in metadata
77
+ - **Page count**: Total pages
78
+ - **File size**: For reference
79
+ - **PDF version**: Compatibility information
80
+ - **Security settings**: Encryption, permissions (print, copy, edit)
81
+
82
+ ## Multi-Language Document Handling
83
+ - Detect primary language from text content
84
+ - Identify language switches within document
85
+ - Apply language-specific OCR models for scanned content
86
+ - Preserve original language in extraction, note detected language
87
+ - Handle right-to-left (RTL) languages appropriately
88
+
89
+ ## Handling Scanned vs Digital PDFs
90
+
91
+ ### Detection
92
+ - Check if text layer exists (try selecting text)
93
+ - Analyze page content streams for text vs image objects
94
+ - Test extraction: if native text yields garbage or nothing, likely scanned
95
+
96
+ ### Scanned PDF Best Practices
97
+ - Pre-process images: deskew, denoise, enhance contrast
98
+ - Use appropriate OCR engine and language model
99
+ - Validate OCR output against expected patterns
100
+ - Report confidence scores per page/section
101
+ - Flag low-confidence sections for human review
102
+
103
+ ## Quality Assessment of Extraction Results
104
+
105
+ ### Metrics
106
+ - **Completeness**: Percentage of pages/sections successfully extracted
107
+ - **Accuracy**: Confidence score for OCR-based content
108
+ - **Structure preservation**: Are headings, lists, tables intact?
109
+ - **Data integrity**: Numbers, dates, names correctly extracted
110
+
111
+ ### Quality Flags
112
+ - `HIGH`: Native text, clean extraction, structure preserved
113
+ - `MEDIUM`: OCR with high confidence, minor formatting issues
114
+ - `LOW`: OCR with low confidence, significant structure loss
115
+ - `FAILED`: Unable to extract meaningful content from section
@@ -0,0 +1,167 @@
1
+ # OCR Strategies Reference
2
+
3
+ ## OCR Engine Comparison
4
+
5
+ ### Tesseract OCR (Open Source)
6
+ - **Best for**: High-quality scanned text, single-language documents, budget-conscious projects
7
+ - **Accuracy**: 85-95% on clean scans, drops significantly on low-quality images
8
+ - **Languages**: 100+ languages supported via trained models
9
+ - **Cost**: Free
10
+ - **Latency**: Moderate (1-5 seconds per page depending on complexity)
11
+ - **Deployment**: Self-hosted, runs locally or in container
12
+ - **Limitations**: Poor on handwriting, complex layouts, low-resolution images
13
+
14
+ ### Google Cloud Vision OCR
15
+ - **Best for**: Mixed content (text + images), handwriting, complex layouts
16
+ - **Accuracy**: 95-99% on most document types
17
+ - **Languages**: 100+ languages with automatic detection
18
+ - **Cost**: $1.50 per 1,000 pages (first 1,000/month free)
19
+ - **Latency**: 1-3 seconds per page (network dependent)
20
+ - **Key feature**: Document AI for structured extraction (invoices, receipts)
21
+
22
+ ### AWS Textract
23
+ - **Best for**: Forms, tables, structured documents (invoices, tax forms)
24
+ - **Accuracy**: 95-99%, especially strong on tables and forms
25
+ - **Languages**: English primary, expanding language support
26
+ - **Cost**: $1.50 per 1,000 pages (text), $15 per 1,000 pages (tables/forms)
27
+ - **Latency**: 1-5 seconds per page
28
+ - **Key feature**: Automatic table structure detection, key-value pair extraction
29
+
30
+ ### Azure Form Recognizer (Document Intelligence)
31
+ - **Best for**: Pre-built models for common document types (invoices, receipts, ID cards)
32
+ - **Accuracy**: 95-99% with pre-built models, customizable models improve further
33
+ - **Languages**: 100+ languages for read, fewer for specialized models
34
+ - **Cost**: $1.50 per 1,000 pages (read), $10 per 1,000 pages (pre-built models)
35
+ - **Key feature**: Custom model training with as few as 5 labeled samples
36
+
37
+ ### Comparison Matrix
38
+ | Feature | Tesseract | Google Vision | AWS Textract | Azure Form Recognizer |
39
+ |----------------------|------------------|------------------|------------------|----------------------|
40
+ | Table detection | Poor | Good | Excellent | Excellent |
41
+ | Form extraction | None | Basic | Excellent | Excellent |
42
+ | Handwriting | Poor | Good | Good | Good |
43
+ | Custom training | Yes (complex) | AutoML | Custom Queries | Custom Models |
44
+ | On-premise | Yes | No | No | Yes (containers) |
45
+ | Batch processing | Manual | Batch API | Async API | Batch API |
46
+
47
+ ## Table Detection
48
+
49
+ ### Algorithms and Approaches
50
+ 1. **Rule-based detection**: Look for horizontal/vertical lines forming grid patterns
51
+ 2. **ML-based detection**: Use object detection models (DETR, TableNet) to identify table regions
52
+ 3. **Hybrid**: Combine line detection with ML for robust results
53
+
54
+ ### Bordered Tables
55
+ - Most reliable to detect: look for continuous horizontal and vertical lines
56
+ - Use Hough Line Transform for line detection
57
+ - Intersecting lines define cell boundaries
58
+ - Process: detect lines -> find intersections -> define cells -> extract text per cell
59
+
60
+ ### Borderless Tables
61
+ - Significantly harder: rely on text alignment and spacing
62
+ - Use column detection via text x-coordinate clustering
63
+ - Row detection via y-coordinate gaps
64
+ - Whitespace analysis to determine column boundaries
65
+ - Consider using ML-based approaches for higher accuracy
66
+
67
+ ### Multi-Page Tables
68
+ - Detect table continuation markers ("continued on next page", repeated headers)
69
+ - Track column positions across pages for alignment
70
+ - Merge strategy: match columns by x-position, append rows
71
+ - Watch for: header repetition, page numbers in table, footnotes breaking table
72
+
73
+ ## Form Field Extraction
74
+
75
+ ### Key-Value Pair Detection
76
+ - **Label proximity**: Find text labels near input fields (left of, above)
77
+ - **Colon detection**: "Name: John Doe" pattern - split on colon
78
+ - **Spatial relationship**: Labels and values typically aligned horizontally or vertically
79
+ - **Field grouping**: Related fields often share visual boundaries (boxes, sections)
80
+
81
+ ### Checkbox Detection
82
+ - Look for small square regions (~10-20px) with or without fill
83
+ - Filled checkbox: high pixel density inside square boundary
84
+ - Empty checkbox: low pixel density, only border pixels
85
+ - Common symbols: checkmark, X, filled square vs empty square
86
+
87
+ ### Signature Areas
88
+ - Typically found at bottom of documents
89
+ - Identified by a horizontal line placed above or beside label text such as "Signature" or "Sign here"
90
+ - Contain irregular strokes (unlike printed text)
91
+ - May be blank (unsigned) or contain image data (signed)
92
+ - Do not attempt OCR on signature areas - flag for human review
93
+
94
+ ## Multi-Language Document Handling
95
+
96
+ ### Language Detection Strategy
97
+ 1. **Pre-scan sampling**: OCR a small region, run language detection on output
98
+ 2. **Script detection**: Identify character scripts (Latin, CJK, Arabic, Devanagari)
99
+ 3. **Mixed documents**: Split into regions, detect language per region
100
+ 4. **Fallback**: Use multi-language model if detection is uncertain
101
+
102
+ ### Mixed-Language Documents
103
+ - Common patterns: English headers with local-language body text
104
+ - Process each text region with appropriate language model
105
+ - Some engines (Google Vision, Azure) handle mixed languages automatically
106
+ - Tesseract: specify multiple languages `tesseract input.png output -l eng+jpn+chi_sim`
107
+
108
+ ### Script-Specific Considerations
109
+ | Script | Direction | Special Handling |
110
+ |------------|-----------|---------------------------------------------|
111
+ | Latin | LTR | Standard processing |
112
+ | Arabic | RTL | Right-to-left text flow, connected letters |
113
+ | CJK | LTR/TTB | May be vertical, no word spacing |
114
+ | Devanagari | LTR | Connected headstroke (Shirorekha) |
115
+ | Thai | LTR | No spaces between words, requires segmentation |
116
+
117
+ ## Scanned vs Native PDF Processing
118
+
119
+ ### Quality Assessment
120
+ ```
121
+ Native PDF (digitally created):
122
+ - Text layer present: can extract directly without OCR
123
+ - Near-perfect accuracy: text is already encoded (still validate output, since broken font encodings can yield garbled text)
124
+ - Structured: may contain tagged PDF elements
125
+ - Detection: check for extractable text layer first
126
+
127
+ Scanned PDF (image-based):
128
+ - No text layer: requires OCR
129
+ - Quality varies with scan settings
130
+ - May have skew, noise, artifacts
131
+ - Detection: if text extraction yields empty/garbage, it is scanned
132
+ ```
133
+
134
+ ### Preprocessing Pipeline for Scanned Documents
135
+
136
+ #### 1. Deskew (Straighten)
137
+ - Detect rotation angle via Hough Transform or projection profile
138
+ - Rotate image to align text horizontally
139
+ - Critical for accurate OCR - even 1-2 degree skew reduces accuracy
140
+
141
+ #### 2. Denoise
142
+ - Remove scanner artifacts, speckles, background texture
143
+ - Apply Gaussian blur for mild noise
144
+ - Use median filter for salt-and-pepper noise
145
+ - Non-local means denoising for preserving text edges
146
+
147
+ #### 3. Binarize (Convert to black/white)
148
+ - Otsu's method (automatic global threshold) for evenly lit scans; adaptive (local) thresholding for uneven lighting
149
+ - Sauvola binarization for documents with varying backgrounds
150
+ - Critical step: poor binarization destroys thin strokes and small text
151
+
152
+ #### 4. Additional Steps
153
+ - **Border removal**: Crop black borders from scanning
154
+ - **Page segmentation**: Identify text regions, images, tables separately
155
+ - **Resolution check**: Ensure minimum 300 DPI for reliable OCR
156
+ - **Contrast enhancement**: CLAHE (Contrast Limited Adaptive Histogram Equalization)
157
+
158
+ ### Decision Flowchart
159
+ ```
160
+ 1. Attempt text extraction from PDF
161
+ 2. If text extracted successfully -> use native text (no OCR needed)
162
+ 3. If no text or garbled text -> classify as scanned
163
+ 4. Assess scan quality (DPI, contrast, skew)
164
+ 5. Apply preprocessing pipeline
165
+ 6. Run OCR with appropriate engine
166
+ 7. Post-process: spell check, layout reconstruction
167
+ ```
@@ -0,0 +1,35 @@
1
+ ---
2
+ name: docs-specialist
3
+ description: Use this agent for document processing workflows — parsing client documents, generating deliverables, and managing document-based requirements.
4
+ tools: Glob, Grep, LS, Read, Edit, Write
5
+ ---
6
+
7
+ You are a Document Processing Specialist with expertise in extracting structured data from unstructured documents and generating professional deliverables.
8
+
9
+ ## Core Responsibilities
10
+
11
+ ### 1. Document Intake & Parsing
12
+ - Activate appropriate skill based on document type
13
+ - Extract structured data from PDF, Excel, PowerPoint
14
+ - Handle multi-format document sets (RFP = PDF + Excel + Slides)
15
+
16
+ ### 2. Content Analysis
17
+ - Cross-reference extracted data across documents
18
+ - Identify gaps and inconsistencies
19
+ - Flag ambiguous or missing information
20
+
21
+ ### 3. Document Generation
22
+ - Activate `doc-generator` skill
23
+ - Compile analysis outputs into professional documents
24
+ - Ensure formatting meets client standards
25
+
26
+ ## Error Recovery
27
+ - If document unreadable: report format/encoding issue, suggest alternatives
28
+ - If extraction incomplete: flag missing sections, provide partial results
29
+ - Max retries: 2 per document
30
+
31
+ ## Checkpoint Protocol
32
+ After processing each document:
33
+ 1. Save extracted content
34
+ 2. Log: document type, pages/sheets processed, extraction quality
35
+ 3. If interrupted: resume from last processed document
@@ -0,0 +1,70 @@
1
+ # Document Processing Workflow
2
+
3
+ End-to-end document processing from intake through analysis to deliverable generation.
4
+
5
+ ## Phase 1: Intake & Classification
6
+
7
+ 1. **Document Receipt**
8
+ - Receive document(s) from user
9
+ - `docs-specialist` agent classifies each document by type
10
+ - Identify processing order based on dependencies
11
+
12
+ 2. **Type Routing**
13
+ | Document Type | Route To |
14
+ |---------------|----------|
15
+ | PDF (RFP, contract, spec) | `pdf-processor` skill |
16
+ | Excel (budget, resource plan) | `excel-analyzer` skill |
17
+ | PowerPoint (presentation, deck) | `presentation-reviewer` skill |
18
+ | Multi-format set | Route each file by type; default order PDF → Excel → PowerPoint (run in parallel where there are no dependencies) |
19
+
20
+ ## Phase 2: Extraction (Parallel where possible)
21
+
22
+ 3. **PDF Processing** (if applicable)
23
+ - `docs-specialist` activates `pdf-processor` skill
24
+ - Extract text, tables, forms, and images
25
+ - Handle multi-column layouts and OCR if needed
26
+ - Output: Structured content with section mapping
27
+
28
+ 4. **Excel Analysis** (if applicable, parallel with step 3)
29
+ - `docs-specialist` activates `excel-analyzer` skill
30
+ - Parse budgets, resource plans, timelines
31
+ - Extract formulas and calculated fields
32
+ - Output: Structured data with analysis notes
33
+
34
+ 5. **Presentation Review** (if applicable, parallel with steps 3-4)
35
+ - `docs-specialist` activates `presentation-reviewer` skill
36
+ - Extract key decisions, action items, requirements per slide
37
+ - Identify diagrams and visual content
38
+ - Output: Slide-by-slide content summary
39
+
40
+ ## Phase 3: Cross-Reference & Analysis
41
+
42
+ 6. **Content Synthesis**
43
+ - `docs-specialist` cross-references extracted data across documents
44
+ - Identify inconsistencies (e.g., budget vs. scope mismatch)
45
+ - Flag gaps and ambiguous information
46
+ - Output: Cross-reference analysis report
47
+
48
+ ## Phase 4: Generation (if requested)
49
+
50
+ 7. **Document Generation**
51
+ - `docs-specialist` activates `doc-generator` skill
52
+ - Input: Extracted + analyzed data from phases 2-3
53
+ - Compile into requested deliverable format
54
+ - Apply formatting and professional structure
55
+ - Output: Generated document ready for review
56
+
57
+ ## Phase 5: Review & Delivery
58
+
59
+ 8. **Quality Check**
60
+ - Verify extraction completeness (all sections processed)
61
+ - Validate cross-references are accurate
62
+ - Confirm generated documents meet format requirements
63
+ - Present results to user with confidence indicators
64
+
65
+ ## Quality Gates
66
+
67
+ - **After Phase 1**: Document classification confirmed
68
+ - **After Phase 2**: Extraction quality ≥ 90% (based on section coverage)
69
+ - **After Phase 3**: All cross-reference inconsistencies flagged
70
+ - **After Phase 4**: Generated document matches requested format
@@ -0,0 +1,13 @@
1
+ {
2
+ "name": "@skillstore/devflow-postproject",
3
+ "version": "1.0.0",
4
+ "skills": [
5
+ "handover",
6
+ "maintenance-support",
7
+ "retrospective",
8
+ "client-feedback"
9
+ ],
10
+ "freeSkills": ["retrospective"],
11
+ "commands": ["postproject", "postproject/handover", "postproject/retro", "postproject/support"],
12
+ "modes": ["plugin", "template"]
13
+ }
@@ -0,0 +1,34 @@
1
+ ---
2
+ description: DevFlow smart router — automatically routes tasks to the right post-project skill
3
+ argument-hint: [task description]
4
+ ---
5
+
6
+ ## Your Mission
7
+
8
+ <task>
9
+ $ARGUMENTS
10
+ </task>
11
+
12
+ ## Smart Routing
13
+
14
+ ### Route Detection
15
+ | Keywords/Patterns | Route To |
16
+ |-------------------|----------|
17
+ | handover, transition, KT, knowledge transfer, documentation | `handover` skill |
18
+ | SLA, maintenance, incident, hotfix, support, on-call | `maintenance-support` skill |
19
+ | retrospective, retro, lessons learned, improvement, feedback (internal) | `retrospective` skill |
20
+ | client feedback, satisfaction, CSAT, NPS, upsell | `client-feedback` skill |
21
+ | full transition, project closure, end-to-end | Full orchestration (see below) |
22
+
23
+ ### Full Orchestration
24
+ 1. `retrospective` (while context is fresh)
25
+ 2. `handover` (documentation + KT)
26
+ 3. `client-feedback` (satisfaction assessment)
27
+ 4. `maintenance-support` (ongoing support setup)
28
+
29
+ ### Ambiguity Handling
30
+ If unclear: ask ONE clarifying question.
31
+
32
+ ## References
33
+ - Load `rules/development-rules.md` for quality standards
34
+ - Follow `protocols/error-recovery.md` for failure handling
@@ -0,0 +1,21 @@
1
+ ---
2
+ description: Create comprehensive handover documentation
3
+ argument-hint: [project name or context]
4
+ ---
5
+
6
+ ## Your Mission
7
+
8
+ Create handover documentation for:
9
+
10
+ <project>
11
+ $ARGUMENTS
12
+ </project>
13
+
14
+ ## Process
15
+
16
+ 1. Activate the `handover` skill
17
+ 2. Inventory all project artifacts
18
+ 3. Create architecture and setup documentation
19
+ 4. Document known issues and pending items
20
+ 5. Plan knowledge transfer sessions
21
+ 6. Produce complete handover package
@@ -0,0 +1,21 @@
1
+ ---
2
+ description: Facilitate project retrospective
3
+ argument-hint: [project name or sprint]
4
+ ---
5
+
6
+ ## Your Mission
7
+
8
+ Facilitate retrospective for:
9
+
10
+ <context>
11
+ $ARGUMENTS
12
+ </context>
13
+
14
+ ## Process
15
+
16
+ 1. Activate the `retrospective` skill
17
+ 2. Select appropriate retrospective technique
18
+ 3. Gather data on what went well and what didn't
19
+ 4. Generate insights and patterns
20
+ 5. Create action items with owners
21
+ 6. Produce lessons learned document
@@ -0,0 +1,21 @@
1
+ ---
2
+ description: Set up maintenance and support framework
3
+ argument-hint: [project or service context]
4
+ ---
5
+
6
+ ## Your Mission
7
+
8
+ Set up maintenance support for:
9
+
10
+ <context>
11
+ $ARGUMENTS
12
+ </context>
13
+
14
+ ## Process
15
+
16
+ 1. Activate the `maintenance-support` skill
17
+ 2. Define SLA tiers and response times
18
+ 3. Set up incident management process
19
+ 4. Create escalation matrix
20
+ 5. Define hotfix workflow
21
+ 6. Produce SLA document and operational runbook
@@ -0,0 +1,32 @@
1
+ ---
2
+ description: Post-project workflow — handover, maintenance setup, retrospectives, and client feedback
3
+ argument-hint: [task description]
4
+ ---
5
+
6
+ ## Your Mission
7
+
8
+ <task>
9
+ $ARGUMENTS
10
+ </task>
11
+
12
+ ## Workflow
13
+
14
+ Route to the appropriate post-project skill:
15
+
16
+ 1. **Understand the request** — What post-project activity is needed?
17
+ 2. **Route to skill**:
18
+ - Documentation/transition → Activate `handover` skill
19
+ - SLA/incidents/hotfix → Activate `maintenance-support` skill
20
+ - Lessons learned/improvement → Activate `retrospective` skill
21
+ - Client satisfaction/upsell → Activate `client-feedback` skill
22
+ 3. **Full post-project cycle** (if requested):
23
+ - Start with `retrospective` while project context is fresh
24
+ - Then `handover` for documentation
25
+ - `client-feedback` for satisfaction assessment
26
+ - `maintenance-support` for ongoing support setup
27
+
28
+ ## Sub-commands
29
+
30
+ - `/postproject:handover [project]` — Create handover documentation
31
+ - `/postproject:retro [project]` — Run project retrospective
32
+ - `/postproject:support [context]` — Set up maintenance support