mega-brain-ai 1.3.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (510)
  1. package/.antigravity/README.md +46 -0
  2. package/.antigravity/rules/.gitkeep +0 -0
  3. package/.antigravity/rules/mega-brain.md +39 -0
  4. package/.claude/CLAUDE.md +172 -0
  5. package/.claude/agents.yaml +44 -0
  6. package/.claude/commands/agents.md +161 -0
  7. package/.claude/commands/ask.md +117 -0
  8. package/.claude/commands/benchmark.md +224 -0
  9. package/.claude/commands/chat.md +343 -0
  10. package/.claude/commands/compare.md +116 -0
  11. package/.claude/commands/conclave.md +196 -0
  12. package/.claude/commands/config.md +133 -0
  13. package/.claude/commands/create-agent.md +467 -0
  14. package/.claude/commands/debate.md +159 -0
  15. package/.claude/commands/documentation/create-architecture-documentation.md +175 -0
  16. package/.claude/commands/dossiers.md +180 -0
  17. package/.claude/commands/evolve.md +223 -0
  18. package/.claude/commands/extract-dna.md +172 -0
  19. package/.claude/commands/extract-knowledge.md +507 -0
  20. package/.claude/commands/gsd/add-phase.md +43 -0
  21. package/.claude/commands/gsd/add-tests.md +41 -0
  22. package/.claude/commands/gsd/add-todo.md +47 -0
  23. package/.claude/commands/gsd/audit-milestone.md +36 -0
  24. package/.claude/commands/gsd/check-todos.md +45 -0
  25. package/.claude/commands/gsd/cleanup.md +18 -0
  26. package/.claude/commands/gsd/complete-milestone.md +136 -0
  27. package/.claude/commands/gsd/debug.md +167 -0
  28. package/.claude/commands/gsd/discuss-phase.md +83 -0
  29. package/.claude/commands/gsd/execute-phase.md +41 -0
  30. package/.claude/commands/gsd/health.md +22 -0
  31. package/.claude/commands/gsd/help.md +22 -0
  32. package/.claude/commands/gsd/insert-phase.md +32 -0
  33. package/.claude/commands/gsd/join-discord.md +18 -0
  34. package/.claude/commands/gsd/list-phase-assumptions.md +46 -0
  35. package/.claude/commands/gsd/map-codebase.md +71 -0
  36. package/.claude/commands/gsd/new-milestone.md +44 -0
  37. package/.claude/commands/gsd/new-project.md +42 -0
  38. package/.claude/commands/gsd/pause-work.md +38 -0
  39. package/.claude/commands/gsd/plan-milestone-gaps.md +34 -0
  40. package/.claude/commands/gsd/plan-phase.md +45 -0
  41. package/.claude/commands/gsd/progress.md +24 -0
  42. package/.claude/commands/gsd/quick.md +41 -0
  43. package/.claude/commands/gsd/reapply-patches.md +110 -0
  44. package/.claude/commands/gsd/remove-phase.md +31 -0
  45. package/.claude/commands/gsd/research-phase.md +189 -0
  46. package/.claude/commands/gsd/resume-work.md +40 -0
  47. package/.claude/commands/gsd/set-profile.md +34 -0
  48. package/.claude/commands/gsd/settings.md +36 -0
  49. package/.claude/commands/gsd/update.md +37 -0
  50. package/.claude/commands/gsd/verify-work.md +38 -0
  51. package/.claude/commands/inbox.md +296 -0
  52. package/.claude/commands/ingest-empresa.md +191 -0
  53. package/.claude/commands/ingest.md +183 -0
  54. package/.claude/commands/jarvis-briefing.md +67 -0
  55. package/.claude/commands/jarvis-control.md +169 -0
  56. package/.claude/commands/jarvis-full.md +182 -0
  57. package/.claude/commands/jarvis.md +212 -0
  58. package/.claude/commands/ler-drive.md +212 -0
  59. package/.claude/commands/log.md +158 -0
  60. package/.claude/commands/loop.md +133 -0
  61. package/.claude/commands/loops.md +73 -0
  62. package/.claude/commands/mission-autopilot.md +538 -0
  63. package/.claude/commands/mission.md +353 -0
  64. package/.claude/commands/process-inbox.md +148 -0
  65. package/.claude/commands/process-jarvis.md +3036 -0
  66. package/.claude/commands/process-video.md +131 -0
  67. package/.claude/commands/rag-search.md +78 -0
  68. package/.claude/commands/resume.md +33 -0
  69. package/.claude/commands/save.md +38 -0
  70. package/.claude/commands/scan-inbox.md +125 -0
  71. package/.claude/commands/setup.md +99 -0
  72. package/.claude/commands/system-digest.md +243 -0
  73. package/.claude/commands/verify.md +182 -0
  74. package/.claude/commands/view-dna.md +169 -0
  75. package/.claude/get-shit-done/VERSION +1 -0
  76. package/.claude/get-shit-done/bin/gsd-tools.cjs +588 -0
  77. package/.claude/get-shit-done/bin/lib/commands.cjs +553 -0
  78. package/.claude/get-shit-done/bin/lib/config.cjs +162 -0
  79. package/.claude/get-shit-done/bin/lib/core.cjs +411 -0
  80. package/.claude/get-shit-done/bin/lib/frontmatter.cjs +299 -0
  81. package/.claude/get-shit-done/bin/lib/init.cjs +710 -0
  82. package/.claude/get-shit-done/bin/lib/milestone.cjs +216 -0
  83. package/.claude/get-shit-done/bin/lib/phase.cjs +871 -0
  84. package/.claude/get-shit-done/bin/lib/roadmap.cjs +298 -0
  85. package/.claude/get-shit-done/bin/lib/state.cjs +679 -0
  86. package/.claude/get-shit-done/bin/lib/template.cjs +222 -0
  87. package/.claude/get-shit-done/bin/lib/verify.cjs +773 -0
  88. package/.claude/get-shit-done/references/checkpoints.md +776 -0
  89. package/.claude/get-shit-done/references/continuation-format.md +249 -0
  90. package/.claude/get-shit-done/references/decimal-phase-calculation.md +65 -0
  91. package/.claude/get-shit-done/references/git-integration.md +248 -0
  92. package/.claude/get-shit-done/references/git-planning-commit.md +38 -0
  93. package/.claude/get-shit-done/references/model-profile-resolution.md +34 -0
  94. package/.claude/get-shit-done/references/model-profiles.md +92 -0
  95. package/.claude/get-shit-done/references/phase-argument-parsing.md +61 -0
  96. package/.claude/get-shit-done/references/planning-config.md +196 -0
  97. package/.claude/get-shit-done/references/questioning.md +145 -0
  98. package/.claude/get-shit-done/references/tdd.md +263 -0
  99. package/.claude/get-shit-done/references/ui-brand.md +160 -0
  100. package/.claude/get-shit-done/references/verification-patterns.md +612 -0
  101. package/.claude/get-shit-done/templates/DEBUG.md +164 -0
  102. package/.claude/get-shit-done/templates/UAT.md +247 -0
  103. package/.claude/get-shit-done/templates/VALIDATION.md +76 -0
  104. package/.claude/get-shit-done/templates/codebase/architecture.md +255 -0
  105. package/.claude/get-shit-done/templates/codebase/concerns.md +310 -0
  106. package/.claude/get-shit-done/templates/codebase/conventions.md +307 -0
  107. package/.claude/get-shit-done/templates/codebase/integrations.md +280 -0
  108. package/.claude/get-shit-done/templates/codebase/stack.md +186 -0
  109. package/.claude/get-shit-done/templates/codebase/structure.md +285 -0
  110. package/.claude/get-shit-done/templates/codebase/testing.md +480 -0
  111. package/.claude/get-shit-done/templates/config.json +37 -0
  112. package/.claude/get-shit-done/templates/context.md +283 -0
  113. package/.claude/get-shit-done/templates/continue-here.md +78 -0
  114. package/.claude/get-shit-done/templates/debug-subagent-prompt.md +91 -0
  115. package/.claude/get-shit-done/templates/discovery.md +146 -0
  116. package/.claude/get-shit-done/templates/milestone-archive.md +123 -0
  117. package/.claude/get-shit-done/templates/milestone.md +115 -0
  118. package/.claude/get-shit-done/templates/phase-prompt.md +569 -0
  119. package/.claude/get-shit-done/templates/planner-subagent-prompt.md +117 -0
  120. package/.claude/get-shit-done/templates/project.md +184 -0
  121. package/.claude/get-shit-done/templates/requirements.md +231 -0
  122. package/.claude/get-shit-done/templates/research-project/ARCHITECTURE.md +204 -0
  123. package/.claude/get-shit-done/templates/research-project/FEATURES.md +147 -0
  124. package/.claude/get-shit-done/templates/research-project/PITFALLS.md +200 -0
  125. package/.claude/get-shit-done/templates/research-project/STACK.md +120 -0
  126. package/.claude/get-shit-done/templates/research-project/SUMMARY.md +170 -0
  127. package/.claude/get-shit-done/templates/research.md +552 -0
  128. package/.claude/get-shit-done/templates/retrospective.md +54 -0
  129. package/.claude/get-shit-done/templates/roadmap.md +202 -0
  130. package/.claude/get-shit-done/templates/state.md +176 -0
  131. package/.claude/get-shit-done/templates/summary-complex.md +59 -0
  132. package/.claude/get-shit-done/templates/summary-minimal.md +41 -0
  133. package/.claude/get-shit-done/templates/summary-standard.md +48 -0
  134. package/.claude/get-shit-done/templates/summary.md +248 -0
  135. package/.claude/get-shit-done/templates/user-setup.md +311 -0
  136. package/.claude/get-shit-done/templates/verification-report.md +322 -0
  137. package/.claude/get-shit-done/workflows/add-phase.md +111 -0
  138. package/.claude/get-shit-done/workflows/add-tests.md +350 -0
  139. package/.claude/get-shit-done/workflows/add-todo.md +157 -0
  140. package/.claude/get-shit-done/workflows/audit-milestone.md +297 -0
  141. package/.claude/get-shit-done/workflows/check-todos.md +176 -0
  142. package/.claude/get-shit-done/workflows/cleanup.md +152 -0
  143. package/.claude/get-shit-done/workflows/complete-milestone.md +763 -0
  144. package/.claude/get-shit-done/workflows/diagnose-issues.md +219 -0
  145. package/.claude/get-shit-done/workflows/discovery-phase.md +289 -0
  146. package/.claude/get-shit-done/workflows/discuss-phase.md +542 -0
  147. package/.claude/get-shit-done/workflows/execute-phase.md +449 -0
  148. package/.claude/get-shit-done/workflows/execute-plan.md +448 -0
  149. package/.claude/get-shit-done/workflows/health.md +156 -0
  150. package/.claude/get-shit-done/workflows/help.md +489 -0
  151. package/.claude/get-shit-done/workflows/insert-phase.md +129 -0
  152. package/.claude/get-shit-done/workflows/list-phase-assumptions.md +178 -0
  153. package/.claude/get-shit-done/workflows/map-codebase.md +315 -0
  154. package/.claude/get-shit-done/workflows/new-milestone.md +382 -0
  155. package/.claude/get-shit-done/workflows/new-project.md +1116 -0
  156. package/.claude/get-shit-done/workflows/pause-work.md +122 -0
  157. package/.claude/get-shit-done/workflows/plan-milestone-gaps.md +274 -0
  158. package/.claude/get-shit-done/workflows/plan-phase.md +569 -0
  159. package/.claude/get-shit-done/workflows/progress.md +381 -0
  160. package/.claude/get-shit-done/workflows/quick.md +453 -0
  161. package/.claude/get-shit-done/workflows/remove-phase.md +154 -0
  162. package/.claude/get-shit-done/workflows/research-phase.md +73 -0
  163. package/.claude/get-shit-done/workflows/resume-project.md +306 -0
  164. package/.claude/get-shit-done/workflows/set-profile.md +80 -0
  165. package/.claude/get-shit-done/workflows/settings.md +213 -0
  166. package/.claude/get-shit-done/workflows/transition.md +544 -0
  167. package/.claude/get-shit-done/workflows/update.md +219 -0
  168. package/.claude/get-shit-done/workflows/verify-phase.md +242 -0
  169. package/.claude/get-shit-done/workflows/verify-work.md +569 -0
  170. package/.claude/gsd-file-manifest.json +144 -0
  171. package/.claude/hooks/agent_creation_trigger.py +168 -0
  172. package/.claude/hooks/agent_index_updater.py +255 -0
  173. package/.claude/hooks/agent_memory_persister.py +203 -0
  174. package/.claude/hooks/claude_md_agent_sync.py +162 -0
  175. package/.claude/hooks/claude_md_guard.py +154 -0
  176. package/.claude/hooks/continuous_save.py +414 -0
  177. package/.claude/hooks/creation_validator.py +360 -0
  178. package/.claude/hooks/enforce_dual_location.py +501 -0
  179. package/.claude/hooks/enforce_plan_mode.py +220 -0
  180. package/.claude/hooks/gsd-check-update.js +62 -0
  181. package/.claude/hooks/gsd-context-monitor.js +122 -0
  182. package/.claude/hooks/gsd-statusline.js +108 -0
  183. package/.claude/hooks/inbox_age_alert.py +367 -0
  184. package/.claude/hooks/ledger_updater.py +303 -0
  185. package/.claude/hooks/memory_hints_injector.py +251 -0
  186. package/.claude/hooks/memory_updater.py +202 -0
  187. package/.claude/hooks/notification_system.py +115 -0
  188. package/.claude/hooks/pending_tracker.py +188 -0
  189. package/.claude/hooks/pipeline_checkpoint.py +583 -0
  190. package/.claude/hooks/post_batch_cascading.py +1740 -0
  191. package/.claude/hooks/post_tool_use.py +120 -0
  192. package/.claude/hooks/quality_watchdog.py +394 -0
  193. package/.claude/hooks/ralph_wiggum.py +286 -0
  194. package/.claude/hooks/session-source-sync.py +223 -0
  195. package/.claude/hooks/session_autosave_v2.py +1135 -0
  196. package/.claude/hooks/session_end.py +203 -0
  197. package/.claude/hooks/session_start.py +939 -0
  198. package/.claude/hooks/skill_indexer.py +48 -0
  199. package/.claude/hooks/skill_router.py +358 -0
  200. package/.claude/hooks/stop_hook_completeness.py +187 -0
  201. package/.claude/hooks/user_prompt_submit.py +125 -0
  202. package/.claude/package.json +1 -0
  203. package/.claude/rules/ANTHROPIC-STANDARDS.md +384 -0
  204. package/.claude/rules/CLAUDE-LITE.md +201 -0
  205. package/.claude/rules/RULE-GROUP-1.md +320 -0
  206. package/.claude/rules/RULE-GROUP-2.md +307 -0
  207. package/.claude/rules/RULE-GROUP-3.md +248 -0
  208. package/.claude/rules/RULE-GROUP-4.md +427 -0
  209. package/.claude/rules/RULE-GROUP-5.md +388 -0
  210. package/.claude/rules/RULE-GROUP-6.md +387 -0
  211. package/.claude/rules/RULE-GSD-MANDATORY.md +106 -0
  212. package/.claude/rules/agent-cognition.md +779 -0
  213. package/.claude/rules/agent-integrity.md +692 -0
  214. package/.claude/rules/epistemic-standards.md +333 -0
  215. package/.claude/rules/logging.md +53 -0
  216. package/.claude/rules/mcp-governance.md +128 -0
  217. package/.claude/rules/pipeline.md +60 -0
  218. package/.claude/rules/state-management.md +93 -0
  219. package/.claude/scripts/apply-tags.py +77 -0
  220. package/.claude/scripts/batch-extract-transcriptions.py +132 -0
  221. package/.claude/scripts/build-complete-index.py +250 -0
  222. package/.claude/scripts/build-planilha-index.py +170 -0
  223. package/.claude/scripts/complete-tag-matching.py +250 -0
  224. package/.claude/scripts/deduplicate-inbox.py +139 -0
  225. package/.claude/scripts/docx-xml-extractor.py +141 -0
  226. package/.claude/scripts/extract-docx-text.py +58 -0
  227. package/.claude/scripts/extract-single-transcription.py +74 -0
  228. package/.claude/scripts/extract_docx_from_gdrive.py +77 -0
  229. package/.claude/scripts/jarvis_orchestrator.py +5 -0
  230. package/.claude/scripts/organized-downloader.py +246 -0
  231. package/.claude/scripts/planilha-tagger.py +187 -0
  232. package/.claude/scripts/revert-tags.py +70 -0
  233. package/.claude/scripts/source-sync.py +265 -0
  234. package/.claude/scripts/tag-inbox-files.py +276 -0
  235. package/.claude/scripts/tag-inbox-v2.py +253 -0
  236. package/.claude/scripts/test-extraction.py +35 -0
  237. package/.claude/scripts/test-full-extraction.py +74 -0
  238. package/.claude/scripts/validate_cascading_integrity.py +409 -0
  239. package/.claude/settings.json +215 -0
  240. package/.claude/skills/DETECTION-PROTOCOL.md +217 -0
  241. package/.claude/skills/README.md +240 -0
  242. package/.claude/skills/SKILL-REGISTRY.md +283 -0
  243. package/.claude/skills/SKILL-SUGGESTIONS.md +114 -0
  244. package/.claude/skills/_TEMPLATES/SKILL-WRITER-GUIDE.md +385 -0
  245. package/.claude/skills/agent-creation/SKILL.md +374 -0
  246. package/.claude/skills/ask-company/SKILL.md +198 -0
  247. package/.claude/skills/brainstorming/SKILL.md +72 -0
  248. package/.claude/skills/chronicler/SKILL.md +146 -0
  249. package/.claude/skills/chronicler/chronicler_core.py +468 -0
  250. package/.claude/skills/code-review/SKILL.md +160 -0
  251. package/.claude/skills/convert-to-company-docs/SKILL.md +68 -0
  252. package/.claude/skills/convert-to-company-docs/convert.py +532 -0
  253. package/.claude/skills/dispatching-parallel-agents/SKILL.md +193 -0
  254. package/.claude/skills/docs-megabrain/SKILL.md +251 -0
  255. package/.claude/skills/executing-plans/SKILL.md +114 -0
  256. package/.claude/skills/executor/SKILL.md +161 -0
  257. package/.claude/skills/fase-2-5-tagging/SKILL.md +182 -0
  258. package/.claude/skills/feature-dev/SKILL.md +154 -0
  259. package/.claude/skills/frontend-design/SKILL.md +165 -0
  260. package/.claude/skills/gdrive-transcription-downloader/SKILL.md +249 -0
  261. package/.claude/skills/gemini-fallback/SKILL.md +67 -0
  262. package/.claude/skills/gemini-fallback/gemini_fetch.py +0 -0
  263. package/.claude/skills/gha/SKILL.md +96 -0
  264. package/.claude/skills/gha/gha_diagnostic.py +227 -0
  265. package/.claude/skills/github-workflow/SKILL.md +190 -0
  266. package/.claude/skills/hookify/SKILL.md +134 -0
  267. package/.claude/skills/hybrid-source-reading/SKILL.md +265 -0
  268. package/.claude/skills/jarvis/SKILL.md +546 -0
  269. package/.claude/skills/jarvis-briefing/SKILL.md +340 -0
  270. package/.claude/skills/knowledge-extraction/SKILL.md +318 -0
  271. package/.claude/skills/ler-planilha/SKILL.md +281 -0
  272. package/.claude/skills/pipeline-jarvis/SKILL.md +430 -0
  273. package/.claude/skills/plugin-dev/SKILL.md +176 -0
  274. package/.claude/skills/pr-review-toolkit/SKILL.md +178 -0
  275. package/.claude/skills/process-company-inbox/SKILL.md +183 -0
  276. package/.claude/skills/python-megabrain/SKILL.md +323 -0
  277. package/.claude/skills/resume/SKILL.md +61 -0
  278. package/.claude/skills/save/SKILL.md +87 -0
  279. package/.claude/skills/skill-creator-internal/SKILL.md +186 -0
  280. package/.claude/skills/skill-writer/SKILL.md +153 -0
  281. package/.claude/skills/skill-writer/examples.md +191 -0
  282. package/.claude/skills/skill-writer/troubleshooting.md +205 -0
  283. package/.claude/skills/smart-download-tagger/SKILL.md +148 -0
  284. package/.claude/skills/source-sync/SKILL.md +240 -0
  285. package/.claude/skills/sync-docs/SKILL.md +193 -0
  286. package/.claude/skills/sync-docs/config.json +37 -0
  287. package/.claude/skills/sync-docs/gdrive_sync.py +358 -0
  288. package/.claude/skills/sync-docs/reauth.py +71 -0
  289. package/.claude/skills/using-superpowers/SKILL.md +105 -0
  290. package/.claude/skills/verification-before-completion/SKILL.md +130 -0
  291. package/.claude/skills/verify/SKILL.md +154 -0
  292. package/.claude/skills/verify/verify_runner.py +0 -0
  293. package/.claude/skills/verify-6-levels/SKILL.md +234 -0
  294. package/.claude/skills/writing-plans/SKILL.md +184 -0
  295. package/.claude/templates/BATCH-LOG-TEMPLATE.md +221 -0
  296. package/.claudeignore +9 -0
  297. package/.cursor/agents.yaml +44 -0
  298. package/.cursor/rules/mega-brain.md +39 -0
  299. package/.gitattributes +19 -0
  300. package/.github/CODEOWNERS +8 -0
  301. package/.github/ISSUE_TEMPLATE/agent.md +96 -0
  302. package/.github/ISSUE_TEMPLATE/bug.md +67 -0
  303. package/.github/ISSUE_TEMPLATE/feature.md +56 -0
  304. package/.github/ISSUE_TEMPLATE/pipeline.md +70 -0
  305. package/.github/PULL_REQUEST_TEMPLATE.md +30 -0
  306. package/.github/assets/banner.svg +152 -0
  307. package/.github/assets/logo-dark.svg +79 -0
  308. package/.github/assets/social-preview.png +0 -0
  309. package/.github/layer1-allowlist.txt +196 -0
  310. package/.github/layer2-manifest.txt +42 -0
  311. package/.github/layer3-manifest.txt +94 -0
  312. package/.github/workflows/claude-code-pr.yml +198 -0
  313. package/.github/workflows/claude-code-review.yml +57 -0
  314. package/.github/workflows/claude.yml +76 -0
  315. package/.github/workflows/publish-pro.yml +72 -0
  316. package/.github/workflows/publish.yml +86 -0
  317. package/.github/workflows/verification.yml +251 -0
  318. package/.gitignore +244 -0
  319. package/.gitleaks.toml +118 -0
  320. package/.windsurf/agents.yaml +44 -0
  321. package/.windsurf/rules/mega-brain.md +39 -0
  322. package/CONTRIBUTING.md +62 -0
  323. package/QUICK-START.md +231 -0
  324. package/README.md +168 -0
  325. package/agents/AGENT-INDEX.yaml +107 -0
  326. package/agents/MASTER-AGENT.md +612 -0
  327. package/agents/README.md +48 -0
  328. package/agents/_templates/INDEX.md +741 -0
  329. package/agents/_templates/TEMPLATE-AGENT-MD-ULTRA-ROBUSTO-V3.md +2399 -0
  330. package/agents/boardroom/CHECKLIST-MASTER.md +281 -0
  331. package/agents/boardroom/INTEGRATION-GUIDE.md +406 -0
  332. package/agents/boardroom/README.md +238 -0
  333. package/agents/boardroom/config/BOARDROOM-CONFIG.md +186 -0
  334. package/agents/boardroom/config/TTS-INTEGRATION.md +258 -0
  335. package/agents/boardroom/config/VOICE-PROFILES.md +624 -0
  336. package/agents/boardroom/scripts/audio_generator.py +375 -0
  337. package/agents/boardroom/scripts/audio_generator_edge.py +353 -0
  338. package/agents/boardroom/scripts/jarvis_boardroom_hook.py +415 -0
  339. package/agents/boardroom/scripts/notebooklm_generator.py +578 -0
  340. package/agents/boardroom/templates/EPISODE-TEMPLATE.md +367 -0
  341. package/agents/boardroom/templates/scene-templates/SCENE-AGENT-DEBATE.md +252 -0
  342. package/agents/boardroom/templates/scene-templates/SCENE-COUNCIL.md +270 -0
  343. package/agents/boardroom/templates/scene-templates/SCENE-DNA-CONSULTATION.md +126 -0
  344. package/agents/boardroom/templates/scene-templates/SCENE-QUESTION.md +174 -0
  345. package/agents/boardroom/workflows/WORKFLOW-AUDIO-GENERATION.md +421 -0
  346. package/agents/conclave/CRITIC.md +197 -0
  347. package/agents/conclave/DEVILS-ADVOCATE.md +274 -0
  348. package/agents/conclave/README.md +35 -0
  349. package/agents/conclave/SYNTHESIZER.md +293 -0
  350. package/agents/conclave/advogado-do-diabo/AGENT.md +502 -0
  351. package/agents/conclave/advogado-do-diabo/SOUL.md +100 -0
  352. package/agents/conclave/critico-metodologico/AGENT.md +683 -0
  353. package/agents/conclave/critico-metodologico/SOUL.md +107 -0
  354. package/agents/conclave/sintetizador/AGENT.md +571 -0
  355. package/agents/conclave/sintetizador/SOUL.md +94 -0
  356. package/agents/constitution/BASE-CONSTITUTION.md +254 -0
  357. package/agents/persona-registry.yaml +300 -0
  358. package/agents/sua-empresa/.gitkeep +0 -0
  359. package/agents/sua-empresa/README.md +44 -0
  360. package/agents/sua-empresa/_example/jds/EXAMPLE-JD.md +42 -0
  361. package/agents/sua-empresa/_example/org/EXAMPLE-ORG.md +32 -0
  362. package/agents/sua-empresa/_example/roles/EXAMPLE-ROLE.md +38 -0
  363. package/artifacts/README.md +11 -0
  364. package/artifacts/canonical/.gitkeep +0 -0
  365. package/artifacts/chunks/.gitkeep +0 -0
  366. package/artifacts/insights/.gitkeep +0 -0
  367. package/artifacts/narratives/.gitkeep +0 -0
  368. package/bin/cli.js +2 -0
  369. package/bin/lib/ascii-art.js +202 -0
  370. package/bin/lib/feature-gate.js +46 -0
  371. package/bin/lib/installer.js +593 -0
  372. package/bin/lib/license.js +59 -0
  373. package/bin/lib/pro-commands.js +75 -0
  374. package/bin/lib/setup-wizard.js +547 -0
  375. package/bin/lib/validate-email.js +113 -0
  376. package/bin/mega-brain.js +136 -0
  377. package/bin/pre-publish-gate.js +229 -0
  378. package/bin/push.js +1056 -0
  379. package/bin/templates/env.example +27 -0
  380. package/bin/utils/pro-detector.js +50 -0
  381. package/bin/validate-package.js +190 -0
  382. package/core/__init__.py +2 -0
  383. package/core/glossary/INDEX.md +63 -0
  384. package/core/glossary/digital.md +243 -0
  385. package/core/glossary/finance.md +49 -0
  386. package/core/glossary/marketing.md +69 -0
  387. package/core/glossary/operations.md +50 -0
  388. package/core/glossary/sales.md +690 -0
  389. package/core/intelligence/__init__.py +41 -0
  390. package/core/intelligence/agent_trigger.py +468 -0
  391. package/core/intelligence/audit_layers.py +491 -0
  392. package/core/intelligence/autonomous_processor.py +796 -0
  393. package/core/intelligence/bootstrap_registry.py +550 -0
  394. package/core/intelligence/business_model_detector.py +476 -0
  395. package/core/intelligence/dossier_trigger.py +336 -0
  396. package/core/intelligence/entity_normalizer.py +565 -0
  397. package/core/intelligence/org_chain_detector.py +411 -0
  398. package/core/intelligence/review_dashboard.py +338 -0
  399. package/core/intelligence/role_detector.py +855 -0
  400. package/core/intelligence/session_autosave.py +46 -0
  401. package/core/intelligence/skill_generator.py +601 -0
  402. package/core/intelligence/sow_generator.py +711 -0
  403. package/core/intelligence/sync_package_files.py +504 -0
  404. package/core/intelligence/task_orchestrator.py +780 -0
  405. package/core/intelligence/theme_analyzer.py +562 -0
  406. package/core/intelligence/tool_discovery.py +432 -0
  407. package/core/intelligence/validate_json_integrity.py +106 -0
  408. package/core/intelligence/validate_layers.py +310 -0
  409. package/core/intelligence/verify_classifications.py +94 -0
  410. package/core/intelligence/viability_scorer.py +592 -0
  411. package/core/jarvis/02-JARVIS-SOUL.md +390 -0
  412. package/core/jarvis/03-JARVIS-DNA.yaml +312 -0
  413. package/core/jarvis/AGENT.md +191 -0
  414. package/core/jarvis/agent-creator/AGENT.md +199 -0
  415. package/core/jarvis/agent-creator/SOUL.md +82 -0
  416. package/core/jarvis/agent-creator/tasks/create-agent.md +133 -0
  417. package/core/jarvis/agent-creator/tasks/sync-agents.md +100 -0
  418. package/core/jarvis/agent-creator/workflows/wf-create-agent.yaml +110 -0
  419. package/core/jarvis/agent-creator/workflows/wf-pipeline-trigger.yaml +111 -0
  420. package/core/jarvis/autonomous/benchmark/AGENT.md +347 -0
  421. package/core/jarvis/autonomous/benchmark/SOUL.md +78 -0
  422. package/core/jarvis/autonomous/critic/AGENT.md +324 -0
  423. package/core/jarvis/autonomous/critic/SOUL.md +78 -0
  424. package/core/jarvis/autonomous/evolver/AGENT.md +294 -0
  425. package/core/jarvis/autonomous/evolver/SOUL.md +85 -0
  426. package/core/jarvis/autonomous/playbook-generator/AGENT.md +399 -0
  427. package/core/jarvis/autonomous/playbook-generator/SOUL.md +80 -0
  428. package/core/patterns/_ROLE_PATTERNS.yaml +547 -0
  429. package/core/patterns/quality_gates.yaml +259 -0
  430. package/core/patterns/trigger_config.yaml +193 -0
  431. package/core/schemas/SCHEMA-INDEX.md +94 -0
  432. package/core/schemas/canonical-map.schema.json +98 -0
  433. package/core/schemas/chunks-state.schema.json +131 -0
  434. package/core/schemas/decisions-registry.schema.json +120 -0
  435. package/core/schemas/file-registry.schema.json +69 -0
  436. package/core/schemas/insights-state.schema.json +111 -0
  437. package/core/schemas/narratives-state.schema.json +150 -0
  438. package/core/tasks/CHANGELOG.md +55 -0
  439. package/core/tasks/TASK-REGISTRY.md +113 -0
  440. package/core/tasks/_templates/task-tmpl.md +105 -0
  441. package/core/tasks/analyze-themes.md +84 -0
  442. package/core/tasks/detect-role.md +82 -0
  443. package/core/tasks/extract-dna.md +114 -0
  444. package/core/tasks/normalize-entities.md +82 -0
  445. package/core/tasks/process-batch.md +111 -0
  446. package/core/tasks/validate-cascade.md +105 -0
  447. package/core/templates/README.md +27 -0
  448. package/core/templates/agents/dna-config-template.yaml +181 -0
  449. package/core/templates/agents/enrichment-protocol.md +408 -0
  450. package/core/templates/agents/memory-template.md +567 -0
  451. package/core/templates/agents/reasoning-model.md +331 -0
  452. package/core/templates/agents/soul-template.md +416 -0
  453. package/core/templates/agents/template-evolution.md +544 -0
  454. package/core/templates/debates/CONCLAVE-LOG-TEMPLATE-v2.md +309 -0
  455. package/core/templates/debates/conclave-log-template.md +309 -0
  456. package/core/templates/debates/conclave-protocol.md +518 -0
  457. package/core/templates/debates/debate-dynamics-config.yaml +322 -0
  458. package/core/templates/debates/debate-dynamics.md +613 -0
  459. package/core/templates/debates/debate-protocol.md +323 -0
  460. package/core/templates/logs/LOG-TEMPLATES.md +1068 -0
  461. package/core/templates/logs/batch-visual-template.md +841 -0
  462. package/core/templates/logs/log-structure.md +65 -0
  463. package/core/templates/logs/visual-diff.md +159 -0
  464. package/core/templates/phases/dossier-compilation.md +790 -0
  465. package/core/templates/phases/narrative-metabolism.md +292 -0
  466. package/core/templates/phases/narrative-synthesis.md +278 -0
  467. package/core/templates/phases/phase4-checkpoint.md +146 -0
  468. package/core/templates/phases/prompt-1.1-chunking.md +154 -0
  469. package/core/templates/phases/prompt-1.2-entity-resolution.md +186 -0
  470. package/core/templates/phases/prompt-2.1-dna-tags.md +208 -0
  471. package/core/templates/phases/prompt-2.1-insight-extraction.md +191 -0
  472. package/core/templates/phases/prompt-3.1-narrative.md +331 -0
  473. package/core/templates/phases/sources-compilation.md +340 -0
  474. package/core/workflows/PIPELINE-JARVIS-DOCS.md +606 -0
  475. package/core/workflows/wf-conclave.yaml +139 -0
  476. package/core/workflows/wf-extract-dna.yaml +158 -0
  477. package/core/workflows/wf-ingest.yaml +88 -0
  478. package/core/workflows/wf-pipeline-full.yaml +138 -0
  479. package/docs/API-KEYS-GUIDE.md +372 -0
  480. package/docs/INTEGRATION-POINTS.md +501 -0
  481. package/docs/LAYERS.md +403 -0
  482. package/docs/PLAN-MODE-PROTOCOL.md +388 -0
  483. package/docs/RESTORE-AND-INDEX.md +203 -0
  484. package/docs/TAG-RESOLVER-IMPLEMENTATION.md +597 -0
  485. package/docs/conselho.md +337 -0
  486. package/docs/context7-readme.md +28 -0
  487. package/docs/jarvis-logging-protocol.md +380 -0
  488. package/docs/pipeline-completa-v4.md +1315 -0
  489. package/docs/prompts/meta_agente_mapeamento_processos.md +297 -0
  490. package/docs/quick-start.md +197 -0
  491. package/docs/readme-ralph-cascateamento.md +207 -0
  492. package/docs/template-master.md +727 -0
  493. package/docs/templates/phase5/IMPLEMENTATION-GUIDE.md +355 -0
  494. package/docs/templates/phase5/MOGA-BRAIN-PHASE5-TEMPLATES.md +1284 -0
  495. package/docs/templates/phase5/README.md +165 -0
  496. package/docs/workflow-continuous-claude.md +2232 -0
  497. package/inbox/.gitkeep +0 -0
  498. package/inbox/README.md +15 -0
  499. package/knowledge/NAVIGATION-MAP.json +292 -0
  500. package/knowledge/README.md +11 -0
  501. package/knowledge/dna/.gitkeep +0 -0
  502. package/knowledge/dossiers/persons/.gitkeep +0 -0
  503. package/knowledge/dossiers/system/.gitkeep +0 -0
  504. package/knowledge/dossiers/themes/.gitkeep +0 -0
  505. package/knowledge/playbooks/.gitkeep +0 -0
  506. package/knowledge/sources/.gitkeep +0 -0
  507. package/logs/.gitkeep +0 -0
  508. package/logs/README.md +11 -0
  509. package/package.json +180 -0
  510. package/requirements.txt +4 -0
@@ -0,0 +1,562 @@
1
+ #!/usr/bin/env python3
2
+ """
3
+ THEME ANALYZER - Intelligence Layer v1.0
4
+ ==========================================
5
+ Extrai e normaliza temas de TODOS os formatos de chunk e insight do Mega Brain.
6
+
7
+ Formatos suportados:
8
+ - AH-BP001: key_concepts[], section, framework_name
9
+ - CG-SM001: temas[], pessoas[], meta.speaker
10
+ - RAG migrated: metadata.theme, topic_hint, mentions[]
11
+ - SS001 legacy: topic, entities[], keywords[]
12
+ - Insights: themes[], type (METRIC/FRAMEWORK/PRINCIPLE/TACTIC)
13
+
14
+ Para cada tema extraido:
15
+ 1. Normaliza via entity_normalizer
16
+ 2. Atualiza occurrence_count no ENTITY-REGISTRY
17
+ 3. Mapeia tema -> dominio via DOMAINS-TAXONOMY
18
+ 4. Detecta roles mencionados e associa ao tema
19
+
20
+ Output: {themes_found, themes_new, roles_mentioned, domains_touched, persons_found}
21
+
22
+ Versao: 1.0.0
23
+ Data: 2026-02-24
24
+ """
25
+
26
+ import json
27
+ import os
28
+ import re
29
+ import sys
30
+ from pathlib import Path
31
+ from datetime import datetime, timezone
32
+ from collections import Counter
33
+
34
+ # Local imports
35
+ sys.path.insert(0, str(Path(__file__).parent))
36
+ from entity_normalizer import (
37
+ load_registry, save_registry, normalize_entity,
38
+ normalize_text, get_domain_aliases, load_taxonomy
39
+ )
40
+
41
+ # ---------------------------------------------------------------------------
42
+ # PATHS
43
+ # ---------------------------------------------------------------------------
44
# BASE_DIR is the parent of the directory that contains this module; the two
# scan directories both live under BASE_DIR / "processing".
BASE_DIR = Path(__file__).parent.parent
CHUNKS_DIR = BASE_DIR.joinpath("processing", "chunks")
INSIGHTS_DIR = BASE_DIR.joinpath("processing", "insights")
47
+
48
+ # ---------------------------------------------------------------------------
49
+ # DOSSIER THEME ID MAP
50
+ # ---------------------------------------------------------------------------
51
+ # Maps known dossier theme IDs (used in CG-SM001 format) to readable names
52
# (dossier theme ID, readable theme name) pairs. Lookups elsewhere in this
# module fall back to the raw ID when an ID is not listed here.
DOSSIER_THEME_MAP = dict((
    ("01-ESTRUTURA-TIME", "estrutura-time-vendas"),
    ("02-PROCESSO-VENDAS", "processo-vendas"),
    ("03-OUTBOUND", "outbound"),
    ("04-COMISSIONAMENTO", "comissionamento"),
    ("05-METRICAS", "metricas-vendas"),
    ("06-FUNIL-APLICACAO", "funil-aplicacao"),
    ("07-PRICING", "pricing-ofertas"),
    ("08-HIRING", "hiring-contratacao"),
    ("09-GESTAO", "gestao-lideranca"),
    ("10-CULTURA", "cultura-organizacional"),
    ("11-SCRIPTS-VENDAS", "scripts-vendas"),
    ("12-OBJECOES", "objecoes"),
    ("13-FOLLOW-UP", "follow-up"),
    ("14-SHOW-RATES", "show-rates"),
    ("15-CALL-FUNNELS", "call-funnels"),
    ("16-ONBOARDING", "onboarding"),
    ("17-CUSTOMER-SUCCESS", "customer-success"),
    ("18-REFERRAL", "referral"),
    ("19-RETENTION", "retention"),
    ("20-SCALING", "scaling-operacoes"),
    ("21-MINDSET", "mindset"),
    ("22-OFERTAS", "ofertas"),
))
76
+
77
+
78
+ # ---------------------------------------------------------------------------
79
+ # CHUNK PROCESSORS (one per format)
80
+ # ---------------------------------------------------------------------------
81
def process_ah_format(chunk, source_id):
    """
    Extract theme candidates from an AH-BP001 format chunk.

    Fields read: key_concepts[], framework_name, section.

    Args:
        chunk: chunk dict.
        source_id: not used by this processor; accepted so that every
            format processor can be called with the same arguments.

    Returns:
        {"themes": [...], "roles": [], "persons": []} -- themes are the key
        concepts, then the framework name (if set), then the section (if set
        and not the "START HERE" placeholder).
    """
    # `or []` tolerates an explicit JSON null: format detection only checks
    # that the key exists, so a null value can reach this point.
    themes = list(chunk.get("key_concepts") or [])

    # framework_name is a strong theme signal
    framework = chunk.get("framework_name")
    if framework:
        themes.append(framework)

    # section can hint at the theme, except for the generic landing section
    section = chunk.get("section", "")
    if section and section not in ("START HERE",):
        themes.append(section)

    return {"themes": themes, "roles": [], "persons": []}
105
+
106
+
107
def process_cg_format(chunk, source_id):
    """
    Extract themes and persons from a CG-SM001 format chunk.

    Fields read: temas[], pessoas[], meta.speaker.

    Args:
        chunk: chunk dict.
        source_id: not used by this processor; accepted so that every
            format processor can be called with the same arguments.

    Returns:
        {"themes": [...], "roles": [], "persons": [...]} -- each tema ID is
        translated through DOSSIER_THEME_MAP (unknown IDs pass through
        unchanged); persons are the listed pessoas followed by the speaker.
    """
    # `or []` tolerates an explicit JSON null for the list fields.
    themes = [
        DOSSIER_THEME_MAP.get(tema_id, tema_id)
        for tema_id in chunk.get("temas") or []
    ]
    persons = list(chunk.get("pessoas") or [])

    # Only read the speaker when meta really is an object; a null or scalar
    # meta would otherwise raise AttributeError on .get().
    meta = chunk.get("meta")
    speaker = meta.get("speaker") if isinstance(meta, dict) else None
    if speaker:
        persons.append(speaker)

    return {"themes": themes, "roles": [], "persons": persons}
132
+
133
+
134
def process_rag_format(chunk, source_id):
    """
    Extract themes and persons from a RAG-migrated format chunk.

    Fields read: metadata.theme, topic_hint, mentions[].

    Args:
        chunk: chunk dict.
        source_id: not used by this processor; accepted so that every
            format processor can be called with the same arguments.

    Returns:
        {"themes": [...], "roles": [], "persons": [...]} -- the metadata
        theme is translated through DOSSIER_THEME_MAP (unknown values pass
        through unchanged); topic_hint is added unless it starts with "#";
        every mention is reported as a person.
    """
    themes = []

    # A null or scalar metadata value would raise AttributeError on .get().
    metadata = chunk.get("metadata")
    theme = metadata.get("theme") if isinstance(metadata, dict) else None
    if theme:
        themes.append(DOSSIER_THEME_MAP.get(theme, theme))

    # Hints starting with "#" are skipped
    topic = chunk.get("topic_hint", "")
    if topic and not topic.startswith("#"):
        themes.append(topic)

    # `or []` tolerates an explicit JSON null.
    persons = list(chunk.get("mentions") or [])

    return {"themes": themes, "roles": [], "persons": persons}
157
+
158
+
159
def process_ss_format(chunk, source_id):
    """
    Extract themes and persons from an SS001 legacy chunk (individual file).

    Fields read: topic, entities[], keywords[], speaker.

    Args:
        chunk: chunk dict.
        source_id: not used by this processor; accepted so that every
            format processor can be called with the same arguments.

    Returns:
        {"themes": [...], "roles": [], "persons": [...]} -- themes are the
        readable topic followed by the keywords; persons are the entities
        followed by the title-cased speaker.
    """
    themes = []
    persons = []

    topic = chunk.get("topic", "")
    if topic:
        # Convert SCREAMING_SNAKE to readable text
        readable = topic.lower().replace("_", " ").strip()
        if readable and readable not in ("intro context",):
            themes.append(readable)

    # `or []` tolerates an explicit JSON null for either list field.
    persons.extend(chunk.get("entities") or [])
    themes.extend(chunk.get("keywords") or [])

    speaker = chunk.get("speaker", "")
    if speaker:
        # Speaker IDs are snake_case; turn them into a display name.
        persons.append(speaker.replace("_", " ").title())

    return {"themes": themes, "roles": [], "persons": persons}
186
+
187
+
188
def process_insight(insight, source_id):
    """
    Extract themes and persons from a single insight record.

    Fields read: themes[], type, insight (text), source.speaker.

    Args:
        insight: insight dict.
        source_id: not used by this processor; accepted so that it can be
            called with the same arguments as the chunk processors.

    Returns:
        {"themes": [...], "roles": [], "persons": [...]} -- theme IDs are
        translated through DOSSIER_THEME_MAP (unknown IDs pass through
        unchanged). For FRAMEWORK/METHODOLOGY insights the text before the
        first colon is added as a theme.
    """
    # `or []` tolerates an explicit JSON null.
    themes = [
        DOSSIER_THEME_MAP.get(theme_id, theme_id)
        for theme_id in insight.get("themes") or []
    ]

    # The insight text itself may contain a framework name
    insight_text = insight.get("insight", "")
    itype = insight.get("type", "")
    if (
        itype in ("FRAMEWORK", "METHODOLOGY")
        and insight_text
        and isinstance(insight_text, str)  # re.match rejects non-strings
    ):
        # The framework name is taken to be whatever precedes the first colon
        match = re.match(r"^([^:]+):", insight_text)
        if match:
            themes.append(match.group(1).strip())

    # `source` may be a plain string (or null) instead of an object; only an
    # object can carry a speaker.
    persons = []
    source = insight.get("source")
    speaker = source.get("speaker") if isinstance(source, dict) else None
    if speaker:
        persons.append(speaker)

    return {"themes": themes, "roles": [], "persons": persons}
215
+
216
+
217
+ # ---------------------------------------------------------------------------
218
+ # FORMAT DETECTOR
219
+ # ---------------------------------------------------------------------------
220
def detect_chunk_format(chunk):
    """
    Detect which format a chunk uses, based on which keys are present.

    Checks run in priority order: the two-key signatures first, then the
    single-key fallbacks.

    Args:
        chunk: a decoded chunk; anything that is not a dict is "unknown".

    Returns:
        One of "ah", "cg", "rag", "ss" or "unknown".
    """
    if not isinstance(chunk, dict):
        return "unknown"

    if "key_concepts" in chunk and "section" in chunk:
        return "ah"
    if "temas" in chunk and "meta" in chunk:
        return "cg"

    # Only an object-valued metadata can identify the RAG format. A null
    # value would make the `in` test raise, and a string value would turn it
    # into a substring search.
    metadata = chunk.get("metadata")
    if isinstance(metadata, dict) and (
        "migrated_from_rag" in metadata or "theme" in metadata
    ):
        return "rag"

    if "topic" in chunk and "entities" in chunk:
        return "ss"

    # Weaker single-key fallbacks
    if "key_concepts" in chunk:
        return "ah"
    if "temas" in chunk:
        return "cg"
    return "unknown"
237
+
238
+
239
# Dispatch table: format code returned by detect_chunk_format -> processor.
# "unknown" has no entry on purpose.
FORMAT_PROCESSORS = dict(
    ah=process_ah_format,
    cg=process_cg_format,
    rag=process_rag_format,
    ss=process_ss_format,
)
245
+
246
+
247
+ # ---------------------------------------------------------------------------
248
+ # CORE: ANALYZE FILE
249
+ # ---------------------------------------------------------------------------
250
def analyze_chunk_file(filepath, registry=None):
    """
    Analyze a single chunk or insight file. Extracts themes, persons, roles.

    Three file layouts are handled: consolidated files with a "chunks"
    array, insight files with an "insights" array, and individual chunk
    files where the top-level object is itself the chunk.

    Args:
        filepath: path to a .json file
        registry: shared ENTITY-REGISTRY dict; loaded via load_registry()
            when omitted

    Returns:
        On success:
        {
            "source_id": str,
            "themes_found": [str],
            "themes_new": [str],
            "roles_mentioned": [str],
            "persons_found": [str],
            "domains_touched": [str],
            "chunk_count": int,
            "format": str
        }
        On failure (missing file, unreadable file, invalid JSON, or a
        top-level value that is not an object): {"error": str}. Problems are
        reported this way rather than raised so that a single bad file
        cannot abort a multi-file scan.
    """
    if registry is None:
        registry = load_registry()

    filepath = Path(filepath)
    if not filepath.exists():
        return {"error": f"File not found: {filepath}"}

    try:
        with open(filepath, "r", encoding="utf-8") as f:
            data = json.load(f)
    except (OSError, ValueError) as exc:
        # ValueError covers both json.JSONDecodeError and UnicodeDecodeError.
        return {"error": f"Could not read {filepath}: {exc}"}

    if not isinstance(data, dict):
        return {
            "error": (
                f"Unsupported JSON structure in {filepath}: "
                f"expected an object, got {type(data).__name__}"
            )
        }

    source_id = data.get("source_id", data.get("source_hash", filepath.stem))

    # Handle both consolidated files (with "chunks" array) and individual chunk files
    if "chunks" in data:
        chunks = data["chunks"] or []  # tolerate "chunks": null
    elif "insights" in data:
        # Insight files
        return _analyze_insights_file(data, source_id, registry)
    else:
        # Individual chunk file (SS001 format)
        chunks = [data]

    all_themes = []
    all_persons = []
    all_roles = []
    detected_format = "unknown"

    for chunk in chunks:
        if not isinstance(chunk, dict):
            continue
        fmt = detect_chunk_format(chunk)
        if fmt == "unknown":
            continue
        # The reported format is that of the last recognized chunk.
        detected_format = fmt

        result = FORMAT_PROCESSORS[fmt](chunk, source_id)
        all_themes.extend(result["themes"])
        all_persons.extend(result["persons"])
        all_roles.extend(result["roles"])

    # Normalize and deduplicate. chunk_count is the number of entries in the
    # file, including those whose format was not recognized.
    return _normalize_and_compile(
        all_themes, all_persons, all_roles,
        source_id, len(chunks), detected_format, registry
    )
315
+
316
+
317
def _analyze_insights_file(data, source_id, registry):
    """
    Run process_insight over every entry in data["insights"] and compile the
    combined result with format "insight".

    The reported count is data["insights_extracted"] when that key exists,
    otherwise the number of entries in the insights list.
    """
    themes, persons, roles = [], [], []

    for entry in data.get("insights", []):
        extracted = process_insight(entry, source_id)
        themes += extracted["themes"]
        persons += extracted["persons"]
        roles += extracted["roles"]

    listed = len(data.get("insights", []))
    total = data.get("insights_extracted", listed)

    return _normalize_and_compile(
        themes, persons, roles, source_id, total, "insight", registry
    )
334
+
335
+
336
def _normalize_and_compile(all_themes, all_persons, all_roles,
                           source_id, chunk_count, detected_format, registry):
    """
    Normalize the raw themes, persons and roles and build the result dict.

    Raw values are processed in order (themes, then persons, then roles).
    A value is skipped when its normalize_text() form is empty, shorter than
    two characters, or already seen within the same category. Every kept
    value is resolved with normalize_entity(..., auto_save=False), so the
    registry is not saved from here.

    Returns a dict with source_id, themes_found, themes_new, roles_mentioned,
    persons_found, domains_touched (sorted), chunk_count and format.
    """
    alias_to_domain = get_domain_aliases()

    def first_occurrences(raw_values):
        # Lazily yield (raw, normalized) for each usable, not-yet-seen value,
        # so normalization and entity resolution stay interleaved per item.
        already = set()
        for raw in raw_values:
            key = normalize_text(raw)
            if key and len(key) >= 2 and key not in already:
                already.add(key)
                yield raw, key

    def resolve(raw, entity_type):
        return normalize_entity(
            raw, entity_type, registry=registry,
            source_id=source_id, auto_save=False
        )

    # Themes: also record newly created ones and the domains they map to.
    themes_found, themes_new = [], []
    domains_touched = set()
    for raw_theme, key in first_occurrences(all_themes):
        entity = resolve(raw_theme, "theme")
        canonical = entity["canonical"]
        themes_found.append(canonical)
        if entity["created"]:
            themes_new.append(canonical)

        # Domain via alias of the normalized text ...
        if key in alias_to_domain:
            domains_touched.add(alias_to_domain[key])
        # ... and via domain_ids stored on the registry entry.
        registered = registry.get("themes", {}).get(canonical, {})
        domains_touched.update(registered.get("domain_ids", []))

    persons_found = [
        resolve(raw_person, "person")["canonical"]
        for raw_person, _ in first_occurrences(all_persons)
    ]

    roles_mentioned = [
        resolve(raw_role, "role")["canonical"]
        for raw_role, _ in first_occurrences(all_roles)
    ]

    # Different raw values can resolve to the same canonical name, so
    # deduplicate again while keeping first-seen order.
    def ordered_unique(values):
        return list(dict.fromkeys(values))

    return {
        "source_id": source_id,
        "themes_found": ordered_unique(themes_found),
        "themes_new": ordered_unique(themes_new),
        "roles_mentioned": ordered_unique(roles_mentioned),
        "persons_found": ordered_unique(persons_found),
        "domains_touched": sorted(domains_touched),
        "chunk_count": chunk_count,
        "format": detected_format,
    }
415
+
416
+
417
+ # ---------------------------------------------------------------------------
418
+ # ANALYZE ALL CHUNKS
419
+ # ---------------------------------------------------------------------------
420
def analyze_all_chunks(registry=None, save=True):
    """
    Analyze every *.json file in CHUNKS_DIR, then every one in INSIGHTS_DIR.

    State/index files are skipped, as are files for which analyze_chunk_file
    reports an error. Each counter is incremented once per file in which an
    item appears. Only files from CHUNKS_DIR contribute to total_chunks.

    Args:
        registry: shared ENTITY-REGISTRY dict; loaded via load_registry()
            when omitted
        save: when true, the registry is passed to save_registry() after
            the scan

    Returns:
        {
            "total_files": int,
            "total_chunks": int,
            "all_themes": Counter,
            "all_persons": Counter,
            "all_roles": Counter,
            "all_domains": Counter,
            "new_themes": [str],
            "files_processed": [dict]
        }
    """
    if registry is None:
        registry = load_registry()

    theme_counts = Counter()
    person_counts = Counter()
    role_counts = Counter()
    domain_counts = Counter()
    created_themes = []
    processed = []
    chunk_total = 0

    # (directory, file names to skip, whether chunk_count is accumulated)
    scan_plan = (
        (CHUNKS_DIR, ("CHUNKS-STATE.json", "_INDEX.json", "_rag_export.json"), True),
        (INSIGHTS_DIR, ("INSIGHTS-STATE.json",), False),
    )

    for directory, skipped_names, counts_as_chunks in scan_plan:
        for json_path in sorted(directory.glob("*.json")):
            if json_path.name in skipped_names:
                continue

            report = analyze_chunk_file(json_path, registry=registry)
            if "error" in report:
                continue

            processed.append({
                "file": json_path.name,
                "source_id": report["source_id"],
                "format": report["format"],
                "themes": len(report["themes_found"]),
                "new_themes": len(report["themes_new"]),
            })

            theme_counts.update(report["themes_found"])
            person_counts.update(report["persons_found"])
            role_counts.update(report["roles_mentioned"])
            domain_counts.update(report["domains_touched"])
            created_themes.extend(report["themes_new"])
            if counts_as_chunks:
                chunk_total += report["chunk_count"]

    if save:
        save_registry(registry)

    return {
        "total_files": len(processed),
        "total_chunks": chunk_total,
        "all_themes": theme_counts,
        "all_persons": person_counts,
        "all_roles": role_counts,
        "all_domains": domain_counts,
        "new_themes": list(set(created_themes)),
        "files_processed": processed,
    }
518
+
519
+
520
+ # ---------------------------------------------------------------------------
521
+ # CLI
522
+ # ---------------------------------------------------------------------------
523
def main():
    """
    CLI entry point.

    With no arguments, prints usage and exits with status 1. With "--all",
    runs the full scan (saving the registry) and prints a summary. With any
    other first argument, treats it as a file path and prints that file's
    analysis as JSON.
    """
    cli_args = sys.argv[1:]

    if not cli_args:
        print("Uso:")
        print(" python3 theme_analyzer.py --all # Analyze all chunks + insights")
        print(" python3 theme_analyzer.py <filepath> # Analyze single file")
        sys.exit(1)

    target = cli_args[0]
    if target != "--all":
        print("\n=== THEME ANALYZER: Single File ===\n")
        single = analyze_chunk_file(target)
        print(json.dumps(single, indent=2, ensure_ascii=False))
        return

    print("\n=== THEME ANALYZER: Full Scan ===\n")
    report = analyze_all_chunks(save=True)

    summary = (
        ("Files processed", report["total_files"]),
        ("Total chunks", report["total_chunks"]),
        ("Themes found", len(report["all_themes"])),
        ("New themes", len(report["new_themes"])),
        ("Persons found", len(report["all_persons"])),
        ("Roles found", len(report["all_roles"])),
        ("Domains touched", len(report["all_domains"])),
    )
    for label, value in summary:
        print(f"{label}: {value}")

    # (heading, result key, how many entries to show; None means all)
    rankings = (
        ("Top 20 Themes", "all_themes", 20),
        ("Top 10 Persons", "all_persons", 10),
        ("Domains", "all_domains", None),
    )
    for heading, key, limit in rankings:
        print(f"\n--- {heading} ---")
        for name, count in report[key].most_common(limit):
            print(f" {count:4d}x {name}")


if __name__ == "__main__":
    main()