mega-brain-ai 1.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.antigravity/README.md +46 -0
- package/.antigravity/rules/.gitkeep +0 -0
- package/.antigravity/rules/mega-brain.md +39 -0
- package/.claude/CLAUDE.md +172 -0
- package/.claude/agents.yaml +44 -0
- package/.claude/commands/agents.md +161 -0
- package/.claude/commands/ask.md +117 -0
- package/.claude/commands/benchmark.md +224 -0
- package/.claude/commands/chat.md +343 -0
- package/.claude/commands/compare.md +116 -0
- package/.claude/commands/conclave.md +196 -0
- package/.claude/commands/config.md +133 -0
- package/.claude/commands/create-agent.md +467 -0
- package/.claude/commands/debate.md +159 -0
- package/.claude/commands/documentation/create-architecture-documentation.md +175 -0
- package/.claude/commands/dossiers.md +180 -0
- package/.claude/commands/evolve.md +223 -0
- package/.claude/commands/extract-dna.md +172 -0
- package/.claude/commands/extract-knowledge.md +507 -0
- package/.claude/commands/gsd/add-phase.md +43 -0
- package/.claude/commands/gsd/add-tests.md +41 -0
- package/.claude/commands/gsd/add-todo.md +47 -0
- package/.claude/commands/gsd/audit-milestone.md +36 -0
- package/.claude/commands/gsd/check-todos.md +45 -0
- package/.claude/commands/gsd/cleanup.md +18 -0
- package/.claude/commands/gsd/complete-milestone.md +136 -0
- package/.claude/commands/gsd/debug.md +167 -0
- package/.claude/commands/gsd/discuss-phase.md +83 -0
- package/.claude/commands/gsd/execute-phase.md +41 -0
- package/.claude/commands/gsd/health.md +22 -0
- package/.claude/commands/gsd/help.md +22 -0
- package/.claude/commands/gsd/insert-phase.md +32 -0
- package/.claude/commands/gsd/join-discord.md +18 -0
- package/.claude/commands/gsd/list-phase-assumptions.md +46 -0
- package/.claude/commands/gsd/map-codebase.md +71 -0
- package/.claude/commands/gsd/new-milestone.md +44 -0
- package/.claude/commands/gsd/new-project.md +42 -0
- package/.claude/commands/gsd/pause-work.md +38 -0
- package/.claude/commands/gsd/plan-milestone-gaps.md +34 -0
- package/.claude/commands/gsd/plan-phase.md +45 -0
- package/.claude/commands/gsd/progress.md +24 -0
- package/.claude/commands/gsd/quick.md +41 -0
- package/.claude/commands/gsd/reapply-patches.md +110 -0
- package/.claude/commands/gsd/remove-phase.md +31 -0
- package/.claude/commands/gsd/research-phase.md +189 -0
- package/.claude/commands/gsd/resume-work.md +40 -0
- package/.claude/commands/gsd/set-profile.md +34 -0
- package/.claude/commands/gsd/settings.md +36 -0
- package/.claude/commands/gsd/update.md +37 -0
- package/.claude/commands/gsd/verify-work.md +38 -0
- package/.claude/commands/inbox.md +296 -0
- package/.claude/commands/ingest-empresa.md +191 -0
- package/.claude/commands/ingest.md +183 -0
- package/.claude/commands/jarvis-briefing.md +67 -0
- package/.claude/commands/jarvis-control.md +169 -0
- package/.claude/commands/jarvis-full.md +182 -0
- package/.claude/commands/jarvis.md +212 -0
- package/.claude/commands/ler-drive.md +212 -0
- package/.claude/commands/log.md +158 -0
- package/.claude/commands/loop.md +133 -0
- package/.claude/commands/loops.md +73 -0
- package/.claude/commands/mission-autopilot.md +538 -0
- package/.claude/commands/mission.md +353 -0
- package/.claude/commands/process-inbox.md +148 -0
- package/.claude/commands/process-jarvis.md +3036 -0
- package/.claude/commands/process-video.md +131 -0
- package/.claude/commands/rag-search.md +78 -0
- package/.claude/commands/resume.md +33 -0
- package/.claude/commands/save.md +38 -0
- package/.claude/commands/scan-inbox.md +125 -0
- package/.claude/commands/setup.md +99 -0
- package/.claude/commands/system-digest.md +243 -0
- package/.claude/commands/verify.md +182 -0
- package/.claude/commands/view-dna.md +169 -0
- package/.claude/get-shit-done/VERSION +1 -0
- package/.claude/get-shit-done/bin/gsd-tools.cjs +588 -0
- package/.claude/get-shit-done/bin/lib/commands.cjs +553 -0
- package/.claude/get-shit-done/bin/lib/config.cjs +162 -0
- package/.claude/get-shit-done/bin/lib/core.cjs +411 -0
- package/.claude/get-shit-done/bin/lib/frontmatter.cjs +299 -0
- package/.claude/get-shit-done/bin/lib/init.cjs +710 -0
- package/.claude/get-shit-done/bin/lib/milestone.cjs +216 -0
- package/.claude/get-shit-done/bin/lib/phase.cjs +871 -0
- package/.claude/get-shit-done/bin/lib/roadmap.cjs +298 -0
- package/.claude/get-shit-done/bin/lib/state.cjs +679 -0
- package/.claude/get-shit-done/bin/lib/template.cjs +222 -0
- package/.claude/get-shit-done/bin/lib/verify.cjs +773 -0
- package/.claude/get-shit-done/references/checkpoints.md +776 -0
- package/.claude/get-shit-done/references/continuation-format.md +249 -0
- package/.claude/get-shit-done/references/decimal-phase-calculation.md +65 -0
- package/.claude/get-shit-done/references/git-integration.md +248 -0
- package/.claude/get-shit-done/references/git-planning-commit.md +38 -0
- package/.claude/get-shit-done/references/model-profile-resolution.md +34 -0
- package/.claude/get-shit-done/references/model-profiles.md +92 -0
- package/.claude/get-shit-done/references/phase-argument-parsing.md +61 -0
- package/.claude/get-shit-done/references/planning-config.md +196 -0
- package/.claude/get-shit-done/references/questioning.md +145 -0
- package/.claude/get-shit-done/references/tdd.md +263 -0
- package/.claude/get-shit-done/references/ui-brand.md +160 -0
- package/.claude/get-shit-done/references/verification-patterns.md +612 -0
- package/.claude/get-shit-done/templates/DEBUG.md +164 -0
- package/.claude/get-shit-done/templates/UAT.md +247 -0
- package/.claude/get-shit-done/templates/VALIDATION.md +76 -0
- package/.claude/get-shit-done/templates/codebase/architecture.md +255 -0
- package/.claude/get-shit-done/templates/codebase/concerns.md +310 -0
- package/.claude/get-shit-done/templates/codebase/conventions.md +307 -0
- package/.claude/get-shit-done/templates/codebase/integrations.md +280 -0
- package/.claude/get-shit-done/templates/codebase/stack.md +186 -0
- package/.claude/get-shit-done/templates/codebase/structure.md +285 -0
- package/.claude/get-shit-done/templates/codebase/testing.md +480 -0
- package/.claude/get-shit-done/templates/config.json +37 -0
- package/.claude/get-shit-done/templates/context.md +283 -0
- package/.claude/get-shit-done/templates/continue-here.md +78 -0
- package/.claude/get-shit-done/templates/debug-subagent-prompt.md +91 -0
- package/.claude/get-shit-done/templates/discovery.md +146 -0
- package/.claude/get-shit-done/templates/milestone-archive.md +123 -0
- package/.claude/get-shit-done/templates/milestone.md +115 -0
- package/.claude/get-shit-done/templates/phase-prompt.md +569 -0
- package/.claude/get-shit-done/templates/planner-subagent-prompt.md +117 -0
- package/.claude/get-shit-done/templates/project.md +184 -0
- package/.claude/get-shit-done/templates/requirements.md +231 -0
- package/.claude/get-shit-done/templates/research-project/ARCHITECTURE.md +204 -0
- package/.claude/get-shit-done/templates/research-project/FEATURES.md +147 -0
- package/.claude/get-shit-done/templates/research-project/PITFALLS.md +200 -0
- package/.claude/get-shit-done/templates/research-project/STACK.md +120 -0
- package/.claude/get-shit-done/templates/research-project/SUMMARY.md +170 -0
- package/.claude/get-shit-done/templates/research.md +552 -0
- package/.claude/get-shit-done/templates/retrospective.md +54 -0
- package/.claude/get-shit-done/templates/roadmap.md +202 -0
- package/.claude/get-shit-done/templates/state.md +176 -0
- package/.claude/get-shit-done/templates/summary-complex.md +59 -0
- package/.claude/get-shit-done/templates/summary-minimal.md +41 -0
- package/.claude/get-shit-done/templates/summary-standard.md +48 -0
- package/.claude/get-shit-done/templates/summary.md +248 -0
- package/.claude/get-shit-done/templates/user-setup.md +311 -0
- package/.claude/get-shit-done/templates/verification-report.md +322 -0
- package/.claude/get-shit-done/workflows/add-phase.md +111 -0
- package/.claude/get-shit-done/workflows/add-tests.md +350 -0
- package/.claude/get-shit-done/workflows/add-todo.md +157 -0
- package/.claude/get-shit-done/workflows/audit-milestone.md +297 -0
- package/.claude/get-shit-done/workflows/check-todos.md +176 -0
- package/.claude/get-shit-done/workflows/cleanup.md +152 -0
- package/.claude/get-shit-done/workflows/complete-milestone.md +763 -0
- package/.claude/get-shit-done/workflows/diagnose-issues.md +219 -0
- package/.claude/get-shit-done/workflows/discovery-phase.md +289 -0
- package/.claude/get-shit-done/workflows/discuss-phase.md +542 -0
- package/.claude/get-shit-done/workflows/execute-phase.md +449 -0
- package/.claude/get-shit-done/workflows/execute-plan.md +448 -0
- package/.claude/get-shit-done/workflows/health.md +156 -0
- package/.claude/get-shit-done/workflows/help.md +489 -0
- package/.claude/get-shit-done/workflows/insert-phase.md +129 -0
- package/.claude/get-shit-done/workflows/list-phase-assumptions.md +178 -0
- package/.claude/get-shit-done/workflows/map-codebase.md +315 -0
- package/.claude/get-shit-done/workflows/new-milestone.md +382 -0
- package/.claude/get-shit-done/workflows/new-project.md +1116 -0
- package/.claude/get-shit-done/workflows/pause-work.md +122 -0
- package/.claude/get-shit-done/workflows/plan-milestone-gaps.md +274 -0
- package/.claude/get-shit-done/workflows/plan-phase.md +569 -0
- package/.claude/get-shit-done/workflows/progress.md +381 -0
- package/.claude/get-shit-done/workflows/quick.md +453 -0
- package/.claude/get-shit-done/workflows/remove-phase.md +154 -0
- package/.claude/get-shit-done/workflows/research-phase.md +73 -0
- package/.claude/get-shit-done/workflows/resume-project.md +306 -0
- package/.claude/get-shit-done/workflows/set-profile.md +80 -0
- package/.claude/get-shit-done/workflows/settings.md +213 -0
- package/.claude/get-shit-done/workflows/transition.md +544 -0
- package/.claude/get-shit-done/workflows/update.md +219 -0
- package/.claude/get-shit-done/workflows/verify-phase.md +242 -0
- package/.claude/get-shit-done/workflows/verify-work.md +569 -0
- package/.claude/gsd-file-manifest.json +144 -0
- package/.claude/hooks/agent_creation_trigger.py +168 -0
- package/.claude/hooks/agent_index_updater.py +255 -0
- package/.claude/hooks/agent_memory_persister.py +203 -0
- package/.claude/hooks/claude_md_agent_sync.py +162 -0
- package/.claude/hooks/claude_md_guard.py +154 -0
- package/.claude/hooks/continuous_save.py +414 -0
- package/.claude/hooks/creation_validator.py +360 -0
- package/.claude/hooks/enforce_dual_location.py +501 -0
- package/.claude/hooks/enforce_plan_mode.py +220 -0
- package/.claude/hooks/gsd-check-update.js +62 -0
- package/.claude/hooks/gsd-context-monitor.js +122 -0
- package/.claude/hooks/gsd-statusline.js +108 -0
- package/.claude/hooks/inbox_age_alert.py +367 -0
- package/.claude/hooks/ledger_updater.py +303 -0
- package/.claude/hooks/memory_hints_injector.py +251 -0
- package/.claude/hooks/memory_updater.py +202 -0
- package/.claude/hooks/notification_system.py +115 -0
- package/.claude/hooks/pending_tracker.py +188 -0
- package/.claude/hooks/pipeline_checkpoint.py +583 -0
- package/.claude/hooks/post_batch_cascading.py +1740 -0
- package/.claude/hooks/post_tool_use.py +120 -0
- package/.claude/hooks/quality_watchdog.py +394 -0
- package/.claude/hooks/ralph_wiggum.py +286 -0
- package/.claude/hooks/session-source-sync.py +223 -0
- package/.claude/hooks/session_autosave_v2.py +1135 -0
- package/.claude/hooks/session_end.py +203 -0
- package/.claude/hooks/session_start.py +939 -0
- package/.claude/hooks/skill_indexer.py +48 -0
- package/.claude/hooks/skill_router.py +358 -0
- package/.claude/hooks/stop_hook_completeness.py +187 -0
- package/.claude/hooks/user_prompt_submit.py +125 -0
- package/.claude/package.json +1 -0
- package/.claude/rules/ANTHROPIC-STANDARDS.md +384 -0
- package/.claude/rules/CLAUDE-LITE.md +201 -0
- package/.claude/rules/RULE-GROUP-1.md +320 -0
- package/.claude/rules/RULE-GROUP-2.md +307 -0
- package/.claude/rules/RULE-GROUP-3.md +248 -0
- package/.claude/rules/RULE-GROUP-4.md +427 -0
- package/.claude/rules/RULE-GROUP-5.md +388 -0
- package/.claude/rules/RULE-GROUP-6.md +387 -0
- package/.claude/rules/RULE-GSD-MANDATORY.md +106 -0
- package/.claude/rules/agent-cognition.md +779 -0
- package/.claude/rules/agent-integrity.md +692 -0
- package/.claude/rules/epistemic-standards.md +333 -0
- package/.claude/rules/logging.md +53 -0
- package/.claude/rules/mcp-governance.md +128 -0
- package/.claude/rules/pipeline.md +60 -0
- package/.claude/rules/state-management.md +93 -0
- package/.claude/scripts/apply-tags.py +77 -0
- package/.claude/scripts/batch-extract-transcriptions.py +132 -0
- package/.claude/scripts/build-complete-index.py +250 -0
- package/.claude/scripts/build-planilha-index.py +170 -0
- package/.claude/scripts/complete-tag-matching.py +250 -0
- package/.claude/scripts/deduplicate-inbox.py +139 -0
- package/.claude/scripts/docx-xml-extractor.py +141 -0
- package/.claude/scripts/extract-docx-text.py +58 -0
- package/.claude/scripts/extract-single-transcription.py +74 -0
- package/.claude/scripts/extract_docx_from_gdrive.py +77 -0
- package/.claude/scripts/jarvis_orchestrator.py +5 -0
- package/.claude/scripts/organized-downloader.py +246 -0
- package/.claude/scripts/planilha-tagger.py +187 -0
- package/.claude/scripts/revert-tags.py +70 -0
- package/.claude/scripts/source-sync.py +265 -0
- package/.claude/scripts/tag-inbox-files.py +276 -0
- package/.claude/scripts/tag-inbox-v2.py +253 -0
- package/.claude/scripts/test-extraction.py +35 -0
- package/.claude/scripts/test-full-extraction.py +74 -0
- package/.claude/scripts/validate_cascading_integrity.py +409 -0
- package/.claude/settings.json +215 -0
- package/.claude/skills/DETECTION-PROTOCOL.md +217 -0
- package/.claude/skills/README.md +240 -0
- package/.claude/skills/SKILL-REGISTRY.md +283 -0
- package/.claude/skills/SKILL-SUGGESTIONS.md +114 -0
- package/.claude/skills/_TEMPLATES/SKILL-WRITER-GUIDE.md +385 -0
- package/.claude/skills/agent-creation/SKILL.md +374 -0
- package/.claude/skills/ask-company/SKILL.md +198 -0
- package/.claude/skills/brainstorming/SKILL.md +72 -0
- package/.claude/skills/chronicler/SKILL.md +146 -0
- package/.claude/skills/chronicler/chronicler_core.py +468 -0
- package/.claude/skills/code-review/SKILL.md +160 -0
- package/.claude/skills/convert-to-company-docs/SKILL.md +68 -0
- package/.claude/skills/convert-to-company-docs/convert.py +532 -0
- package/.claude/skills/dispatching-parallel-agents/SKILL.md +193 -0
- package/.claude/skills/docs-megabrain/SKILL.md +251 -0
- package/.claude/skills/executing-plans/SKILL.md +114 -0
- package/.claude/skills/executor/SKILL.md +161 -0
- package/.claude/skills/fase-2-5-tagging/SKILL.md +182 -0
- package/.claude/skills/feature-dev/SKILL.md +154 -0
- package/.claude/skills/frontend-design/SKILL.md +165 -0
- package/.claude/skills/gdrive-transcription-downloader/SKILL.md +249 -0
- package/.claude/skills/gemini-fallback/SKILL.md +67 -0
- package/.claude/skills/gemini-fallback/gemini_fetch.py +0 -0
- package/.claude/skills/gha/SKILL.md +96 -0
- package/.claude/skills/gha/gha_diagnostic.py +227 -0
- package/.claude/skills/github-workflow/SKILL.md +190 -0
- package/.claude/skills/hookify/SKILL.md +134 -0
- package/.claude/skills/hybrid-source-reading/SKILL.md +265 -0
- package/.claude/skills/jarvis/SKILL.md +546 -0
- package/.claude/skills/jarvis-briefing/SKILL.md +340 -0
- package/.claude/skills/knowledge-extraction/SKILL.md +318 -0
- package/.claude/skills/ler-planilha/SKILL.md +281 -0
- package/.claude/skills/pipeline-jarvis/SKILL.md +430 -0
- package/.claude/skills/plugin-dev/SKILL.md +176 -0
- package/.claude/skills/pr-review-toolkit/SKILL.md +178 -0
- package/.claude/skills/process-company-inbox/SKILL.md +183 -0
- package/.claude/skills/python-megabrain/SKILL.md +323 -0
- package/.claude/skills/resume/SKILL.md +61 -0
- package/.claude/skills/save/SKILL.md +87 -0
- package/.claude/skills/skill-creator-internal/SKILL.md +186 -0
- package/.claude/skills/skill-writer/SKILL.md +153 -0
- package/.claude/skills/skill-writer/examples.md +191 -0
- package/.claude/skills/skill-writer/troubleshooting.md +205 -0
- package/.claude/skills/smart-download-tagger/SKILL.md +148 -0
- package/.claude/skills/source-sync/SKILL.md +240 -0
- package/.claude/skills/sync-docs/SKILL.md +193 -0
- package/.claude/skills/sync-docs/config.json +37 -0
- package/.claude/skills/sync-docs/gdrive_sync.py +358 -0
- package/.claude/skills/sync-docs/reauth.py +71 -0
- package/.claude/skills/using-superpowers/SKILL.md +105 -0
- package/.claude/skills/verification-before-completion/SKILL.md +130 -0
- package/.claude/skills/verify/SKILL.md +154 -0
- package/.claude/skills/verify/verify_runner.py +0 -0
- package/.claude/skills/verify-6-levels/SKILL.md +234 -0
- package/.claude/skills/writing-plans/SKILL.md +184 -0
- package/.claude/templates/BATCH-LOG-TEMPLATE.md +221 -0
- package/.claudeignore +9 -0
- package/.cursor/agents.yaml +44 -0
- package/.cursor/rules/mega-brain.md +39 -0
- package/.gitattributes +19 -0
- package/.github/CODEOWNERS +8 -0
- package/.github/ISSUE_TEMPLATE/agent.md +96 -0
- package/.github/ISSUE_TEMPLATE/bug.md +67 -0
- package/.github/ISSUE_TEMPLATE/feature.md +56 -0
- package/.github/ISSUE_TEMPLATE/pipeline.md +70 -0
- package/.github/PULL_REQUEST_TEMPLATE.md +30 -0
- package/.github/assets/banner.svg +152 -0
- package/.github/assets/logo-dark.svg +79 -0
- package/.github/assets/social-preview.png +0 -0
- package/.github/layer1-allowlist.txt +196 -0
- package/.github/layer2-manifest.txt +42 -0
- package/.github/layer3-manifest.txt +94 -0
- package/.github/workflows/claude-code-pr.yml +198 -0
- package/.github/workflows/claude-code-review.yml +57 -0
- package/.github/workflows/claude.yml +76 -0
- package/.github/workflows/publish-pro.yml +72 -0
- package/.github/workflows/publish.yml +86 -0
- package/.github/workflows/verification.yml +251 -0
- package/.gitignore +244 -0
- package/.gitleaks.toml +118 -0
- package/.windsurf/agents.yaml +44 -0
- package/.windsurf/rules/mega-brain.md +39 -0
- package/CONTRIBUTING.md +62 -0
- package/QUICK-START.md +231 -0
- package/README.md +168 -0
- package/agents/AGENT-INDEX.yaml +107 -0
- package/agents/MASTER-AGENT.md +612 -0
- package/agents/README.md +48 -0
- package/agents/_templates/INDEX.md +741 -0
- package/agents/_templates/TEMPLATE-AGENT-MD-ULTRA-ROBUSTO-V3.md +2399 -0
- package/agents/boardroom/CHECKLIST-MASTER.md +281 -0
- package/agents/boardroom/INTEGRATION-GUIDE.md +406 -0
- package/agents/boardroom/README.md +238 -0
- package/agents/boardroom/config/BOARDROOM-CONFIG.md +186 -0
- package/agents/boardroom/config/TTS-INTEGRATION.md +258 -0
- package/agents/boardroom/config/VOICE-PROFILES.md +624 -0
- package/agents/boardroom/scripts/audio_generator.py +375 -0
- package/agents/boardroom/scripts/audio_generator_edge.py +353 -0
- package/agents/boardroom/scripts/jarvis_boardroom_hook.py +415 -0
- package/agents/boardroom/scripts/notebooklm_generator.py +578 -0
- package/agents/boardroom/templates/EPISODE-TEMPLATE.md +367 -0
- package/agents/boardroom/templates/scene-templates/SCENE-AGENT-DEBATE.md +252 -0
- package/agents/boardroom/templates/scene-templates/SCENE-COUNCIL.md +270 -0
- package/agents/boardroom/templates/scene-templates/SCENE-DNA-CONSULTATION.md +126 -0
- package/agents/boardroom/templates/scene-templates/SCENE-QUESTION.md +174 -0
- package/agents/boardroom/workflows/WORKFLOW-AUDIO-GENERATION.md +421 -0
- package/agents/conclave/CRITIC.md +197 -0
- package/agents/conclave/DEVILS-ADVOCATE.md +274 -0
- package/agents/conclave/README.md +35 -0
- package/agents/conclave/SYNTHESIZER.md +293 -0
- package/agents/conclave/advogado-do-diabo/AGENT.md +502 -0
- package/agents/conclave/advogado-do-diabo/SOUL.md +100 -0
- package/agents/conclave/critico-metodologico/AGENT.md +683 -0
- package/agents/conclave/critico-metodologico/SOUL.md +107 -0
- package/agents/conclave/sintetizador/AGENT.md +571 -0
- package/agents/conclave/sintetizador/SOUL.md +94 -0
- package/agents/constitution/BASE-CONSTITUTION.md +254 -0
- package/agents/persona-registry.yaml +300 -0
- package/agents/sua-empresa/.gitkeep +0 -0
- package/agents/sua-empresa/README.md +44 -0
- package/agents/sua-empresa/_example/jds/EXAMPLE-JD.md +42 -0
- package/agents/sua-empresa/_example/org/EXAMPLE-ORG.md +32 -0
- package/agents/sua-empresa/_example/roles/EXAMPLE-ROLE.md +38 -0
- package/artifacts/README.md +11 -0
- package/artifacts/canonical/.gitkeep +0 -0
- package/artifacts/chunks/.gitkeep +0 -0
- package/artifacts/insights/.gitkeep +0 -0
- package/artifacts/narratives/.gitkeep +0 -0
- package/bin/cli.js +2 -0
- package/bin/lib/ascii-art.js +202 -0
- package/bin/lib/feature-gate.js +46 -0
- package/bin/lib/installer.js +593 -0
- package/bin/lib/license.js +59 -0
- package/bin/lib/pro-commands.js +75 -0
- package/bin/lib/setup-wizard.js +547 -0
- package/bin/lib/validate-email.js +113 -0
- package/bin/mega-brain.js +136 -0
- package/bin/pre-publish-gate.js +229 -0
- package/bin/push.js +1056 -0
- package/bin/templates/env.example +27 -0
- package/bin/utils/pro-detector.js +50 -0
- package/bin/validate-package.js +190 -0
- package/core/__init__.py +2 -0
- package/core/glossary/INDEX.md +63 -0
- package/core/glossary/digital.md +243 -0
- package/core/glossary/finance.md +49 -0
- package/core/glossary/marketing.md +69 -0
- package/core/glossary/operations.md +50 -0
- package/core/glossary/sales.md +690 -0
- package/core/intelligence/__init__.py +41 -0
- package/core/intelligence/agent_trigger.py +468 -0
- package/core/intelligence/audit_layers.py +491 -0
- package/core/intelligence/autonomous_processor.py +796 -0
- package/core/intelligence/bootstrap_registry.py +550 -0
- package/core/intelligence/business_model_detector.py +476 -0
- package/core/intelligence/dossier_trigger.py +336 -0
- package/core/intelligence/entity_normalizer.py +565 -0
- package/core/intelligence/org_chain_detector.py +411 -0
- package/core/intelligence/review_dashboard.py +338 -0
- package/core/intelligence/role_detector.py +855 -0
- package/core/intelligence/session_autosave.py +46 -0
- package/core/intelligence/skill_generator.py +601 -0
- package/core/intelligence/sow_generator.py +711 -0
- package/core/intelligence/sync_package_files.py +504 -0
- package/core/intelligence/task_orchestrator.py +780 -0
- package/core/intelligence/theme_analyzer.py +562 -0
- package/core/intelligence/tool_discovery.py +432 -0
- package/core/intelligence/validate_json_integrity.py +106 -0
- package/core/intelligence/validate_layers.py +310 -0
- package/core/intelligence/verify_classifications.py +94 -0
- package/core/intelligence/viability_scorer.py +592 -0
- package/core/jarvis/02-JARVIS-SOUL.md +390 -0
- package/core/jarvis/03-JARVIS-DNA.yaml +312 -0
- package/core/jarvis/AGENT.md +191 -0
- package/core/jarvis/agent-creator/AGENT.md +199 -0
- package/core/jarvis/agent-creator/SOUL.md +82 -0
- package/core/jarvis/agent-creator/tasks/create-agent.md +133 -0
- package/core/jarvis/agent-creator/tasks/sync-agents.md +100 -0
- package/core/jarvis/agent-creator/workflows/wf-create-agent.yaml +110 -0
- package/core/jarvis/agent-creator/workflows/wf-pipeline-trigger.yaml +111 -0
- package/core/jarvis/autonomous/benchmark/AGENT.md +347 -0
- package/core/jarvis/autonomous/benchmark/SOUL.md +78 -0
- package/core/jarvis/autonomous/critic/AGENT.md +324 -0
- package/core/jarvis/autonomous/critic/SOUL.md +78 -0
- package/core/jarvis/autonomous/evolver/AGENT.md +294 -0
- package/core/jarvis/autonomous/evolver/SOUL.md +85 -0
- package/core/jarvis/autonomous/playbook-generator/AGENT.md +399 -0
- package/core/jarvis/autonomous/playbook-generator/SOUL.md +80 -0
- package/core/patterns/_ROLE_PATTERNS.yaml +547 -0
- package/core/patterns/quality_gates.yaml +259 -0
- package/core/patterns/trigger_config.yaml +193 -0
- package/core/schemas/SCHEMA-INDEX.md +94 -0
- package/core/schemas/canonical-map.schema.json +98 -0
- package/core/schemas/chunks-state.schema.json +131 -0
- package/core/schemas/decisions-registry.schema.json +120 -0
- package/core/schemas/file-registry.schema.json +69 -0
- package/core/schemas/insights-state.schema.json +111 -0
- package/core/schemas/narratives-state.schema.json +150 -0
- package/core/tasks/CHANGELOG.md +55 -0
- package/core/tasks/TASK-REGISTRY.md +113 -0
- package/core/tasks/_templates/task-tmpl.md +105 -0
- package/core/tasks/analyze-themes.md +84 -0
- package/core/tasks/detect-role.md +82 -0
- package/core/tasks/extract-dna.md +114 -0
- package/core/tasks/normalize-entities.md +82 -0
- package/core/tasks/process-batch.md +111 -0
- package/core/tasks/validate-cascade.md +105 -0
- package/core/templates/README.md +27 -0
- package/core/templates/agents/dna-config-template.yaml +181 -0
- package/core/templates/agents/enrichment-protocol.md +408 -0
- package/core/templates/agents/memory-template.md +567 -0
- package/core/templates/agents/reasoning-model.md +331 -0
- package/core/templates/agents/soul-template.md +416 -0
- package/core/templates/agents/template-evolution.md +544 -0
- package/core/templates/debates/CONCLAVE-LOG-TEMPLATE-v2.md +309 -0
- package/core/templates/debates/conclave-log-template.md +309 -0
- package/core/templates/debates/conclave-protocol.md +518 -0
- package/core/templates/debates/debate-dynamics-config.yaml +322 -0
- package/core/templates/debates/debate-dynamics.md +613 -0
- package/core/templates/debates/debate-protocol.md +323 -0
- package/core/templates/logs/LOG-TEMPLATES.md +1068 -0
- package/core/templates/logs/batch-visual-template.md +841 -0
- package/core/templates/logs/log-structure.md +65 -0
- package/core/templates/logs/visual-diff.md +159 -0
- package/core/templates/phases/dossier-compilation.md +790 -0
- package/core/templates/phases/narrative-metabolism.md +292 -0
- package/core/templates/phases/narrative-synthesis.md +278 -0
- package/core/templates/phases/phase4-checkpoint.md +146 -0
- package/core/templates/phases/prompt-1.1-chunking.md +154 -0
- package/core/templates/phases/prompt-1.2-entity-resolution.md +186 -0
- package/core/templates/phases/prompt-2.1-dna-tags.md +208 -0
- package/core/templates/phases/prompt-2.1-insight-extraction.md +191 -0
- package/core/templates/phases/prompt-3.1-narrative.md +331 -0
- package/core/templates/phases/sources-compilation.md +340 -0
- package/core/workflows/PIPELINE-JARVIS-DOCS.md +606 -0
- package/core/workflows/wf-conclave.yaml +139 -0
- package/core/workflows/wf-extract-dna.yaml +158 -0
- package/core/workflows/wf-ingest.yaml +88 -0
- package/core/workflows/wf-pipeline-full.yaml +138 -0
- package/docs/API-KEYS-GUIDE.md +372 -0
- package/docs/INTEGRATION-POINTS.md +501 -0
- package/docs/LAYERS.md +403 -0
- package/docs/PLAN-MODE-PROTOCOL.md +388 -0
- package/docs/RESTORE-AND-INDEX.md +203 -0
- package/docs/TAG-RESOLVER-IMPLEMENTATION.md +597 -0
- package/docs/conselho.md +337 -0
- package/docs/context7-readme.md +28 -0
- package/docs/jarvis-logging-protocol.md +380 -0
- package/docs/pipeline-completa-v4.md +1315 -0
- package/docs/prompts/meta_agente_mapeamento_processos.md +297 -0
- package/docs/quick-start.md +197 -0
- package/docs/readme-ralph-cascateamento.md +207 -0
- package/docs/template-master.md +727 -0
- package/docs/templates/phase5/IMPLEMENTATION-GUIDE.md +355 -0
- package/docs/templates/phase5/MOGA-BRAIN-PHASE5-TEMPLATES.md +1284 -0
- package/docs/templates/phase5/README.md +165 -0
- package/docs/workflow-continuous-claude.md +2232 -0
- package/inbox/.gitkeep +0 -0
- package/inbox/README.md +15 -0
- package/knowledge/NAVIGATION-MAP.json +292 -0
- package/knowledge/README.md +11 -0
- package/knowledge/dna/.gitkeep +0 -0
- package/knowledge/dossiers/persons/.gitkeep +0 -0
- package/knowledge/dossiers/system/.gitkeep +0 -0
- package/knowledge/dossiers/themes/.gitkeep +0 -0
- package/knowledge/playbooks/.gitkeep +0 -0
- package/knowledge/sources/.gitkeep +0 -0
- package/logs/.gitkeep +0 -0
- package/logs/README.md +11 -0
- package/package.json +180 -0
- package/requirements.txt +4 -0
|
@@ -0,0 +1,562 @@
|
|
|
1
|
+
#!/usr/bin/env python3
|
|
2
|
+
"""
|
|
3
|
+
THEME ANALYZER - Intelligence Layer v1.0
|
|
4
|
+
==========================================
|
|
5
|
+
Extrai e normaliza temas de TODOS os formatos de chunk e insight do Mega Brain.
|
|
6
|
+
|
|
7
|
+
Formatos suportados:
|
|
8
|
+
- AH-BP001: key_concepts[], section, framework_name
|
|
9
|
+
- CG-SM001: temas[], pessoas[], meta.speaker
|
|
10
|
+
- RAG migrated: metadata.theme, topic_hint, mentions[]
|
|
11
|
+
- SS001 legacy: topic, entities[], keywords[]
|
|
12
|
+
- Insights: themes[], type (METRIC/FRAMEWORK/PRINCIPLE/TACTIC)
|
|
13
|
+
|
|
14
|
+
Para cada tema extraido:
|
|
15
|
+
1. Normaliza via entity_normalizer
|
|
16
|
+
2. Atualiza occurrence_count no ENTITY-REGISTRY
|
|
17
|
+
3. Mapeia tema -> dominio via DOMAINS-TAXONOMY
|
|
18
|
+
4. Detecta roles mencionados e associa ao tema
|
|
19
|
+
|
|
20
|
+
Output: {themes_found, themes_new, roles_mentioned, domains_touched, persons_found}
|
|
21
|
+
|
|
22
|
+
Versao: 1.0.0
|
|
23
|
+
Data: 2026-02-24
|
|
24
|
+
"""
|
|
25
|
+
|
|
26
|
+
import json
|
|
27
|
+
import os
|
|
28
|
+
import re
|
|
29
|
+
import sys
|
|
30
|
+
from pathlib import Path
|
|
31
|
+
from datetime import datetime, timezone
|
|
32
|
+
from collections import Counter
|
|
33
|
+
|
|
34
|
+
# Local imports
|
|
35
|
+
sys.path.insert(0, str(Path(__file__).parent))
|
|
36
|
+
from entity_normalizer import (
|
|
37
|
+
load_registry, save_registry, normalize_entity,
|
|
38
|
+
normalize_text, get_domain_aliases, load_taxonomy
|
|
39
|
+
)
|
|
40
|
+
|
|
41
|
+
# ---------------------------------------------------------------------------
|
|
42
|
+
# PATHS
|
|
43
|
+
# ---------------------------------------------------------------------------
|
|
44
|
+
# Directory one level above the folder that contains this module.
BASE_DIR = Path(__file__).parent.parent
# Chunk and insight locations, both under BASE_DIR/processing.
# NOTE(review): confirm that a "processing" directory is actually expected
# under BASE_DIR in an installed package.
CHUNKS_DIR = BASE_DIR.joinpath("processing", "chunks")
INSIGHTS_DIR = BASE_DIR.joinpath("processing", "insights")
|
|
47
|
+
|
|
48
|
+
# ---------------------------------------------------------------------------
|
|
49
|
+
# DOSSIER THEME ID MAP
|
|
50
|
+
# ---------------------------------------------------------------------------
|
|
51
|
+
# Maps known dossier theme IDs (used in CG-SM001 format) to readable names
|
|
52
|
+
# Lookup table: numbered dossier theme ID -> readable theme name.
# Built from (id, name) pairs; insertion order follows the numeric prefix.
DOSSIER_THEME_MAP = dict(
    (
        ("01-ESTRUTURA-TIME", "estrutura-time-vendas"),
        ("02-PROCESSO-VENDAS", "processo-vendas"),
        ("03-OUTBOUND", "outbound"),
        ("04-COMISSIONAMENTO", "comissionamento"),
        ("05-METRICAS", "metricas-vendas"),
        ("06-FUNIL-APLICACAO", "funil-aplicacao"),
        ("07-PRICING", "pricing-ofertas"),
        ("08-HIRING", "hiring-contratacao"),
        ("09-GESTAO", "gestao-lideranca"),
        ("10-CULTURA", "cultura-organizacional"),
        ("11-SCRIPTS-VENDAS", "scripts-vendas"),
        ("12-OBJECOES", "objecoes"),
        ("13-FOLLOW-UP", "follow-up"),
        ("14-SHOW-RATES", "show-rates"),
        ("15-CALL-FUNNELS", "call-funnels"),
        ("16-ONBOARDING", "onboarding"),
        ("17-CUSTOMER-SUCCESS", "customer-success"),
        ("18-REFERRAL", "referral"),
        ("19-RETENTION", "retention"),
        ("20-SCALING", "scaling-operacoes"),
        ("21-MINDSET", "mindset"),
        ("22-OFERTAS", "ofertas"),
    )
)
|
|
76
|
+
|
|
77
|
+
|
|
78
|
+
# ---------------------------------------------------------------------------
|
|
79
|
+
# CHUNK PROCESSORS (one per format)
|
|
80
|
+
# ---------------------------------------------------------------------------
|
|
81
|
+
def process_ah_format(chunk, source_id):
    """
    Process AH-BP001 format chunks.

    Fields: key_concepts[], section, type, framework_name, content

    Args:
        chunk: dict holding one chunk.
        source_id: not used by this processor; kept so every processor
            shares the same call signature.

    Returns:
        {"themes": [...], "roles": [], "persons": []}
        roles and persons are always empty for this format.
    """
    # "or []" also covers an explicit JSON null, which the .get() default
    # does not (the key exists, so the default is never used).
    themes = list(chunk.get("key_concepts") or [])

    # framework_name is a strong theme signal
    fw = chunk.get("framework_name")
    if fw:
        themes.append(fw)

    # section can hint at theme; the "START HERE" section is skipped
    section = chunk.get("section", "")
    if section and section != "START HERE":
        themes.append(section)

    return {"themes": themes, "roles": [], "persons": []}
|
|
105
|
+
|
|
106
|
+
|
|
107
|
+
def process_cg_format(chunk, source_id):
    """
    Process CG-SM001 format chunks.

    Fields: temas[], pessoas[], meta.speaker, texto

    Args:
        chunk: dict holding one chunk.
        source_id: not used by this processor; kept so every processor
            shares the same call signature.

    Returns:
        {"themes": [...], "roles": [], "persons": [...]}
        roles is always empty for this format.
    """
    # temas hold dossier IDs; translate the known ones and keep unknown
    # IDs as-is. "or []" tolerates an explicit JSON null.
    themes = [
        DOSSIER_THEME_MAP.get(tema_id, tema_id)
        for tema_id in (chunk.get("temas") or [])
    ]

    # pessoas explicitly listed
    persons = list(chunk.get("pessoas") or [])

    # Speaker from meta; a null or non-dict meta simply has no speaker
    meta = chunk.get("meta")
    speaker = meta.get("speaker") if isinstance(meta, dict) else None
    if speaker:
        persons.append(speaker)

    return {"themes": themes, "roles": [], "persons": persons}
|
|
132
|
+
|
|
133
|
+
|
|
134
|
+
def process_rag_format(chunk, source_id):
    """
    Process RAG-migrated format chunks.

    Fields: metadata.theme, topic_hint, text, mentions[]

    Args:
        chunk: dict holding one chunk.
        source_id: not used by this processor; kept so every processor
            shares the same call signature.

    Returns:
        {"themes": [...], "roles": [], "persons": [...]}
        roles is always empty for this format.
    """
    themes = []

    # A null or non-dict metadata value is treated as "no theme" instead of
    # raising on .get().
    meta = chunk.get("metadata")
    theme = meta.get("theme") if isinstance(meta, dict) else None
    if theme:
        themes.append(DOSSIER_THEME_MAP.get(theme, theme))

    # topic_hint values starting with "#" are skipped
    topic = chunk.get("topic_hint", "")
    if topic and not topic.startswith("#"):
        themes.append(topic)

    # "or []" tolerates an explicit JSON null for mentions
    persons = list(chunk.get("mentions") or [])

    return {"themes": themes, "roles": [], "persons": persons}
|
|
157
|
+
|
|
158
|
+
|
|
159
|
+
def process_ss_format(chunk, source_id):
    """
    Process SS001 legacy format (individual chunk files).

    Fields: topic, entities[], keywords[], content, speaker

    Args:
        chunk: dict holding one chunk.
        source_id: not used by this processor; kept so every processor
            shares the same call signature.

    Returns:
        {"themes": [...], "roles": [], "persons": [...]}
        roles is always empty for this format.
    """
    themes = []

    topic = chunk.get("topic", "")
    if topic:
        # Convert SCREAMING_SNAKE to readable
        readable = topic.lower().replace("_", " ").strip()
        if readable and readable != "intro context":
            themes.append(readable)

    # Every entity is reported as a person. "or []" tolerates an explicit
    # JSON null for either list.
    persons = list(chunk.get("entities") or [])
    themes.extend(chunk.get("keywords") or [])

    speaker = chunk.get("speaker", "")
    if speaker:
        # e.g. "john_doe" -> "John Doe"
        persons.append(speaker.replace("_", " ").title())

    return {"themes": themes, "roles": [], "persons": persons}
|
|
186
|
+
|
|
187
|
+
|
|
188
|
+
def process_insight(insight, source_id):
    """
    Process insight format.

    Fields: themes[], type, insight text, source.speaker

    Args:
        insight: dict holding one insight entry.
        source_id: not used by this processor; kept so it matches the
            chunk processors' call signature.

    Returns:
        {"themes": [...], "roles": [], "persons": [...]}
        roles is always empty for insights.
    """
    # Known dossier IDs are translated, unknown ones kept as-is.
    # "or []" tolerates an explicit JSON null.
    themes = [
        DOSSIER_THEME_MAP.get(theme_id, theme_id)
        for theme_id in (insight.get("themes") or [])
    ]

    # The insight text itself may contain framework names
    insight_text = insight.get("insight", "")
    itype = insight.get("type", "")
    if (
        itype in ("FRAMEWORK", "METHODOLOGY")
        and insight_text
        and isinstance(insight_text, str)  # re.match rejects non-strings
    ):
        # Extract framework name (usually before the colon)
        match = re.match(r"^([^:]+):", insight_text)
        if match:
            themes.append(match.group(1).strip())

    # "source" may be null or a plain string rather than an object; only a
    # dict can carry a speaker.
    source = insight.get("source")
    speaker = source.get("speaker") if isinstance(source, dict) else None
    persons = [speaker] if speaker else []

    return {"themes": themes, "roles": [], "persons": persons}
|
|
215
|
+
|
|
216
|
+
|
|
217
|
+
# ---------------------------------------------------------------------------
|
|
218
|
+
# FORMAT DETECTOR
|
|
219
|
+
# ---------------------------------------------------------------------------
|
|
220
|
+
def detect_chunk_format(chunk):
    """
    Detect which format a chunk uses.

    Checks run from most to least specific, so order matters: a chunk that
    matches several signatures gets the first one listed below.

    Args:
        chunk: one chunk as loaded from JSON.

    Returns:
        "ah", "cg", "rag", "ss", or "unknown" (also returned for anything
        that is not a dict).
    """
    # On a str or list, "in" would do substring/element matching rather
    # than key lookup, so only dicts are inspected.
    if not isinstance(chunk, dict):
        return "unknown"

    if "key_concepts" in chunk and "section" in chunk:
        return "ah"
    if "temas" in chunk and "meta" in chunk:
        return "cg"

    # metadata can be null or a non-object; only a dict can carry the markers
    metadata = chunk.get("metadata")
    if isinstance(metadata, dict) and (
        "migrated_from_rag" in metadata or "theme" in metadata
    ):
        return "rag"

    if "topic" in chunk and "entities" in chunk:
        return "ss"

    # Looser fallbacks: a single marker field is enough
    if "key_concepts" in chunk:
        return "ah"
    if "temas" in chunk:
        return "cg"
    return "unknown"
|
|
237
|
+
|
|
238
|
+
|
|
239
|
+
# Dispatch table: format code -> processor function for that format.
# "unknown" deliberately has no entry.
FORMAT_PROCESSORS = {
    "ah": process_ah_format,
    "cg": process_cg_format,
    "rag": process_rag_format,
    "ss": process_ss_format,
}
|
|
245
|
+
|
|
246
|
+
|
|
247
|
+
# ---------------------------------------------------------------------------
|
|
248
|
+
# CORE: ANALYZE FILE
|
|
249
|
+
# ---------------------------------------------------------------------------
|
|
250
|
+
def analyze_chunk_file(filepath, registry=None):
    """
    Analyze a single chunk file. Extracts themes, persons, roles.

    Args:
        filepath: path to chunk .json file
        registry: shared ENTITY-REGISTRY dict; loaded with load_registry()
            when omitted

    Returns:
        On success:
        {
            "source_id": str,
            "themes_found": [str],
            "themes_new": [str],
            "roles_mentioned": [str],
            "persons_found": [str],
            "domains_touched": [str],
            "chunk_count": int,
            "format": str
        }
        On failure (missing file, unreadable or malformed JSON, top-level
        value that is not an object): {"error": str}
    """
    if registry is None:
        registry = load_registry()

    filepath = Path(filepath)
    if not filepath.exists():
        return {"error": f"File not found: {filepath}"}

    # Report unreadable or malformed files through the same "error" result
    # as a missing file, so one bad file cannot abort a whole scan.
    # json.JSONDecodeError and UnicodeDecodeError are both ValueError subclasses.
    try:
        with open(filepath, "r", encoding="utf-8") as f:
            data = json.load(f)
    except (OSError, ValueError) as exc:
        return {"error": f"Could not read {filepath}: {exc}"}

    if not isinstance(data, dict):
        return {"error": f"Unsupported JSON structure in {filepath}: expected an object"}

    source_id = data.get("source_id", data.get("source_hash", filepath.stem))

    # Handle both consolidated files (with "chunks" array) and individual chunk files
    if "chunks" in data:
        chunks = data["chunks"] or []  # tolerate "chunks": null
    elif "insights" in data:
        # Insight files
        return _analyze_insights_file(data, source_id, registry)
    else:
        # Individual chunk file (SS001 format)
        chunks = [data]

    all_themes = []
    all_persons = []
    all_roles = []
    detected_format = "unknown"

    for chunk in chunks:
        if not isinstance(chunk, dict):
            continue  # processors expect dicts
        fmt = detect_chunk_format(chunk)
        processor = FORMAT_PROCESSORS.get(fmt)
        if processor is None:
            continue  # "unknown" format: nothing to extract
        # The reported format is that of the last recognised chunk.
        detected_format = fmt

        result = processor(chunk, source_id)
        all_themes.extend(result["themes"])
        all_persons.extend(result["persons"])
        all_roles.extend(result["roles"])

    # Normalize and deduplicate. chunk_count includes skipped chunks.
    return _normalize_and_compile(
        all_themes, all_persons, all_roles,
        source_id, len(chunks), detected_format, registry
    )
|
|
315
|
+
|
|
316
|
+
|
|
317
|
+
def _analyze_insights_file(data, source_id, registry):
    """
    Analyze an insights file.

    Runs process_insight() over every entry in data["insights"], pools the
    extracted themes/persons/roles and hands them to
    _normalize_and_compile() with the format set to "insight".

    Args:
        data: parsed insights file (a dict).
        source_id: identifier passed through to the processors and result.
        registry: shared ENTITY-REGISTRY dict.

    Returns:
        The result dict built by _normalize_and_compile(); its chunk_count
        is data["insights_extracted"] when present, otherwise the number of
        insight entries.
    """
    insights = data.get("insights", [])

    themes, persons, roles = [], [], []
    for entry in insights:
        extracted = process_insight(entry, source_id)
        themes.extend(extracted["themes"])
        persons.extend(extracted["persons"])
        roles.extend(extracted["roles"])

    insight_count = data.get("insights_extracted", len(insights))
    return _normalize_and_compile(
        themes, persons, roles,
        source_id, insight_count, "insight", registry
    )
|
|
334
|
+
|
|
335
|
+
|
|
336
|
+
def _iter_normalized(raw_values, entity_type, registry, source_id):
    """
    Yield (normalized_text, normalize_entity result) per distinct raw value.

    Values whose normalized text is empty, shorter than 2 characters, or
    already seen in this call are skipped. Entities are registered with
    auto_save=False.
    """
    seen = set()
    for raw in raw_values:
        key = normalize_text(raw)
        if not key or len(key) < 2 or key in seen:
            continue
        seen.add(key)
        yield key, normalize_entity(
            raw, entity_type, registry=registry,
            source_id=source_id, auto_save=False
        )


def _normalize_and_compile(all_themes, all_persons, all_roles,
                           source_id, chunk_count, detected_format, registry):
    """
    Normalize extracted data and compile results.

    Themes, persons and roles are each normalized through normalize_entity()
    and deduplicated in first-seen order. Themes also contribute domains:
    via the alias table from get_domain_aliases() and via the "domain_ids"
    of the theme's registry entry.

    Returns:
        dict with source_id, themes_found, themes_new, roles_mentioned,
        persons_found, domains_touched (sorted), chunk_count and format.
    """
    domain_aliases = get_domain_aliases()

    # Themes: collect canonical names, newly created ones, and domains
    themes_found, themes_new = [], []
    domains_touched = set()
    for key, entity in _iter_normalized(all_themes, "theme", registry, source_id):
        canonical = entity["canonical"]
        themes_found.append(canonical)
        if entity["created"]:
            themes_new.append(canonical)

        # Map to domain
        if key in domain_aliases:
            domains_touched.add(domain_aliases[key])
        # Also check entity data for domain_ids
        theme_entry = registry.get("themes", {}).get(canonical, {})
        domains_touched.update(theme_entry.get("domain_ids", []))

    # Persons, then roles: only the canonical names are kept
    persons_found = [
        entity["canonical"]
        for _, entity in _iter_normalized(all_persons, "person", registry, source_id)
    ]
    roles_mentioned = [
        entity["canonical"]
        for _, entity in _iter_normalized(all_roles, "role", registry, source_id)
    ]

    def _unique(items):
        # Different raw values can share a canonical name; keep first-seen order.
        return list(dict.fromkeys(items))

    return {
        "source_id": source_id,
        "themes_found": _unique(themes_found),
        "themes_new": _unique(themes_new),
        "roles_mentioned": _unique(roles_mentioned),
        "persons_found": _unique(persons_found),
        "domains_touched": sorted(domains_touched),
        "chunk_count": chunk_count,
        "format": detected_format,
    }
|
|
415
|
+
|
|
416
|
+
|
|
417
|
+
# ---------------------------------------------------------------------------
|
|
418
|
+
# ANALYZE ALL CHUNKS
|
|
419
|
+
# ---------------------------------------------------------------------------
|
|
420
|
+
def analyze_all_chunks(registry=None, save=True):
    """
    Analyze ALL chunk and insight files.

    Scans every *.json file in CHUNKS_DIR and INSIGHTS_DIR (in sorted order,
    skipping the state/index files), analyzes each with analyze_chunk_file()
    and aggregates the results. Files whose result contains "error" are
    skipped.

    Args:
        registry: shared ENTITY-REGISTRY dict; loaded with load_registry()
            when omitted.
        save: when true, the registry is written back with save_registry()
            after the scan.

    Returns:
        {
            "total_files": int,
            "total_chunks": int,
            "all_themes": Counter,
            "all_persons": Counter,
            "all_roles": Counter,
            "all_domains": Counter,
            "new_themes": [str],
            "files_processed": [dict]
        }
        Each Counter counts the number of files an entry appeared in.
        total_chunks sums chunk files only; insight files are not added.
        new_themes is deduplicated in first-seen order.
    """
    if registry is None:
        registry = load_registry()

    all_themes = Counter()
    all_persons = Counter()
    all_roles = Counter()
    all_domains = Counter()
    new_themes = []
    files_processed = []
    total_chunks = 0

    def _record(fpath, result):
        """Fold one file's analysis result into the running aggregates."""
        files_processed.append({
            "file": fpath.name,
            "source_id": result["source_id"],
            "format": result["format"],
            "themes": len(result["themes_found"]),
            "new_themes": len(result["themes_new"]),
        })
        all_themes.update(result["themes_found"])
        all_persons.update(result["persons_found"])
        all_roles.update(result["roles_mentioned"])
        all_domains.update(result["domains_touched"])
        new_themes.extend(result["themes_new"])

    # Process chunk files
    chunk_skip = ("CHUNKS-STATE.json", "_INDEX.json", "_rag_export.json")
    for fpath in sorted(CHUNKS_DIR.glob("*.json")):
        # Skip state/index files
        if fpath.name in chunk_skip:
            continue

        result = analyze_chunk_file(fpath, registry=registry)
        if "error" in result:
            continue

        _record(fpath, result)
        total_chunks += result["chunk_count"]

    # Process insight files
    for fpath in sorted(INSIGHTS_DIR.glob("*.json")):
        if fpath.name == "INSIGHTS-STATE.json":
            continue

        result = analyze_chunk_file(fpath, registry=registry)
        if "error" in result:
            continue

        _record(fpath, result)

    if save:
        save_registry(registry)

    return {
        "total_files": len(files_processed),
        "total_chunks": total_chunks,
        "all_themes": all_themes,
        "all_persons": all_persons,
        "all_roles": all_roles,
        "all_domains": all_domains,
        # dict.fromkeys dedupes while keeping a stable, first-seen order
        # (a set's iteration order is arbitrary).
        "new_themes": list(dict.fromkeys(new_themes)),
        "files_processed": files_processed,
    }
|
|
518
|
+
|
|
519
|
+
|
|
520
|
+
# ---------------------------------------------------------------------------
|
|
521
|
+
# CLI
|
|
522
|
+
# ---------------------------------------------------------------------------
|
|
523
|
+
def main():
    """
    CLI: analyze chunk/insight files.

    With "--all" as first argument, runs a full scan (saving the registry)
    and prints a summary. With any other first argument, treats it as a file
    path and prints that file's analysis as JSON. With no argument, prints
    usage and exits with status 1.
    """
    args = sys.argv[1:]

    if not args:
        print("Uso:")
        print(" python3 theme_analyzer.py --all # Analyze all chunks + insights")
        print(" python3 theme_analyzer.py <filepath> # Analyze single file")
        sys.exit(1)

    if args[0] != "--all":
        # Single-file mode
        print("\n=== THEME ANALYZER: Single File ===\n")
        report = analyze_chunk_file(args[0])
        print(json.dumps(report, indent=2, ensure_ascii=False))
        return

    # Full-scan mode
    print("\n=== THEME ANALYZER: Full Scan ===\n")
    summary = analyze_all_chunks(save=True)
    print(f"Files processed: {summary['total_files']}")
    print(f"Total chunks: {summary['total_chunks']}")
    print(f"Themes found: {len(summary['all_themes'])}")
    print(f"New themes: {len(summary['new_themes'])}")
    print(f"Persons found: {len(summary['all_persons'])}")
    print(f"Roles found: {len(summary['all_roles'])}")
    print(f"Domains touched: {len(summary['all_domains'])}")

    # (heading, rows) for each ranked listing, most frequent first
    listings = (
        ("\n--- Top 20 Themes ---", summary["all_themes"].most_common(20)),
        ("\n--- Top 10 Persons ---", summary["all_persons"].most_common(10)),
        ("\n--- Domains ---", summary["all_domains"].most_common()),
    )
    for heading, rows in listings:
        print(heading)
        for label, count in rows:
            print(f" {count:4d}x {label}")


if __name__ == "__main__":
    main()
|