mega-brain-ai 1.3.0
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- package/.antigravity/README.md +46 -0
- package/.antigravity/rules/.gitkeep +0 -0
- package/.antigravity/rules/mega-brain.md +39 -0
- package/.claude/CLAUDE.md +172 -0
- package/.claude/agents.yaml +44 -0
- package/.claude/commands/agents.md +161 -0
- package/.claude/commands/ask.md +117 -0
- package/.claude/commands/benchmark.md +224 -0
- package/.claude/commands/chat.md +343 -0
- package/.claude/commands/compare.md +116 -0
- package/.claude/commands/conclave.md +196 -0
- package/.claude/commands/config.md +133 -0
- package/.claude/commands/create-agent.md +467 -0
- package/.claude/commands/debate.md +159 -0
- package/.claude/commands/documentation/create-architecture-documentation.md +175 -0
- package/.claude/commands/dossiers.md +180 -0
- package/.claude/commands/evolve.md +223 -0
- package/.claude/commands/extract-dna.md +172 -0
- package/.claude/commands/extract-knowledge.md +507 -0
- package/.claude/commands/gsd/add-phase.md +43 -0
- package/.claude/commands/gsd/add-tests.md +41 -0
- package/.claude/commands/gsd/add-todo.md +47 -0
- package/.claude/commands/gsd/audit-milestone.md +36 -0
- package/.claude/commands/gsd/check-todos.md +45 -0
- package/.claude/commands/gsd/cleanup.md +18 -0
- package/.claude/commands/gsd/complete-milestone.md +136 -0
- package/.claude/commands/gsd/debug.md +167 -0
- package/.claude/commands/gsd/discuss-phase.md +83 -0
- package/.claude/commands/gsd/execute-phase.md +41 -0
- package/.claude/commands/gsd/health.md +22 -0
- package/.claude/commands/gsd/help.md +22 -0
- package/.claude/commands/gsd/insert-phase.md +32 -0
- package/.claude/commands/gsd/join-discord.md +18 -0
- package/.claude/commands/gsd/list-phase-assumptions.md +46 -0
- package/.claude/commands/gsd/map-codebase.md +71 -0
- package/.claude/commands/gsd/new-milestone.md +44 -0
- package/.claude/commands/gsd/new-project.md +42 -0
- package/.claude/commands/gsd/pause-work.md +38 -0
- package/.claude/commands/gsd/plan-milestone-gaps.md +34 -0
- package/.claude/commands/gsd/plan-phase.md +45 -0
- package/.claude/commands/gsd/progress.md +24 -0
- package/.claude/commands/gsd/quick.md +41 -0
- package/.claude/commands/gsd/reapply-patches.md +110 -0
- package/.claude/commands/gsd/remove-phase.md +31 -0
- package/.claude/commands/gsd/research-phase.md +189 -0
- package/.claude/commands/gsd/resume-work.md +40 -0
- package/.claude/commands/gsd/set-profile.md +34 -0
- package/.claude/commands/gsd/settings.md +36 -0
- package/.claude/commands/gsd/update.md +37 -0
- package/.claude/commands/gsd/verify-work.md +38 -0
- package/.claude/commands/inbox.md +296 -0
- package/.claude/commands/ingest-empresa.md +191 -0
- package/.claude/commands/ingest.md +183 -0
- package/.claude/commands/jarvis-briefing.md +67 -0
- package/.claude/commands/jarvis-control.md +169 -0
- package/.claude/commands/jarvis-full.md +182 -0
- package/.claude/commands/jarvis.md +212 -0
- package/.claude/commands/ler-drive.md +212 -0
- package/.claude/commands/log.md +158 -0
- package/.claude/commands/loop.md +133 -0
- package/.claude/commands/loops.md +73 -0
- package/.claude/commands/mission-autopilot.md +538 -0
- package/.claude/commands/mission.md +353 -0
- package/.claude/commands/process-inbox.md +148 -0
- package/.claude/commands/process-jarvis.md +3036 -0
- package/.claude/commands/process-video.md +131 -0
- package/.claude/commands/rag-search.md +78 -0
- package/.claude/commands/resume.md +33 -0
- package/.claude/commands/save.md +38 -0
- package/.claude/commands/scan-inbox.md +125 -0
- package/.claude/commands/setup.md +99 -0
- package/.claude/commands/system-digest.md +243 -0
- package/.claude/commands/verify.md +182 -0
- package/.claude/commands/view-dna.md +169 -0
- package/.claude/get-shit-done/VERSION +1 -0
- package/.claude/get-shit-done/bin/gsd-tools.cjs +588 -0
- package/.claude/get-shit-done/bin/lib/commands.cjs +553 -0
- package/.claude/get-shit-done/bin/lib/config.cjs +162 -0
- package/.claude/get-shit-done/bin/lib/core.cjs +411 -0
- package/.claude/get-shit-done/bin/lib/frontmatter.cjs +299 -0
- package/.claude/get-shit-done/bin/lib/init.cjs +710 -0
- package/.claude/get-shit-done/bin/lib/milestone.cjs +216 -0
- package/.claude/get-shit-done/bin/lib/phase.cjs +871 -0
- package/.claude/get-shit-done/bin/lib/roadmap.cjs +298 -0
- package/.claude/get-shit-done/bin/lib/state.cjs +679 -0
- package/.claude/get-shit-done/bin/lib/template.cjs +222 -0
- package/.claude/get-shit-done/bin/lib/verify.cjs +773 -0
- package/.claude/get-shit-done/references/checkpoints.md +776 -0
- package/.claude/get-shit-done/references/continuation-format.md +249 -0
- package/.claude/get-shit-done/references/decimal-phase-calculation.md +65 -0
- package/.claude/get-shit-done/references/git-integration.md +248 -0
- package/.claude/get-shit-done/references/git-planning-commit.md +38 -0
- package/.claude/get-shit-done/references/model-profile-resolution.md +34 -0
- package/.claude/get-shit-done/references/model-profiles.md +92 -0
- package/.claude/get-shit-done/references/phase-argument-parsing.md +61 -0
- package/.claude/get-shit-done/references/planning-config.md +196 -0
- package/.claude/get-shit-done/references/questioning.md +145 -0
- package/.claude/get-shit-done/references/tdd.md +263 -0
- package/.claude/get-shit-done/references/ui-brand.md +160 -0
- package/.claude/get-shit-done/references/verification-patterns.md +612 -0
- package/.claude/get-shit-done/templates/DEBUG.md +164 -0
- package/.claude/get-shit-done/templates/UAT.md +247 -0
- package/.claude/get-shit-done/templates/VALIDATION.md +76 -0
- package/.claude/get-shit-done/templates/codebase/architecture.md +255 -0
- package/.claude/get-shit-done/templates/codebase/concerns.md +310 -0
- package/.claude/get-shit-done/templates/codebase/conventions.md +307 -0
- package/.claude/get-shit-done/templates/codebase/integrations.md +280 -0
- package/.claude/get-shit-done/templates/codebase/stack.md +186 -0
- package/.claude/get-shit-done/templates/codebase/structure.md +285 -0
- package/.claude/get-shit-done/templates/codebase/testing.md +480 -0
- package/.claude/get-shit-done/templates/config.json +37 -0
- package/.claude/get-shit-done/templates/context.md +283 -0
- package/.claude/get-shit-done/templates/continue-here.md +78 -0
- package/.claude/get-shit-done/templates/debug-subagent-prompt.md +91 -0
- package/.claude/get-shit-done/templates/discovery.md +146 -0
- package/.claude/get-shit-done/templates/milestone-archive.md +123 -0
- package/.claude/get-shit-done/templates/milestone.md +115 -0
- package/.claude/get-shit-done/templates/phase-prompt.md +569 -0
- package/.claude/get-shit-done/templates/planner-subagent-prompt.md +117 -0
- package/.claude/get-shit-done/templates/project.md +184 -0
- package/.claude/get-shit-done/templates/requirements.md +231 -0
- package/.claude/get-shit-done/templates/research-project/ARCHITECTURE.md +204 -0
- package/.claude/get-shit-done/templates/research-project/FEATURES.md +147 -0
- package/.claude/get-shit-done/templates/research-project/PITFALLS.md +200 -0
- package/.claude/get-shit-done/templates/research-project/STACK.md +120 -0
- package/.claude/get-shit-done/templates/research-project/SUMMARY.md +170 -0
- package/.claude/get-shit-done/templates/research.md +552 -0
- package/.claude/get-shit-done/templates/retrospective.md +54 -0
- package/.claude/get-shit-done/templates/roadmap.md +202 -0
- package/.claude/get-shit-done/templates/state.md +176 -0
- package/.claude/get-shit-done/templates/summary-complex.md +59 -0
- package/.claude/get-shit-done/templates/summary-minimal.md +41 -0
- package/.claude/get-shit-done/templates/summary-standard.md +48 -0
- package/.claude/get-shit-done/templates/summary.md +248 -0
- package/.claude/get-shit-done/templates/user-setup.md +311 -0
- package/.claude/get-shit-done/templates/verification-report.md +322 -0
- package/.claude/get-shit-done/workflows/add-phase.md +111 -0
- package/.claude/get-shit-done/workflows/add-tests.md +350 -0
- package/.claude/get-shit-done/workflows/add-todo.md +157 -0
- package/.claude/get-shit-done/workflows/audit-milestone.md +297 -0
- package/.claude/get-shit-done/workflows/check-todos.md +176 -0
- package/.claude/get-shit-done/workflows/cleanup.md +152 -0
- package/.claude/get-shit-done/workflows/complete-milestone.md +763 -0
- package/.claude/get-shit-done/workflows/diagnose-issues.md +219 -0
- package/.claude/get-shit-done/workflows/discovery-phase.md +289 -0
- package/.claude/get-shit-done/workflows/discuss-phase.md +542 -0
- package/.claude/get-shit-done/workflows/execute-phase.md +449 -0
- package/.claude/get-shit-done/workflows/execute-plan.md +448 -0
- package/.claude/get-shit-done/workflows/health.md +156 -0
- package/.claude/get-shit-done/workflows/help.md +489 -0
- package/.claude/get-shit-done/workflows/insert-phase.md +129 -0
- package/.claude/get-shit-done/workflows/list-phase-assumptions.md +178 -0
- package/.claude/get-shit-done/workflows/map-codebase.md +315 -0
- package/.claude/get-shit-done/workflows/new-milestone.md +382 -0
- package/.claude/get-shit-done/workflows/new-project.md +1116 -0
- package/.claude/get-shit-done/workflows/pause-work.md +122 -0
- package/.claude/get-shit-done/workflows/plan-milestone-gaps.md +274 -0
- package/.claude/get-shit-done/workflows/plan-phase.md +569 -0
- package/.claude/get-shit-done/workflows/progress.md +381 -0
- package/.claude/get-shit-done/workflows/quick.md +453 -0
- package/.claude/get-shit-done/workflows/remove-phase.md +154 -0
- package/.claude/get-shit-done/workflows/research-phase.md +73 -0
- package/.claude/get-shit-done/workflows/resume-project.md +306 -0
- package/.claude/get-shit-done/workflows/set-profile.md +80 -0
- package/.claude/get-shit-done/workflows/settings.md +213 -0
- package/.claude/get-shit-done/workflows/transition.md +544 -0
- package/.claude/get-shit-done/workflows/update.md +219 -0
- package/.claude/get-shit-done/workflows/verify-phase.md +242 -0
- package/.claude/get-shit-done/workflows/verify-work.md +569 -0
- package/.claude/gsd-file-manifest.json +144 -0
- package/.claude/hooks/agent_creation_trigger.py +168 -0
- package/.claude/hooks/agent_index_updater.py +255 -0
- package/.claude/hooks/agent_memory_persister.py +203 -0
- package/.claude/hooks/claude_md_agent_sync.py +162 -0
- package/.claude/hooks/claude_md_guard.py +154 -0
- package/.claude/hooks/continuous_save.py +414 -0
- package/.claude/hooks/creation_validator.py +360 -0
- package/.claude/hooks/enforce_dual_location.py +501 -0
- package/.claude/hooks/enforce_plan_mode.py +220 -0
- package/.claude/hooks/gsd-check-update.js +62 -0
- package/.claude/hooks/gsd-context-monitor.js +122 -0
- package/.claude/hooks/gsd-statusline.js +108 -0
- package/.claude/hooks/inbox_age_alert.py +367 -0
- package/.claude/hooks/ledger_updater.py +303 -0
- package/.claude/hooks/memory_hints_injector.py +251 -0
- package/.claude/hooks/memory_updater.py +202 -0
- package/.claude/hooks/notification_system.py +115 -0
- package/.claude/hooks/pending_tracker.py +188 -0
- package/.claude/hooks/pipeline_checkpoint.py +583 -0
- package/.claude/hooks/post_batch_cascading.py +1740 -0
- package/.claude/hooks/post_tool_use.py +120 -0
- package/.claude/hooks/quality_watchdog.py +394 -0
- package/.claude/hooks/ralph_wiggum.py +286 -0
- package/.claude/hooks/session-source-sync.py +223 -0
- package/.claude/hooks/session_autosave_v2.py +1135 -0
- package/.claude/hooks/session_end.py +203 -0
- package/.claude/hooks/session_start.py +939 -0
- package/.claude/hooks/skill_indexer.py +48 -0
- package/.claude/hooks/skill_router.py +358 -0
- package/.claude/hooks/stop_hook_completeness.py +187 -0
- package/.claude/hooks/user_prompt_submit.py +125 -0
- package/.claude/package.json +1 -0
- package/.claude/rules/ANTHROPIC-STANDARDS.md +384 -0
- package/.claude/rules/CLAUDE-LITE.md +201 -0
- package/.claude/rules/RULE-GROUP-1.md +320 -0
- package/.claude/rules/RULE-GROUP-2.md +307 -0
- package/.claude/rules/RULE-GROUP-3.md +248 -0
- package/.claude/rules/RULE-GROUP-4.md +427 -0
- package/.claude/rules/RULE-GROUP-5.md +388 -0
- package/.claude/rules/RULE-GROUP-6.md +387 -0
- package/.claude/rules/RULE-GSD-MANDATORY.md +106 -0
- package/.claude/rules/agent-cognition.md +779 -0
- package/.claude/rules/agent-integrity.md +692 -0
- package/.claude/rules/epistemic-standards.md +333 -0
- package/.claude/rules/logging.md +53 -0
- package/.claude/rules/mcp-governance.md +128 -0
- package/.claude/rules/pipeline.md +60 -0
- package/.claude/rules/state-management.md +93 -0
- package/.claude/scripts/apply-tags.py +77 -0
- package/.claude/scripts/batch-extract-transcriptions.py +132 -0
- package/.claude/scripts/build-complete-index.py +250 -0
- package/.claude/scripts/build-planilha-index.py +170 -0
- package/.claude/scripts/complete-tag-matching.py +250 -0
- package/.claude/scripts/deduplicate-inbox.py +139 -0
- package/.claude/scripts/docx-xml-extractor.py +141 -0
- package/.claude/scripts/extract-docx-text.py +58 -0
- package/.claude/scripts/extract-single-transcription.py +74 -0
- package/.claude/scripts/extract_docx_from_gdrive.py +77 -0
- package/.claude/scripts/jarvis_orchestrator.py +5 -0
- package/.claude/scripts/organized-downloader.py +246 -0
- package/.claude/scripts/planilha-tagger.py +187 -0
- package/.claude/scripts/revert-tags.py +70 -0
- package/.claude/scripts/source-sync.py +265 -0
- package/.claude/scripts/tag-inbox-files.py +276 -0
- package/.claude/scripts/tag-inbox-v2.py +253 -0
- package/.claude/scripts/test-extraction.py +35 -0
- package/.claude/scripts/test-full-extraction.py +74 -0
- package/.claude/scripts/validate_cascading_integrity.py +409 -0
- package/.claude/settings.json +215 -0
- package/.claude/skills/DETECTION-PROTOCOL.md +217 -0
- package/.claude/skills/README.md +240 -0
- package/.claude/skills/SKILL-REGISTRY.md +283 -0
- package/.claude/skills/SKILL-SUGGESTIONS.md +114 -0
- package/.claude/skills/_TEMPLATES/SKILL-WRITER-GUIDE.md +385 -0
- package/.claude/skills/agent-creation/SKILL.md +374 -0
- package/.claude/skills/ask-company/SKILL.md +198 -0
- package/.claude/skills/brainstorming/SKILL.md +72 -0
- package/.claude/skills/chronicler/SKILL.md +146 -0
- package/.claude/skills/chronicler/chronicler_core.py +468 -0
- package/.claude/skills/code-review/SKILL.md +160 -0
- package/.claude/skills/convert-to-company-docs/SKILL.md +68 -0
- package/.claude/skills/convert-to-company-docs/convert.py +532 -0
- package/.claude/skills/dispatching-parallel-agents/SKILL.md +193 -0
- package/.claude/skills/docs-megabrain/SKILL.md +251 -0
- package/.claude/skills/executing-plans/SKILL.md +114 -0
- package/.claude/skills/executor/SKILL.md +161 -0
- package/.claude/skills/fase-2-5-tagging/SKILL.md +182 -0
- package/.claude/skills/feature-dev/SKILL.md +154 -0
- package/.claude/skills/frontend-design/SKILL.md +165 -0
- package/.claude/skills/gdrive-transcription-downloader/SKILL.md +249 -0
- package/.claude/skills/gemini-fallback/SKILL.md +67 -0
- package/.claude/skills/gemini-fallback/gemini_fetch.py +0 -0
- package/.claude/skills/gha/SKILL.md +96 -0
- package/.claude/skills/gha/gha_diagnostic.py +227 -0
- package/.claude/skills/github-workflow/SKILL.md +190 -0
- package/.claude/skills/hookify/SKILL.md +134 -0
- package/.claude/skills/hybrid-source-reading/SKILL.md +265 -0
- package/.claude/skills/jarvis/SKILL.md +546 -0
- package/.claude/skills/jarvis-briefing/SKILL.md +340 -0
- package/.claude/skills/knowledge-extraction/SKILL.md +318 -0
- package/.claude/skills/ler-planilha/SKILL.md +281 -0
- package/.claude/skills/pipeline-jarvis/SKILL.md +430 -0
- package/.claude/skills/plugin-dev/SKILL.md +176 -0
- package/.claude/skills/pr-review-toolkit/SKILL.md +178 -0
- package/.claude/skills/process-company-inbox/SKILL.md +183 -0
- package/.claude/skills/python-megabrain/SKILL.md +323 -0
- package/.claude/skills/resume/SKILL.md +61 -0
- package/.claude/skills/save/SKILL.md +87 -0
- package/.claude/skills/skill-creator-internal/SKILL.md +186 -0
- package/.claude/skills/skill-writer/SKILL.md +153 -0
- package/.claude/skills/skill-writer/examples.md +191 -0
- package/.claude/skills/skill-writer/troubleshooting.md +205 -0
- package/.claude/skills/smart-download-tagger/SKILL.md +148 -0
- package/.claude/skills/source-sync/SKILL.md +240 -0
- package/.claude/skills/sync-docs/SKILL.md +193 -0
- package/.claude/skills/sync-docs/config.json +37 -0
- package/.claude/skills/sync-docs/gdrive_sync.py +358 -0
- package/.claude/skills/sync-docs/reauth.py +71 -0
- package/.claude/skills/using-superpowers/SKILL.md +105 -0
- package/.claude/skills/verification-before-completion/SKILL.md +130 -0
- package/.claude/skills/verify/SKILL.md +154 -0
- package/.claude/skills/verify/verify_runner.py +0 -0
- package/.claude/skills/verify-6-levels/SKILL.md +234 -0
- package/.claude/skills/writing-plans/SKILL.md +184 -0
- package/.claude/templates/BATCH-LOG-TEMPLATE.md +221 -0
- package/.claudeignore +9 -0
- package/.cursor/agents.yaml +44 -0
- package/.cursor/rules/mega-brain.md +39 -0
- package/.gitattributes +19 -0
- package/.github/CODEOWNERS +8 -0
- package/.github/ISSUE_TEMPLATE/agent.md +96 -0
- package/.github/ISSUE_TEMPLATE/bug.md +67 -0
- package/.github/ISSUE_TEMPLATE/feature.md +56 -0
- package/.github/ISSUE_TEMPLATE/pipeline.md +70 -0
- package/.github/PULL_REQUEST_TEMPLATE.md +30 -0
- package/.github/assets/banner.svg +152 -0
- package/.github/assets/logo-dark.svg +79 -0
- package/.github/assets/social-preview.png +0 -0
- package/.github/layer1-allowlist.txt +196 -0
- package/.github/layer2-manifest.txt +42 -0
- package/.github/layer3-manifest.txt +94 -0
- package/.github/workflows/claude-code-pr.yml +198 -0
- package/.github/workflows/claude-code-review.yml +57 -0
- package/.github/workflows/claude.yml +76 -0
- package/.github/workflows/publish-pro.yml +72 -0
- package/.github/workflows/publish.yml +86 -0
- package/.github/workflows/verification.yml +251 -0
- package/.gitignore +244 -0
- package/.gitleaks.toml +118 -0
- package/.windsurf/agents.yaml +44 -0
- package/.windsurf/rules/mega-brain.md +39 -0
- package/CONTRIBUTING.md +62 -0
- package/QUICK-START.md +231 -0
- package/README.md +168 -0
- package/agents/AGENT-INDEX.yaml +107 -0
- package/agents/MASTER-AGENT.md +612 -0
- package/agents/README.md +48 -0
- package/agents/_templates/INDEX.md +741 -0
- package/agents/_templates/TEMPLATE-AGENT-MD-ULTRA-ROBUSTO-V3.md +2399 -0
- package/agents/boardroom/CHECKLIST-MASTER.md +281 -0
- package/agents/boardroom/INTEGRATION-GUIDE.md +406 -0
- package/agents/boardroom/README.md +238 -0
- package/agents/boardroom/config/BOARDROOM-CONFIG.md +186 -0
- package/agents/boardroom/config/TTS-INTEGRATION.md +258 -0
- package/agents/boardroom/config/VOICE-PROFILES.md +624 -0
- package/agents/boardroom/scripts/audio_generator.py +375 -0
- package/agents/boardroom/scripts/audio_generator_edge.py +353 -0
- package/agents/boardroom/scripts/jarvis_boardroom_hook.py +415 -0
- package/agents/boardroom/scripts/notebooklm_generator.py +578 -0
- package/agents/boardroom/templates/EPISODE-TEMPLATE.md +367 -0
- package/agents/boardroom/templates/scene-templates/SCENE-AGENT-DEBATE.md +252 -0
- package/agents/boardroom/templates/scene-templates/SCENE-COUNCIL.md +270 -0
- package/agents/boardroom/templates/scene-templates/SCENE-DNA-CONSULTATION.md +126 -0
- package/agents/boardroom/templates/scene-templates/SCENE-QUESTION.md +174 -0
- package/agents/boardroom/workflows/WORKFLOW-AUDIO-GENERATION.md +421 -0
- package/agents/conclave/CRITIC.md +197 -0
- package/agents/conclave/DEVILS-ADVOCATE.md +274 -0
- package/agents/conclave/README.md +35 -0
- package/agents/conclave/SYNTHESIZER.md +293 -0
- package/agents/conclave/advogado-do-diabo/AGENT.md +502 -0
- package/agents/conclave/advogado-do-diabo/SOUL.md +100 -0
- package/agents/conclave/critico-metodologico/AGENT.md +683 -0
- package/agents/conclave/critico-metodologico/SOUL.md +107 -0
- package/agents/conclave/sintetizador/AGENT.md +571 -0
- package/agents/conclave/sintetizador/SOUL.md +94 -0
- package/agents/constitution/BASE-CONSTITUTION.md +254 -0
- package/agents/persona-registry.yaml +300 -0
- package/agents/sua-empresa/.gitkeep +0 -0
- package/agents/sua-empresa/README.md +44 -0
- package/agents/sua-empresa/_example/jds/EXAMPLE-JD.md +42 -0
- package/agents/sua-empresa/_example/org/EXAMPLE-ORG.md +32 -0
- package/agents/sua-empresa/_example/roles/EXAMPLE-ROLE.md +38 -0
- package/artifacts/README.md +11 -0
- package/artifacts/canonical/.gitkeep +0 -0
- package/artifacts/chunks/.gitkeep +0 -0
- package/artifacts/insights/.gitkeep +0 -0
- package/artifacts/narratives/.gitkeep +0 -0
- package/bin/cli.js +2 -0
- package/bin/lib/ascii-art.js +202 -0
- package/bin/lib/feature-gate.js +46 -0
- package/bin/lib/installer.js +593 -0
- package/bin/lib/license.js +59 -0
- package/bin/lib/pro-commands.js +75 -0
- package/bin/lib/setup-wizard.js +547 -0
- package/bin/lib/validate-email.js +113 -0
- package/bin/mega-brain.js +136 -0
- package/bin/pre-publish-gate.js +229 -0
- package/bin/push.js +1056 -0
- package/bin/templates/env.example +27 -0
- package/bin/utils/pro-detector.js +50 -0
- package/bin/validate-package.js +190 -0
- package/core/__init__.py +2 -0
- package/core/glossary/INDEX.md +63 -0
- package/core/glossary/digital.md +243 -0
- package/core/glossary/finance.md +49 -0
- package/core/glossary/marketing.md +69 -0
- package/core/glossary/operations.md +50 -0
- package/core/glossary/sales.md +690 -0
- package/core/intelligence/__init__.py +41 -0
- package/core/intelligence/agent_trigger.py +468 -0
- package/core/intelligence/audit_layers.py +491 -0
- package/core/intelligence/autonomous_processor.py +796 -0
- package/core/intelligence/bootstrap_registry.py +550 -0
- package/core/intelligence/business_model_detector.py +476 -0
- package/core/intelligence/dossier_trigger.py +336 -0
- package/core/intelligence/entity_normalizer.py +565 -0
- package/core/intelligence/org_chain_detector.py +411 -0
- package/core/intelligence/review_dashboard.py +338 -0
- package/core/intelligence/role_detector.py +855 -0
- package/core/intelligence/session_autosave.py +46 -0
- package/core/intelligence/skill_generator.py +601 -0
- package/core/intelligence/sow_generator.py +711 -0
- package/core/intelligence/sync_package_files.py +504 -0
- package/core/intelligence/task_orchestrator.py +780 -0
- package/core/intelligence/theme_analyzer.py +562 -0
- package/core/intelligence/tool_discovery.py +432 -0
- package/core/intelligence/validate_json_integrity.py +106 -0
- package/core/intelligence/validate_layers.py +310 -0
- package/core/intelligence/verify_classifications.py +94 -0
- package/core/intelligence/viability_scorer.py +592 -0
- package/core/jarvis/02-JARVIS-SOUL.md +390 -0
- package/core/jarvis/03-JARVIS-DNA.yaml +312 -0
- package/core/jarvis/AGENT.md +191 -0
- package/core/jarvis/agent-creator/AGENT.md +199 -0
- package/core/jarvis/agent-creator/SOUL.md +82 -0
- package/core/jarvis/agent-creator/tasks/create-agent.md +133 -0
- package/core/jarvis/agent-creator/tasks/sync-agents.md +100 -0
- package/core/jarvis/agent-creator/workflows/wf-create-agent.yaml +110 -0
- package/core/jarvis/agent-creator/workflows/wf-pipeline-trigger.yaml +111 -0
- package/core/jarvis/autonomous/benchmark/AGENT.md +347 -0
- package/core/jarvis/autonomous/benchmark/SOUL.md +78 -0
- package/core/jarvis/autonomous/critic/AGENT.md +324 -0
- package/core/jarvis/autonomous/critic/SOUL.md +78 -0
- package/core/jarvis/autonomous/evolver/AGENT.md +294 -0
- package/core/jarvis/autonomous/evolver/SOUL.md +85 -0
- package/core/jarvis/autonomous/playbook-generator/AGENT.md +399 -0
- package/core/jarvis/autonomous/playbook-generator/SOUL.md +80 -0
- package/core/patterns/_ROLE_PATTERNS.yaml +547 -0
- package/core/patterns/quality_gates.yaml +259 -0
- package/core/patterns/trigger_config.yaml +193 -0
- package/core/schemas/SCHEMA-INDEX.md +94 -0
- package/core/schemas/canonical-map.schema.json +98 -0
- package/core/schemas/chunks-state.schema.json +131 -0
- package/core/schemas/decisions-registry.schema.json +120 -0
- package/core/schemas/file-registry.schema.json +69 -0
- package/core/schemas/insights-state.schema.json +111 -0
- package/core/schemas/narratives-state.schema.json +150 -0
- package/core/tasks/CHANGELOG.md +55 -0
- package/core/tasks/TASK-REGISTRY.md +113 -0
- package/core/tasks/_templates/task-tmpl.md +105 -0
- package/core/tasks/analyze-themes.md +84 -0
- package/core/tasks/detect-role.md +82 -0
- package/core/tasks/extract-dna.md +114 -0
- package/core/tasks/normalize-entities.md +82 -0
- package/core/tasks/process-batch.md +111 -0
- package/core/tasks/validate-cascade.md +105 -0
- package/core/templates/README.md +27 -0
- package/core/templates/agents/dna-config-template.yaml +181 -0
- package/core/templates/agents/enrichment-protocol.md +408 -0
- package/core/templates/agents/memory-template.md +567 -0
- package/core/templates/agents/reasoning-model.md +331 -0
- package/core/templates/agents/soul-template.md +416 -0
- package/core/templates/agents/template-evolution.md +544 -0
- package/core/templates/debates/CONCLAVE-LOG-TEMPLATE-v2.md +309 -0
- package/core/templates/debates/conclave-log-template.md +309 -0
- package/core/templates/debates/conclave-protocol.md +518 -0
- package/core/templates/debates/debate-dynamics-config.yaml +322 -0
- package/core/templates/debates/debate-dynamics.md +613 -0
- package/core/templates/debates/debate-protocol.md +323 -0
- package/core/templates/logs/LOG-TEMPLATES.md +1068 -0
- package/core/templates/logs/batch-visual-template.md +841 -0
- package/core/templates/logs/log-structure.md +65 -0
- package/core/templates/logs/visual-diff.md +159 -0
- package/core/templates/phases/dossier-compilation.md +790 -0
- package/core/templates/phases/narrative-metabolism.md +292 -0
- package/core/templates/phases/narrative-synthesis.md +278 -0
- package/core/templates/phases/phase4-checkpoint.md +146 -0
- package/core/templates/phases/prompt-1.1-chunking.md +154 -0
- package/core/templates/phases/prompt-1.2-entity-resolution.md +186 -0
- package/core/templates/phases/prompt-2.1-dna-tags.md +208 -0
- package/core/templates/phases/prompt-2.1-insight-extraction.md +191 -0
- package/core/templates/phases/prompt-3.1-narrative.md +331 -0
- package/core/templates/phases/sources-compilation.md +340 -0
- package/core/workflows/PIPELINE-JARVIS-DOCS.md +606 -0
- package/core/workflows/wf-conclave.yaml +139 -0
- package/core/workflows/wf-extract-dna.yaml +158 -0
- package/core/workflows/wf-ingest.yaml +88 -0
- package/core/workflows/wf-pipeline-full.yaml +138 -0
- package/docs/API-KEYS-GUIDE.md +372 -0
- package/docs/INTEGRATION-POINTS.md +501 -0
- package/docs/LAYERS.md +403 -0
- package/docs/PLAN-MODE-PROTOCOL.md +388 -0
- package/docs/RESTORE-AND-INDEX.md +203 -0
- package/docs/TAG-RESOLVER-IMPLEMENTATION.md +597 -0
- package/docs/conselho.md +337 -0
- package/docs/context7-readme.md +28 -0
- package/docs/jarvis-logging-protocol.md +380 -0
- package/docs/pipeline-completa-v4.md +1315 -0
- package/docs/prompts/meta_agente_mapeamento_processos.md +297 -0
- package/docs/quick-start.md +197 -0
- package/docs/readme-ralph-cascateamento.md +207 -0
- package/docs/template-master.md +727 -0
- package/docs/templates/phase5/IMPLEMENTATION-GUIDE.md +355 -0
- package/docs/templates/phase5/MOGA-BRAIN-PHASE5-TEMPLATES.md +1284 -0
- package/docs/templates/phase5/README.md +165 -0
- package/docs/workflow-continuous-claude.md +2232 -0
- package/inbox/.gitkeep +0 -0
- package/inbox/README.md +15 -0
- package/knowledge/NAVIGATION-MAP.json +292 -0
- package/knowledge/README.md +11 -0
- package/knowledge/dna/.gitkeep +0 -0
- package/knowledge/dossiers/persons/.gitkeep +0 -0
- package/knowledge/dossiers/system/.gitkeep +0 -0
- package/knowledge/dossiers/themes/.gitkeep +0 -0
- package/knowledge/playbooks/.gitkeep +0 -0
- package/knowledge/sources/.gitkeep +0 -0
- package/logs/.gitkeep +0 -0
- package/logs/README.md +11 -0
- package/package.json +180 -0
- package/requirements.txt +4 -0
|
@@ -0,0 +1,253 @@
|
|
|
1
|
+
#!/usr/bin/env python3
|
|
2
|
+
"""
|
|
3
|
+
FASE 2.5 v2 - Tagueamento por MATCHING DE NOMES
|
|
4
|
+
Mega Brain - Sistema de Inteligência de Negócios
|
|
5
|
+
|
|
6
|
+
ABORDAGEM CORRETA:
|
|
7
|
+
1. Extrair de TODAS as abas: nome_video → TAG
|
|
8
|
+
2. Para cada arquivo INBOX, fazer matching por nome similar
|
|
9
|
+
3. Se match encontrado, usar TAG da planilha
|
|
10
|
+
4. Se não, manter órfão
|
|
11
|
+
"""
|
|
12
|
+
|
|
13
|
+
import os
|
|
14
|
+
import re
|
|
15
|
+
import json
|
|
16
|
+
from pathlib import Path
|
|
17
|
+
from datetime import datetime
|
|
18
|
+
from difflib import SequenceMatcher
|
|
19
|
+
|
|
20
|
+
# Configuration (relative paths, resolved against the current working directory)
|
|
21
|
+
INBOX_PATH = "inbox"
|
|
22
|
+
SCHEMA_PATH = ".claude/mission-control/SPREADSHEET-SCHEMA.json"
|
|
23
|
+
INDEX_PATH = ".claude/mission-control/PLANILHA-INDEX.json"
|
|
24
|
+
OUTPUT_PATH = ".claude/mission-control/TAG-MAPPING-V2.json"
|
|
25
|
+
|
|
26
|
+
def normalize_name(name):
    """Normalize a file/video name into a comparison key for fuzzy matching.

    The transformations are applied in this order: drop the extension,
    lowercase, strip a trailing ``_<14 digits>`` timestamp, strip dates such
    as ``12-25-24``, strip a leading ordinal number, strip bracketed
    segments, strip ``(n)`` duplicate counters, replace remaining
    punctuation with spaces and collapse runs of whitespace.

    Args:
        name: File name, normally including its extension.

    Returns:
        The normalized name. It may be an empty string when nothing
        meaningful is left (e.g. ``"[TAG].pdf"``).
    """
    # Drop the extension (everything from the last dot onwards).
    name = os.path.splitext(name)[0]
    name = name.lower()

    # Trailing "_" + 14 digits (timestamp suffix, e.g. _20240101120000).
    name = re.sub(r'_\d{14}$', '', name)
    # Dates such as 12-25-24 anywhere in the name.
    name = re.sub(r'\d{1,2}-\d{1,2}-\d{2,4}', '', name)

    # Leading ordinal such as "01 - " or "3. ".
    name = re.sub(r'^\d+[\s\.\-]+', '', name)

    # Bracketed segments: "[youtube.com ...]" first, then any other "[...]".
    name = re.sub(r'\[youtube\.com[^\]]*\]', '', name)
    name = re.sub(r'\[[^\]]*\]', '', name)

    # Duplicate counters "(1)", "(2)", ... are replaced by a single space so
    # that the words on either side are not glued together
    # ("aula (2) final" -> "aula final", not "aulafinal"). Extra whitespace
    # is collapsed below, so a trailing counter still vanishes completely.
    name = re.sub(r'\s*\(\d+\)\s*', ' ', name)

    # Remaining punctuation becomes whitespace. Note that "\w" keeps
    # underscores, so "a_b" is NOT split into two words.
    name = re.sub(r'[^\w\s]', ' ', name)
    name = re.sub(r'\s+', ' ', name).strip()
    return name
|
|
46
|
+
|
|
47
|
+
def similar(a, b):
    """Return the similarity of two names as a ratio between 0 and 1.

    Args:
        a: First name.
        b: Second name.

    Returns:
        ``difflib.SequenceMatcher`` ratio of ``a`` against ``b``
        (1.0 means identical, 0.0 means nothing in common).
    """
    matcher = SequenceMatcher(isjunk=None, a=a, b=b)
    return matcher.ratio()
|
|
50
|
+
|
|
51
|
+
def load_planilha_index():
    """Load the spreadsheet index (name -> TAG) stored at ``INDEX_PATH``.

    The file is opened directly instead of being checked with
    ``os.path.exists`` first, so there is no window in which the file can
    disappear between the check and the open.

    Returns:
        The parsed JSON content of the index file, or ``None`` when the
        file does not exist.

    Raises:
        json.JSONDecodeError: If the file exists but is not valid JSON.
    """
    try:
        with open(INDEX_PATH, 'r', encoding='utf-8') as f:
            return json.load(f)
    except (FileNotFoundError, NotADirectoryError):
        # Missing file (or a missing/non-directory path component): there is
        # no index yet, which callers detect through the None result.
        return None
|
|
57
|
+
|
|
58
|
+
def scan_inbox_files():
    """Walk ``INBOX_PATH`` and describe every .txt/.docx/.pdf file found.

    Directories whose path contains ``_BACKUP`` or ``_TEMPLATE`` are ignored.

    Returns:
        A list with one dict per file, holding the keys ``path``,
        ``filename``, ``folder``, ``parent_folder``, ``normalized`` (the
        result of ``normalize_name``) and ``has_tag`` (True when the file
        name starts with a ``[TAG]`` prefix).
    """
    wanted_suffixes = {'.txt', '.docx', '.pdf'}
    found = []

    for current_dir, _subdirs, names in os.walk(INBOX_PATH):
        # Skip anything living under a backup/template directory.
        if '_BACKUP' in current_dir or '_TEMPLATE' in current_dir:
            continue

        for filename in names:
            suffix = os.path.splitext(filename)[1].lower()
            if suffix not in wanted_suffixes:
                continue

            found.append({
                'path': str(Path(current_dir) / filename),
                'filename': filename,
                'folder': os.path.basename(current_dir),
                'parent_folder': os.path.basename(os.path.dirname(current_dir)),
                'normalized': normalize_name(filename),
                # A leading "[...]" made of word characters/hyphens means
                # the file already carries a TAG.
                'has_tag': bool(re.match(r'^\[[\w-]+\]', filename)),
            })

    return found
|
|
85
|
+
|
|
86
|
+
def match_file_to_index(file_info, index, threshold=0.7):
    """Find the index entry whose normalized name best matches a file.

    Similarity is the ``difflib.SequenceMatcher`` ratio between
    ``file_info['normalized']`` and each ``entry['normalized']``. Because the
    full ratio is expensive, the cheap upper bounds ``real_quick_ratio()``
    and ``quick_ratio()`` are checked first; an entry whose upper bound
    cannot beat the current best (or reach the threshold) is skipped without
    computing the exact ratio. The result is identical to comparing every
    entry exhaustively.

    Args:
        file_info: Dict with at least the key ``'normalized'``.
        index: Dict with an ``'entries'`` list; every entry needs a
            ``'normalized'`` key.
        threshold: Minimum similarity (0-1) for an entry to be accepted.

    Returns:
        ``(entry, score)`` for the best entry at or above the threshold (the
        first one wins on ties), or ``(None, 0)`` when the file has an empty
        normalized name or no entry qualifies.
    """
    normalized_name = file_info['normalized']

    if not normalized_name:
        return None, 0

    best_match = None
    best_score = 0

    def improves(score):
        # A candidate must strictly beat the current best AND reach the
        # threshold; reads the current value of best_score on every call.
        return score > best_score and score >= threshold

    for entry in index['entries']:
        matcher = SequenceMatcher(None, normalized_name, entry['normalized'])

        # Both quick ratios are upper bounds on ratio(): if either cannot
        # improve on the best so far, the exact ratio cannot either.
        if not (improves(matcher.real_quick_ratio())
                and improves(matcher.quick_ratio())):
            continue

        score = matcher.ratio()
        if improves(score):
            best_score = score
            best_match = entry

    return best_match, best_score
|
|
104
|
+
|
|
105
|
+
def main(execute=False, threshold=0.7):
    """Match INBOX files against the spreadsheet index and optionally tag them.

    The run loads the index, scans the INBOX, matches every untagged file
    against the index, and writes a JSON report to ``OUTPUT_PATH``. When
    ``execute`` is true, each matched file is renamed to
    ``"[<tag>] <original name>"`` and the report is rewritten with the
    execution outcome.

    Args:
        execute: When true, rename the matched files; otherwise only report.
        threshold: Minimum similarity passed to ``match_file_to_index``.

    Returns:
        The report dict, or ``None`` when the index is missing or empty.
    """
    banner = "=" * 60

    print(banner)
    print("FASE 2.5 v2 - TAGUEAMENTO POR MATCHING")
    print(banner)
    print()

    # 1. Load the spreadsheet index.
    print("[1/4] Carregando índice da planilha...")
    index = load_planilha_index()
    if not index:
        print(" ERRO: Índice não encontrado!")
        print(" Execute primeiro: /criar-indice-planilha")
        return None
    print(f" {len(index['entries'])} entradas no índice")

    # 2. Scan the INBOX.
    print("[2/4] Escaneando INBOX...")
    files = scan_inbox_files()
    print(f" {len(files)} arquivos encontrados")

    # 3. Match every file that does not carry a tag yet.
    print(f"[3/4] Matching (threshold={threshold})...")

    matched = []
    orphans = []
    already_tagged = []

    for file_info in files:
        if file_info['has_tag']:
            already_tagged.append(file_info)
            continue

        match, score = match_file_to_index(file_info, index, threshold)
        if match:
            matched.append({'file': file_info, 'match': match, 'score': score})
        else:
            orphans.append(file_info)

    print(f" Já tagueados: {len(already_tagged)}")
    print(f" Match encontrado: {len(matched)}")
    print(f" Órfãos: {len(orphans)}")

    # 4. Build and save the report.
    print("[4/4] Gerando relatório...")

    report = {
        'timestamp': datetime.now().isoformat(),
        'threshold': threshold,
        'summary': {
            'total_files': len(files),
            'already_tagged': len(already_tagged),
            'matched': len(matched),
            'orphans': len(orphans)
        },
        'matches': [
            {
                'current_path': m['file']['path'],
                'filename': m['file']['filename'],
                'folder': m['file']['folder'],
                'matched_to': m['match']['original_name'],
                'tag': m['match']['tag'],
                'sheet': m['match']['sheet'],
                'score': round(m['score'], 3)
            }
            for m in matched
        ],
        'orphans': [
            {
                'path': o['path'],
                'filename': o['filename'],
                'folder': o['folder'],
                'normalized': o['normalized']
            }
            for o in orphans
        ]
    }

    with open(OUTPUT_PATH, 'w', encoding='utf-8') as report_file:
        json.dump(report, report_file, ensure_ascii=False, indent=2)

    print()
    print(banner)
    print("RELATÓRIO GERADO")
    print(banner)
    print(f"Arquivo: {OUTPUT_PATH}")

    # 5. Rename the matched files when requested.
    if not execute:
        print()
        print("PRÓXIMO PASSO: Execute com --execute para renomear")
        print(f" Threshold atual: {threshold}")
        print(" Use --threshold=0.6 para matching mais flexível")
    elif not matched:
        # --execute was given but nothing matched: do not tell the user to
        # pass --execute again, only point at the threshold.
        print()
        print("Nenhum match encontrado: nada para renomear")
        print(f" Threshold atual: {threshold}")
        print(" Use --threshold=0.6 para matching mais flexível")
    else:
        print()
        print(banner)
        print("EXECUTANDO RENOMEAÇÃO")
        print(banner)

        success = 0
        errors = []

        for m in matched:
            filepath = Path(m['file']['path'])
            tag = m['match']['tag']
            new_path = filepath.parent / f"[{tag}] {filepath.name}"

            # Never overwrite an existing file; record the collision instead.
            if new_path.exists():
                errors.append({'path': str(filepath), 'error': 'Destino já existe'})
                continue

            try:
                filepath.rename(new_path)
            except OSError as exc:
                # Best effort: one failed rename must not abort the batch.
                errors.append({'path': str(filepath), 'error': str(exc)})
                continue

            success += 1
            if success % 50 == 0:
                print(f" Renomeados: {success}/{len(matched)}")

        print()
        print(f"Sucesso: {success}")
        print(f"Erros: {len(errors)}")

        report['execution'] = {
            'success': success,
            'errors': len(errors),
            'error_details': errors
        }

        # Rewrite the report so it also carries the execution outcome.
        with open(OUTPUT_PATH, 'w', encoding='utf-8') as report_file:
            json.dump(report, report_file, ensure_ascii=False, indent=2)

    return report
|
|
244
|
+
|
|
245
|
+
|
|
246
|
+
if __name__ == '__main__':
    import sys

    # Command line: "--execute" enables renaming, "--threshold=<float>"
    # overrides the default similarity threshold (the last occurrence wins).
    cli_args = sys.argv
    execute = '--execute' in cli_args

    threshold = 0.7
    for token in cli_args:
        if not token.startswith('--threshold='):
            continue
        threshold = float(token.split('=')[1])

    main(execute=execute, threshold=threshold)
|
|
@@ -0,0 +1,35 @@
|
|
|
1
|
+
#!/usr/bin/env python3
|
|
2
|
+
"""
|
|
3
|
+
Test extraction of text from base64-encoded .docx
|
|
4
|
+
"""
|
|
5
|
+
|
|
6
|
+
import base64
|
|
7
|
+
import subprocess
|
|
8
|
+
import tempfile
|
|
9
|
+
import os
|
|
10
|
+
|
|
11
|
+
# Base64 content from Google Drive (truncated for test - will use full content)
|
|
12
|
+
base64_content = """UEsDBBQACAgIACc2JVwAAAAAAAAAAAAAAAASAAAAd29yZC9udW1iZXJpbmcueG1s7VrLjtowFP2C/gOK1OWQJ4FBA7PoaKpWo6pqpx9gEkMs/IhsB2a+oYvu2m2/rV9SJyHhTRMaBEheBe71PfYxh3t0pdzdvxDcmkEuEKMDw25bRgvSgIWITgbGt+fHm57REhLQEGBG4cB4hcK4H765m/dpQkaQq3UtBUFFnwQDI5Iy7pumCCJIgGizGFKVHDNOgFRf+cQkgE+T+CZgJAYSjRBG8tV0LMs3FjBsYCSc9hcQNwQFnAk2lmlJn43HKICLR1HBq+yblzywICGQymxHk0OszsCoiFAsCjRyLJpKRgXI7BCJGcHFunlcZbeQg7m6Z4LzjeaMhzFnARRCRR/yZIloWxUuMIUoK6ocYX3P4iQEIFrCpOrYACr3bqu9F5eWQS2JLO9C4CoHyVNPaMQBf90+BTjiPlfrY1RJxRsIqkomvBTkMRBBBLgsAPAxCJgFUxi+A3QGSjGHk0py3kAKEZhwQJYiFbV+WdvakMvXCMRwiTb5P7T3nCXxUu7eMWgr/0C7Uw/A2QLw6wH0tgEC+HIchqkqV3FQWA/HL3FQ0Q+qAUggpiJFuDXDRRfMQuVfYLsp78RRH9PaFMqxVEMGQdaQjaEyGDASkqvAp4S01r59UCztbAmeYZVC6jEwrCyivIpLFZsBnC4yh7lTPZIyGMIAEYDzlKp8hi9l7q3dLuMfgyKK4Vjm4fgzTx+IhiqXhgdG11GWOe9HgE4yz3R9K11rlot5/kgKNKp8dLEiS5nZbpts7IpsMJtD/gSlhHw3I6c2I9vzTkLJqUPpCyOA7mbk1mbk2P5JGLlNSM6rT6fXOwkdrynNdWpTUgxOQqnTkOb82ow89zSNwW9Cc93adDrWaZpCtynN9epT6p6mK/Qa0txtbUa+11RjMNcM959u7BztxqMEYyh3XsCfXz+uzIwPkvl+bT58iM3P39fmwc0K7dwW3KzSzu2+zSrt3M7brNLO7bzNKu3cxtus0s7tuc0q7dy+23rq1dPvtTivnn4v3X/19HvhJqyn30t2Y09Pv3r6vWwP1tPv5bqvnn4v13j19HuBftvRfqv9Vvut9lvtt9pvtd824bc081m6+m7Vmumu0TSzlVtlzv4y50CZu7/MPVDm7S/zDpR19pd1VsvMlRecg39BLRwiffbMDUQIVcjZ93vxiwcNT9w4T8y1SycPygam3DNJkExw1DDBjTPBadmcct6QoAtFA4PkhWcNL9w4L7RJRGPGNfXvCG7s5I8OevMgU4ZHM3NCUteDPUTGeLrRMMbNb0LX2wi6iGjKZQJGg+WuxI9DbZX5csgyRUGfIPli44ab54spAPfBVUi9IPlg65b44II38s4u+SIIg3SBQ28uID6DXPfgY/V3wmX/9AaD09fxm6+Wy/7o9Oxk/2zyT193909JMDntnh4dvdgP0m3/tAl/V0LmR0u9jjZvxCwJLjpyCyL3mlqggSRdCX90ntkFJvic7Nghx3MOW+6eT6VgToNdHWsX8sEy/VeWowiRkx9/Rk5eEWvrFvj7pCgz8JuyFkFA/H2CC5LmguoxNh4wOflRA9cbwlIfp3C8nhbBzH4uYxokg+82DP4ZGPx59/iQPHjOB4nT4dK2yLEakX1raZSgO+qLgDj+BUU17pS59KlwVFgKvI263NCMDRRwvYpC7bbydDmwRsPjv4zHiz7J5ExJFhA3vzFUu7pXaIdopiI8K9oIgRLPJx8k9S5A2tO+lYAHooTI18shUBq+/mV8/VTFYnIMP3pOBwyrlSKcNyAG78bw/nCV2zQxXKIFgqXdHg6Z7uEX4HvfmdhxfYh8vRyapuHrX+jH8W0KLrY7dY1OA2LvQzA1pLEauHu+sNylNnEhMvZyIKCGsX8pYyuHGhPkVcZkWMr6GX3P5qwM7zGBR+XvqQauRleJNO7jwlbSoWJD5PDl
IE0Nh/8yDp9DQnYl7CRLJOTUgRIQx59dBegESwU0uekXljjtGSVyS0Pk8OXwWj/P4asZar01Zn5GuRZjeNtHoOoKbj5jUSI5ME1A7PyCS56itvabxkhz+Eh7TPs+tDjG5TxzhsjTwVeduRNhsYMbrHByHdlbvTDym7M3J/shBo4Pgq+acjckZAdLfNw9CdkmJ0XW3OtZaf8QV3F7KRNp+26G/z89uD+NKr6eC46TB9j0lqakj3XeiNKkL/BTiLC0g/ZnZIAVMZw/vc40ejB87ckj7NhByYOywn6LsHcRtyxuYekXDn8kXKPyILGqBzu3xByruYFaIkMeNshH0zYtpXNtWk4YFeQBzZgE5YHgGiroUNMw2aDp3VIJme/ocev09CzqV1oN4IspyvseoOlQaJBG1XJAnXZjVPmyrXLyIeKqQ2bWlS6BXGEisx6WQ63czILf1ZfnC4Y8UACaEIQV4sIvB+toFv6je+fVdgH9KdL5inZVDEzlCN8AWC4gRGZYDgvRMMPHmOEZwxoBmPTbIcdsipIJHhhzsBy+4eeZoSZbp2dKCDV6mGcdciRjptnkTxRxraAPLHsPJgFPWcypDTa8fhB8T5C7sWm6wWYXd2/TdLh/+OqYPOu+3H9xcNS91E0pkCVcriDHTrNdmjmZGGKSCt8SvB25ZuFqxsPlKmTczHrf3fdlhJkdBC5RujPtLOg7RUcqzTQi04rO0aoPL9SI+5OD7S54uFzFjIZPPsYnB7nxLa5UprQt6iWU/PLaqp5gmCyUMZ1S3G4ByxhLbY7VPpGRpOUyp+HyzHLVNX6eZ2pidnflEGF+xYbrYq0N+dG2aiGygFN0oxIyB98R4jZs6zcn+5N/nPxDSA2F/+4xSUE/g0JapbbMz16dvNgPqjHzt5MPMQNbKs4j6nNl8ZWJRYxBG2J94/mGLa0L5QoL87sAmU7+mDLt9CYxWOrQ+a5Mjm/fII3zhZB/5WpvkRSGRdafnw1OseNDAkz2aHe7jfOP4PPmk40n+FlpDuSHJQSqaqqtZ8RscIPiE/eUtSqF09te81iFz7H4V3L5TaNNZ/Y1YfCi09M3dl8pW34t7vAyT8+wsSA8LHbXmHkJymdfy/vHY/chVlGOr9av/h+AUEsHCElAgyk3IAAAeckBAFBLAwQUAAgICAAnNiVcAAAAAAAAAAAAAAAAEQAAAHdvcmQvc2V0dGluZ3MueG1spZZLktowEIZPkDtQ2oMfA2RCjZlFpiZZZFaQA8iSbKvQqyQZD7ePZFs2j1TKkBXS391fy0275ZfXT85mR6INlSIDySIGMyKQxFSUGfi9f58/g5mxUGDIpCAZOBEDXrdfXpqNIdY6LzNzBGE2HGWgslZtosiginBoFlIR4YyF1Bxat9VlxKE+1GqOJFfQ0pwyak9RGsdr0GNkBmotNj1izinS0sjC+pCNLAqKSP8TIvSUvF3Im0Q1J8K2GSNNmDuDFKaiygQaf5TmjFWAHP/1EEfOgl+jpmTDGjau0Jx1iRqpsdISEWOc+tYZB2ISTyigRwwRU45wmTOchEMqBoxvjivQkHvhcvdFa1Hjg4y1MGzKQTrTL5prqE+3p4AP1PM8XtFJXXxFcFG21kNDPoJAFdQ2ANgjBCbRgeDvUBzh0My4nNTOVyRMYakhH5vU3PXPJvFVu+wqqMhIK/+P9kPLWo3tvnyEdvYGJqv7AOkNYH0f4PkWgMjnY4zIRZ5zKL6Psx44NMyDaQALzcF4wrcI91OwlYZX4HYo/5Xjlj7Wo9LYDWSI2oEMtu5+ITwneK9rsj8p8i6d16zZHKEbEwmIvAMmBayZ3cN8Z6UKxq9p3Jm7O2Zc7br7aoCsgFsKyN3curiOPiQm3lRrOr2aPmV0kZPpnQ8iH1CpLm1eJhlgtKxs4vnW7bC7DttNXqa9LW1taWdrNxAhVyPn3S9GLQ3amd9T0J5GbRm05aitgrYatXXQ1l6rXN01o+LgyhCWXi8kY7Ih+Odov5H6eoRv
hO0fUEsHCLVCXjdPAgAAaAgAAFBLAwQUAAgICAAnNiVcAAAAAAAAAAAAAAAAEgAAAHdvcmQvZm9udFRhYmxlLnhtbKWVS27bMBCGT9A7CNzblI3USAXLQdEg3XTX9gATkpII84UhZcW3L2Xr4dpBICsrSRz93wzJn8Pt05tWyUGgl9bkZLVMSSIMs1yaMid//7wsHkniAxgOyhqRk6Pw5Gn3ZdtkhTXBJ1FufKZZTqoQXEapZ5XQ4JfWCRODhUUNIX5iSTXgvnYLZrWDIF+lkuFI12m6IR3G5qRGk3WIhZYMrbdFaCWZLQrJRPfoFTgl71nybFmthQmnjBSFijVY4yvpfE/Tc2kxWPWQw0eTOGjV/9e4Kdk4QhP3QqtzosYid2iZ8D6OPp+DA3GVTljAFjEoppTwf86+Eg3SDJjWGVegIfcy5u4W7YQaJzKuhVdTCjmHfslXBDzeVgEz1vNS7+QkF18RoirUOBhyDoJVgKEHqDkEZdle8B9gDjCYmZeT7HxF4hJKBD2a1N+1s6v0yi6/K3BipJWfo/1EW7vR7g9zaBcncPX1PsD6BrC5D/B4C2DibR6DRuUlR/L7OJuBI/t+MA0QwO99S/hGedcFT0PDEbhtyu9y4murbVHrNDZkYKeGTHbd5ZI0mQEdO8t3lKAI3W1pd+vs/gFQSwcIoGOcdbcBAAC3BgAAUEsDBBQACAgIACc2JVwAAAAAAAAAAAAAAAAPAAAAd29yZC9zdHlsZXMueG1s"""
|
|
13
|
+
|
|
14
|
+
# Decode the embedded payload, write it to disk and inspect it as a ZIP archive.
try:
    docx_bytes = base64.b64decode(base64_content)
    print(f"Decoded {len(docx_bytes)} bytes")

    # Persist the decoded bytes so zipfile can inspect them on disk.
    output_path = '/tmp/test_doc.docx'
    with open(output_path, 'wb') as out:
        out.write(docx_bytes)

    print("Saved to /tmp/test_doc.docx")

    # A .docx file is a ZIP container; list its first members when it is valid.
    import zipfile
    if not zipfile.is_zipfile(output_path):
        print("Not a valid ZIP file - content may be truncated")
    else:
        print("Valid ZIP/DOCX structure detected")
        with zipfile.ZipFile(output_path, 'r') as archive:
            print("Contents:", archive.namelist()[:5])

except Exception as e:
    print(f"Error: {e}")
|
|
@@ -0,0 +1,74 @@
|
|
|
1
|
+
#!/usr/bin/env python3
|
|
2
|
+
"""
|
|
3
|
+
Test script to verify extraction works with known base64 content
|
|
4
|
+
"""
|
|
5
|
+
|
|
6
|
+
import base64
|
|
7
|
+
import tempfile
|
|
8
|
+
import zipfile
|
|
9
|
+
import re
|
|
10
|
+
from xml.etree import ElementTree as ET
|
|
11
|
+
|
|
12
|
+
WORD_NAMESPACE = '{http://schemas.openxmlformats.org/wordprocessingml/2006/main}'

def extract_text_from_xml(xml_content: str) -> str:
    """Return the plain text held in a WordprocessingML document.

    Text comes from ``w:t`` elements; a line break is emitted at every
    ``w:br`` and before each ``w:p`` that follows earlier text. Runs of
    spaces/tabs collapse to one space and blank-line runs collapse to a
    single blank line.

    When ``xml_content`` cannot be parsed as XML, the text of every
    ``<w:t>`` element is pulled out with a regular expression, joined with
    single spaces, and its character/entity references are decoded so the
    result matches what the XML parser would have produced.

    Args:
        xml_content: The XML source, e.g. the contents of
            ``word/document.xml``.

    Returns:
        The extracted text.
    """
    try:
        root = ET.fromstring(xml_content)
    except ET.ParseError:
        # Local import: only the fallback path needs it.
        import html

        fragments = re.findall(r'<w:t[^>]*>([^<]*)</w:t>', xml_content)
        # The regex captures raw markup, so "&amp;" and friends must be
        # decoded by hand here.
        return html.unescape(' '.join(fragments))

    # Build the qualified tag names once instead of on every element.
    text_tag = f'{WORD_NAMESPACE}t'
    paragraph_tag = f'{WORD_NAMESPACE}p'
    break_tag = f'{WORD_NAMESPACE}br'

    texts = []
    for elem in root.iter():
        if elem.tag == text_tag:
            if elem.text:
                texts.append(elem.text)
        elif elem.tag == paragraph_tag:
            # Separate paragraphs, but never start the output with a newline
            # or stack two separators.
            if texts and not texts[-1].endswith('\n'):
                texts.append('\n')
        elif elem.tag == break_tag:
            texts.append('\n')

    text = ''.join(texts)
    text = re.sub(r'[ \t]+', ' ', text)
    text = re.sub(r'\n\s*\n', '\n\n', text)
    return text.strip()
|
|
36
|
+
|
|
37
|
+
# Read the base64-encoded .docx from TEST_FILE and print the text it contains.
TEST_FILE = ".claude/temp/full_base64.txt"

try:
    with open(TEST_FILE, 'r') as f:
        base64_content = f.read().strip()

    print(f"Read {len(base64_content)} chars of base64")

    docx_bytes = base64.b64decode(base64_content)
    print(f"Decoded to {len(docx_bytes)} bytes")

    # Save temporarily and check structure. The temporary file is deleted
    # when the ``with`` block exits, so repeated runs leave nothing behind.
    # zipfile receives the open handle rather than the file name, so the
    # file never has to be opened a second time.
    with tempfile.NamedTemporaryFile(suffix='.docx') as tmp:
        tmp.write(docx_bytes)
        tmp.flush()
        tmp.seek(0)

        if zipfile.is_zipfile(tmp):
            print("Valid ZIP/DOCX structure")
            with zipfile.ZipFile(tmp, 'r') as z:
                files = z.namelist()
                print(f"Contains {len(files)} files")
                if 'word/document.xml' in files:
                    xml_content = z.read('word/document.xml').decode('utf-8')
                    print(f"document.xml: {len(xml_content)} chars")
                    text = extract_text_from_xml(xml_content)
                    print(f"\nExtracted text ({len(text)} chars, {len(text.split())} words):")
                    print("="*60)
                    # Slicing already returns the whole string when it is short.
                    print(text[:2000])
                    print("="*60)
        else:
            print("Not a valid ZIP file")

except FileNotFoundError:
    print(f"Test file not found: {TEST_FILE}")
    print("Please save base64 content to this file first")
except Exception as e:
    print(f"Error: {e}")
|