@jaguilar87/gaia 5.0.0-rc1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (609):
  1. package/.claude-plugin/marketplace.json +33 -0
  2. package/.claude-plugin/plugin.json +26 -0
  3. package/ARCHITECTURE.md +335 -0
  4. package/CHANGELOG.md +1212 -0
  5. package/CODE_OF_CONDUCT.md +11 -0
  6. package/CONTRIBUTING.md +146 -0
  7. package/INSTALL.md +436 -0
  8. package/LICENSE +21 -0
  9. package/README.md +222 -0
  10. package/SECURITY.md +47 -0
  11. package/agents/README.md +78 -0
  12. package/agents/cloud-troubleshooter.md +73 -0
  13. package/agents/developer.md +65 -0
  14. package/agents/gaia-operator.md +64 -0
  15. package/agents/gaia-orchestrator.md +237 -0
  16. package/agents/gaia-planner.md +53 -0
  17. package/agents/gaia-system.md +70 -0
  18. package/agents/gitops-operator.md +61 -0
  19. package/agents/terraform-architect.md +63 -0
  20. package/bin/README.md +106 -0
  21. package/bin/cli/__init__.py +1 -0
  22. package/bin/cli/approvals.py +740 -0
  23. package/bin/cli/cleanup.py +562 -0
  24. package/bin/cli/context.py +283 -0
  25. package/bin/cli/doctor.py +628 -0
  26. package/bin/cli/history.py +305 -0
  27. package/bin/cli/memory.py +464 -0
  28. package/bin/cli/metrics.py +1068 -0
  29. package/bin/cli/plans.py +515 -0
  30. package/bin/cli/status.py +302 -0
  31. package/bin/cli/update.py +382 -0
  32. package/bin/gaia +112 -0
  33. package/bin/gaia-cleanup.js +531 -0
  34. package/bin/gaia-doctor.js +635 -0
  35. package/bin/gaia-evidence +126 -0
  36. package/bin/gaia-history.js +251 -0
  37. package/bin/gaia-metrics.js +1278 -0
  38. package/bin/gaia-review.js +269 -0
  39. package/bin/gaia-scan +44 -0
  40. package/bin/gaia-scan.py +589 -0
  41. package/bin/gaia-skills-diagnose.js +929 -0
  42. package/bin/gaia-status.js +278 -0
  43. package/bin/gaia-uninstall.js +111 -0
  44. package/bin/gaia-update.js +816 -0
  45. package/bin/pre-publish-validate.js +610 -0
  46. package/bin/python-detect.js +60 -0
  47. package/commands/README.md +64 -0
  48. package/commands/gaia.md +37 -0
  49. package/commands/scan-project.md +67 -0
  50. package/config/README.md +71 -0
  51. package/config/cloud/aws.json +134 -0
  52. package/config/cloud/gcp.json +139 -0
  53. package/config/context-contracts.json +158 -0
  54. package/config/crons-schema.md +81 -0
  55. package/config/git_standards.json +72 -0
  56. package/config/surface-routing.json +421 -0
  57. package/config/universal-rules.json +102 -0
  58. package/dist/gaia-ops/.claude-plugin/plugin.json +24 -0
  59. package/dist/gaia-ops/README.md +80 -0
  60. package/dist/gaia-ops/agents/cloud-troubleshooter.md +73 -0
  61. package/dist/gaia-ops/agents/developer.md +65 -0
  62. package/dist/gaia-ops/agents/gaia-operator.md +64 -0
  63. package/dist/gaia-ops/agents/gaia-orchestrator.md +237 -0
  64. package/dist/gaia-ops/agents/gaia-planner.md +53 -0
  65. package/dist/gaia-ops/agents/gaia-system.md +70 -0
  66. package/dist/gaia-ops/agents/gitops-operator.md +61 -0
  67. package/dist/gaia-ops/agents/terraform-architect.md +63 -0
  68. package/dist/gaia-ops/commands/gaia.md +37 -0
  69. package/dist/gaia-ops/config/README.md +71 -0
  70. package/dist/gaia-ops/config/cloud/aws.json +134 -0
  71. package/dist/gaia-ops/config/cloud/gcp.json +139 -0
  72. package/dist/gaia-ops/config/context-contracts.json +158 -0
  73. package/dist/gaia-ops/config/crons-schema.md +81 -0
  74. package/dist/gaia-ops/config/git_standards.json +72 -0
  75. package/dist/gaia-ops/config/surface-routing.json +421 -0
  76. package/dist/gaia-ops/config/universal-rules.json +102 -0
  77. package/dist/gaia-ops/hooks/adapters/__init__.py +52 -0
  78. package/dist/gaia-ops/hooks/adapters/base.py +219 -0
  79. package/dist/gaia-ops/hooks/adapters/channel.py +17 -0
  80. package/dist/gaia-ops/hooks/adapters/claude_code.py +1890 -0
  81. package/dist/gaia-ops/hooks/adapters/types.py +194 -0
  82. package/dist/gaia-ops/hooks/adapters/utils.py +25 -0
  83. package/dist/gaia-ops/hooks/hooks.json +163 -0
  84. package/dist/gaia-ops/hooks/modules/__init__.py +15 -0
  85. package/dist/gaia-ops/hooks/modules/agents/__init__.py +29 -0
  86. package/dist/gaia-ops/hooks/modules/agents/contract_validator.py +647 -0
  87. package/dist/gaia-ops/hooks/modules/agents/response_contract.py +496 -0
  88. package/dist/gaia-ops/hooks/modules/agents/skill_injection_verifier.py +120 -0
  89. package/dist/gaia-ops/hooks/modules/agents/state_tracker.py +267 -0
  90. package/dist/gaia-ops/hooks/modules/agents/task_info_builder.py +74 -0
  91. package/dist/gaia-ops/hooks/modules/agents/transcript_analyzer.py +458 -0
  92. package/dist/gaia-ops/hooks/modules/agents/transcript_reader.py +152 -0
  93. package/dist/gaia-ops/hooks/modules/audit/__init__.py +28 -0
  94. package/dist/gaia-ops/hooks/modules/audit/event_detector.py +168 -0
  95. package/dist/gaia-ops/hooks/modules/audit/logger.py +131 -0
  96. package/dist/gaia-ops/hooks/modules/audit/metrics.py +134 -0
  97. package/dist/gaia-ops/hooks/modules/audit/workflow_auditor.py +611 -0
  98. package/dist/gaia-ops/hooks/modules/audit/workflow_recorder.py +296 -0
  99. package/dist/gaia-ops/hooks/modules/context/__init__.py +11 -0
  100. package/dist/gaia-ops/hooks/modules/context/agentic_loop_detector.py +165 -0
  101. package/dist/gaia-ops/hooks/modules/context/anchor_tracker.py +317 -0
  102. package/dist/gaia-ops/hooks/modules/context/compact_context_builder.py +218 -0
  103. package/dist/gaia-ops/hooks/modules/context/context_freshness.py +145 -0
  104. package/dist/gaia-ops/hooks/modules/context/context_injector.py +558 -0
  105. package/dist/gaia-ops/hooks/modules/context/context_writer.py +530 -0
  106. package/dist/gaia-ops/hooks/modules/context/contracts_loader.py +161 -0
  107. package/dist/gaia-ops/hooks/modules/core/__init__.py +40 -0
  108. package/dist/gaia-ops/hooks/modules/core/hook_entry.py +78 -0
  109. package/dist/gaia-ops/hooks/modules/core/paths.py +160 -0
  110. package/dist/gaia-ops/hooks/modules/core/plugin_mode.py +149 -0
  111. package/dist/gaia-ops/hooks/modules/core/plugin_setup.py +577 -0
  112. package/dist/gaia-ops/hooks/modules/core/state.py +179 -0
  113. package/dist/gaia-ops/hooks/modules/core/stdin.py +24 -0
  114. package/dist/gaia-ops/hooks/modules/events/__init__.py +1 -0
  115. package/dist/gaia-ops/hooks/modules/events/event_writer.py +210 -0
  116. package/dist/gaia-ops/hooks/modules/memory/__init__.py +8 -0
  117. package/dist/gaia-ops/hooks/modules/memory/episode_writer.py +216 -0
  118. package/dist/gaia-ops/hooks/modules/orchestrator/__init__.py +1 -0
  119. package/dist/gaia-ops/hooks/modules/orchestrator/delegate_mode.py +122 -0
  120. package/dist/gaia-ops/hooks/modules/scanning/__init__.py +8 -0
  121. package/dist/gaia-ops/hooks/modules/scanning/scan_trigger.py +84 -0
  122. package/dist/gaia-ops/hooks/modules/security/__init__.py +120 -0
  123. package/dist/gaia-ops/hooks/modules/security/approval_cleanup.py +87 -0
  124. package/dist/gaia-ops/hooks/modules/security/approval_constants.py +23 -0
  125. package/dist/gaia-ops/hooks/modules/security/approval_grants.py +1638 -0
  126. package/dist/gaia-ops/hooks/modules/security/approval_messages.py +71 -0
  127. package/dist/gaia-ops/hooks/modules/security/approval_scopes.py +222 -0
  128. package/dist/gaia-ops/hooks/modules/security/blocked_commands.py +595 -0
  129. package/dist/gaia-ops/hooks/modules/security/blocked_message_formatter.py +87 -0
  130. package/dist/gaia-ops/hooks/modules/security/command_semantics.py +181 -0
  131. package/dist/gaia-ops/hooks/modules/security/composition_rules.py +547 -0
  132. package/dist/gaia-ops/hooks/modules/security/flag_classifiers.py +873 -0
  133. package/dist/gaia-ops/hooks/modules/security/gitops_validator.py +179 -0
  134. package/dist/gaia-ops/hooks/modules/security/mutative_verbs.py +1131 -0
  135. package/dist/gaia-ops/hooks/modules/security/network_hosts.py +481 -0
  136. package/dist/gaia-ops/hooks/modules/security/prompt_validator.py +40 -0
  137. package/dist/gaia-ops/hooks/modules/security/shell_unwrapper.py +165 -0
  138. package/dist/gaia-ops/hooks/modules/security/tiers.py +196 -0
  139. package/dist/gaia-ops/hooks/modules/session/__init__.py +10 -0
  140. package/dist/gaia-ops/hooks/modules/session/pending_scanner.py +174 -0
  141. package/dist/gaia-ops/hooks/modules/session/session_context_writer.py +100 -0
  142. package/dist/gaia-ops/hooks/modules/session/session_event_injector.py +160 -0
  143. package/dist/gaia-ops/hooks/modules/session/session_manager.py +31 -0
  144. package/dist/gaia-ops/hooks/modules/session/session_registry.py +232 -0
  145. package/dist/gaia-ops/hooks/modules/tools/__init__.py +29 -0
  146. package/dist/gaia-ops/hooks/modules/tools/bash_validator.py +1008 -0
  147. package/dist/gaia-ops/hooks/modules/tools/cloud_pipe_validator.py +231 -0
  148. package/dist/gaia-ops/hooks/modules/tools/hook_response.py +55 -0
  149. package/dist/gaia-ops/hooks/modules/tools/shell_parser.py +227 -0
  150. package/dist/gaia-ops/hooks/modules/tools/stage_decomposer.py +315 -0
  151. package/dist/gaia-ops/hooks/modules/tools/task_validator.py +294 -0
  152. package/dist/gaia-ops/hooks/modules/validation/__init__.py +23 -0
  153. package/dist/gaia-ops/hooks/modules/validation/commit_validator.py +380 -0
  154. package/dist/gaia-ops/hooks/post_compact.py +43 -0
  155. package/dist/gaia-ops/hooks/post_tool_use.py +54 -0
  156. package/dist/gaia-ops/hooks/pre_compact.py +60 -0
  157. package/dist/gaia-ops/hooks/pre_tool_use.py +413 -0
  158. package/dist/gaia-ops/hooks/session_start.py +81 -0
  159. package/dist/gaia-ops/hooks/stop_hook.py +82 -0
  160. package/dist/gaia-ops/hooks/subagent_start.py +71 -0
  161. package/dist/gaia-ops/hooks/subagent_stop.py +295 -0
  162. package/dist/gaia-ops/hooks/task_completed.py +70 -0
  163. package/dist/gaia-ops/hooks/user_prompt_submit.py +246 -0
  164. package/dist/gaia-ops/settings.json +72 -0
  165. package/dist/gaia-ops/skills/README.md +154 -0
  166. package/dist/gaia-ops/skills/agent-protocol/SKILL.md +93 -0
  167. package/dist/gaia-ops/skills/agent-protocol/examples.md +223 -0
  168. package/dist/gaia-ops/skills/agent-response/SKILL.md +69 -0
  169. package/dist/gaia-ops/skills/agentic-loop/SKILL.md +80 -0
  170. package/dist/gaia-ops/skills/agentic-loop/reference.md +378 -0
  171. package/dist/gaia-ops/skills/blog-writing/SKILL.md +98 -0
  172. package/dist/gaia-ops/skills/blog-writing/reference.md +130 -0
  173. package/dist/gaia-ops/skills/brief-spec/SKILL.md +182 -0
  174. package/dist/gaia-ops/skills/command-execution/SKILL.md +64 -0
  175. package/dist/gaia-ops/skills/command-execution/reference.md +83 -0
  176. package/dist/gaia-ops/skills/context-updater/SKILL.md +87 -0
  177. package/dist/gaia-ops/skills/context-updater/examples.md +71 -0
  178. package/dist/gaia-ops/skills/developer-patterns/SKILL.md +50 -0
  179. package/dist/gaia-ops/skills/developer-patterns/reference.md +112 -0
  180. package/dist/gaia-ops/skills/execution/SKILL.md +99 -0
  181. package/dist/gaia-ops/skills/fast-queries/SKILL.md +43 -0
  182. package/dist/gaia-ops/skills/gaia-compact/SKILL.md +74 -0
  183. package/dist/gaia-ops/skills/gaia-patterns/SKILL.md +108 -0
  184. package/dist/gaia-ops/skills/gaia-patterns/reference.md +395 -0
  185. package/dist/gaia-ops/skills/gaia-planner/SKILL.md +37 -0
  186. package/dist/gaia-ops/skills/gaia-planner/reference.md +107 -0
  187. package/dist/gaia-ops/skills/gaia-release/SKILL.md +82 -0
  188. package/dist/gaia-ops/skills/gaia-release/reference.md +102 -0
  189. package/dist/gaia-ops/skills/gaia-self-check/SKILL.md +114 -0
  190. package/dist/gaia-ops/skills/gaia-self-check/reference.md +453 -0
  191. package/dist/gaia-ops/skills/gaia-verify/SKILL.md +77 -0
  192. package/dist/gaia-ops/skills/gaia-verify/reference.md +80 -0
  193. package/dist/gaia-ops/skills/git-conventions/SKILL.md +47 -0
  194. package/dist/gaia-ops/skills/gitops-patterns/SKILL.md +60 -0
  195. package/dist/gaia-ops/skills/gitops-patterns/reference.md +183 -0
  196. package/dist/gaia-ops/skills/gmail-policy/SKILL.md +200 -0
  197. package/dist/gaia-ops/skills/gmail-policy/reference.md +150 -0
  198. package/dist/gaia-ops/skills/gmail-triage/SKILL.md +100 -0
  199. package/dist/gaia-ops/skills/gws-setup/SKILL.md +99 -0
  200. package/dist/gaia-ops/skills/gws-setup/reference.md +73 -0
  201. package/dist/gaia-ops/skills/investigation/SKILL.md +100 -0
  202. package/dist/gaia-ops/skills/memory-curation/SKILL.md +83 -0
  203. package/dist/gaia-ops/skills/memory-search/SKILL.md +88 -0
  204. package/dist/gaia-ops/skills/orchestrator-approval/SKILL.md +160 -0
  205. package/dist/gaia-ops/skills/orchestrator-approval/reference.md +174 -0
  206. package/dist/gaia-ops/skills/pending-approvals/SKILL.md +72 -0
  207. package/dist/gaia-ops/skills/pending-approvals/reference.md +214 -0
  208. package/dist/gaia-ops/skills/readme-writing/SKILL.md +71 -0
  209. package/dist/gaia-ops/skills/readme-writing/reference.md +188 -0
  210. package/dist/gaia-ops/skills/reference.md +135 -0
  211. package/dist/gaia-ops/skills/request-approval/SKILL.md +140 -0
  212. package/dist/gaia-ops/skills/request-approval/examples.md +140 -0
  213. package/dist/gaia-ops/skills/request-approval/reference.md +57 -0
  214. package/dist/gaia-ops/skills/schedule-task/SKILL.md +64 -0
  215. package/dist/gaia-ops/skills/schedule-task/reference.md +233 -0
  216. package/dist/gaia-ops/skills/security-tiers/SKILL.md +141 -0
  217. package/dist/gaia-ops/skills/security-tiers/destructive-commands-reference.md +623 -0
  218. package/dist/gaia-ops/skills/security-tiers/reference.md +39 -0
  219. package/dist/gaia-ops/skills/skill-creation/SKILL.md +92 -0
  220. package/dist/gaia-ops/skills/skill-creation/reference.md +29 -0
  221. package/dist/gaia-ops/skills/terraform-patterns/SKILL.md +89 -0
  222. package/dist/gaia-ops/skills/terraform-patterns/reference.md +93 -0
  223. package/dist/gaia-ops/tools/__init__.py +9 -0
  224. package/dist/gaia-ops/tools/agentic-loop/decide-status.py +210 -0
  225. package/dist/gaia-ops/tools/agentic-loop/parse-metric.py +106 -0
  226. package/dist/gaia-ops/tools/agentic-loop/record-iteration.py +221 -0
  227. package/dist/gaia-ops/tools/context/README.md +132 -0
  228. package/dist/gaia-ops/tools/context/__init__.py +42 -0
  229. package/dist/gaia-ops/tools/context/_paths.py +20 -0
  230. package/dist/gaia-ops/tools/context/context_provider.py +721 -0
  231. package/dist/gaia-ops/tools/context/context_section_reader.py +342 -0
  232. package/dist/gaia-ops/tools/context/deep_merge.py +159 -0
  233. package/dist/gaia-ops/tools/context/pending_updates.py +760 -0
  234. package/dist/gaia-ops/tools/context/surface_router.py +278 -0
  235. package/dist/gaia-ops/tools/fast-queries/README.md +65 -0
  236. package/dist/gaia-ops/tools/fast-queries/__init__.py +30 -0
  237. package/dist/gaia-ops/tools/fast-queries/appservices/quicktriage_devops_developer.sh +75 -0
  238. package/dist/gaia-ops/tools/fast-queries/cloud/aws/quicktriage_aws_troubleshooter.sh +32 -0
  239. package/dist/gaia-ops/tools/fast-queries/cloud/gcp/quicktriage_gcp_troubleshooter.sh +88 -0
  240. package/dist/gaia-ops/tools/fast-queries/gitops/quicktriage_gitops_operator.sh +48 -0
  241. package/dist/gaia-ops/tools/fast-queries/run_triage.sh +59 -0
  242. package/dist/gaia-ops/tools/fast-queries/terraform/quicktriage_terraform_architect.sh +80 -0
  243. package/dist/gaia-ops/tools/gaia_simulator/__init__.py +33 -0
  244. package/dist/gaia-ops/tools/gaia_simulator/cli.py +354 -0
  245. package/dist/gaia-ops/tools/gaia_simulator/extractor.py +457 -0
  246. package/dist/gaia-ops/tools/gaia_simulator/reporter.py +258 -0
  247. package/dist/gaia-ops/tools/gaia_simulator/routing_simulator.py +334 -0
  248. package/dist/gaia-ops/tools/gaia_simulator/runner.py +539 -0
  249. package/dist/gaia-ops/tools/gaia_simulator/skills_mapper.py +264 -0
  250. package/dist/gaia-ops/tools/memory/README.md +0 -0
  251. package/dist/gaia-ops/tools/memory/__init__.py +20 -0
  252. package/dist/gaia-ops/tools/memory/backfill_fts5.py +107 -0
  253. package/dist/gaia-ops/tools/memory/conflict_detector.py +295 -0
  254. package/dist/gaia-ops/tools/memory/episodic.py +1210 -0
  255. package/dist/gaia-ops/tools/memory/git_invalidator.py +262 -0
  256. package/dist/gaia-ops/tools/memory/paths.py +102 -0
  257. package/dist/gaia-ops/tools/memory/scoring.py +193 -0
  258. package/dist/gaia-ops/tools/memory/search_store.py +360 -0
  259. package/dist/gaia-ops/tools/persist_transcript_analysis.py +85 -0
  260. package/dist/gaia-ops/tools/review/__init__.py +1 -0
  261. package/dist/gaia-ops/tools/review/review_engine.py +157 -0
  262. package/dist/gaia-ops/tools/scan/__init__.py +35 -0
  263. package/dist/gaia-ops/tools/scan/config.py +247 -0
  264. package/dist/gaia-ops/tools/scan/merge.py +212 -0
  265. package/dist/gaia-ops/tools/scan/orchestrator.py +549 -0
  266. package/dist/gaia-ops/tools/scan/registry.py +127 -0
  267. package/dist/gaia-ops/tools/scan/scanners/__init__.py +18 -0
  268. package/dist/gaia-ops/tools/scan/scanners/base.py +137 -0
  269. package/dist/gaia-ops/tools/scan/scanners/environment.py +349 -0
  270. package/dist/gaia-ops/tools/scan/scanners/git.py +570 -0
  271. package/dist/gaia-ops/tools/scan/scanners/infrastructure.py +875 -0
  272. package/dist/gaia-ops/tools/scan/scanners/orchestration.py +600 -0
  273. package/dist/gaia-ops/tools/scan/scanners/stack.py +1085 -0
  274. package/dist/gaia-ops/tools/scan/scanners/tools.py +260 -0
  275. package/dist/gaia-ops/tools/scan/setup.py +686 -0
  276. package/dist/gaia-ops/tools/scan/tests/__init__.py +1 -0
  277. package/dist/gaia-ops/tools/scan/tests/conftest.py +796 -0
  278. package/dist/gaia-ops/tools/scan/tests/test_environment.py +323 -0
  279. package/dist/gaia-ops/tools/scan/tests/test_git.py +419 -0
  280. package/dist/gaia-ops/tools/scan/tests/test_infrastructure.py +382 -0
  281. package/dist/gaia-ops/tools/scan/tests/test_integration.py +920 -0
  282. package/dist/gaia-ops/tools/scan/tests/test_merge.py +269 -0
  283. package/dist/gaia-ops/tools/scan/tests/test_orchestration.py +304 -0
  284. package/dist/gaia-ops/tools/scan/tests/test_stack.py +604 -0
  285. package/dist/gaia-ops/tools/scan/tests/test_tools.py +349 -0
  286. package/dist/gaia-ops/tools/scan/ui.py +624 -0
  287. package/dist/gaia-ops/tools/scan/verify.py +270 -0
  288. package/dist/gaia-ops/tools/scan/walk.py +118 -0
  289. package/dist/gaia-ops/tools/scan/workspace.py +85 -0
  290. package/dist/gaia-ops/tools/validation/README.md +244 -0
  291. package/dist/gaia-ops/tools/validation/__init__.py +17 -0
  292. package/dist/gaia-ops/tools/validation/approval_gate.py +321 -0
  293. package/dist/gaia-ops/tools/validation/validate_skills.py +189 -0
  294. package/dist/gaia-security/.claude-plugin/plugin.json +24 -0
  295. package/dist/gaia-security/README.md +90 -0
  296. package/dist/gaia-security/config/universal-rules.json +102 -0
  297. package/dist/gaia-security/hooks/adapters/__init__.py +52 -0
  298. package/dist/gaia-security/hooks/adapters/base.py +219 -0
  299. package/dist/gaia-security/hooks/adapters/channel.py +17 -0
  300. package/dist/gaia-security/hooks/adapters/claude_code.py +1890 -0
  301. package/dist/gaia-security/hooks/adapters/types.py +194 -0
  302. package/dist/gaia-security/hooks/adapters/utils.py +25 -0
  303. package/dist/gaia-security/hooks/hooks.json +84 -0
  304. package/dist/gaia-security/hooks/modules/__init__.py +15 -0
  305. package/dist/gaia-security/hooks/modules/agents/__init__.py +29 -0
  306. package/dist/gaia-security/hooks/modules/agents/contract_validator.py +647 -0
  307. package/dist/gaia-security/hooks/modules/agents/response_contract.py +496 -0
  308. package/dist/gaia-security/hooks/modules/agents/skill_injection_verifier.py +120 -0
  309. package/dist/gaia-security/hooks/modules/agents/state_tracker.py +267 -0
  310. package/dist/gaia-security/hooks/modules/agents/task_info_builder.py +74 -0
  311. package/dist/gaia-security/hooks/modules/agents/transcript_analyzer.py +458 -0
  312. package/dist/gaia-security/hooks/modules/agents/transcript_reader.py +152 -0
  313. package/dist/gaia-security/hooks/modules/audit/__init__.py +28 -0
  314. package/dist/gaia-security/hooks/modules/audit/event_detector.py +168 -0
  315. package/dist/gaia-security/hooks/modules/audit/logger.py +131 -0
  316. package/dist/gaia-security/hooks/modules/audit/metrics.py +134 -0
  317. package/dist/gaia-security/hooks/modules/audit/workflow_auditor.py +611 -0
  318. package/dist/gaia-security/hooks/modules/audit/workflow_recorder.py +296 -0
  319. package/dist/gaia-security/hooks/modules/context/__init__.py +11 -0
  320. package/dist/gaia-security/hooks/modules/context/agentic_loop_detector.py +165 -0
  321. package/dist/gaia-security/hooks/modules/context/anchor_tracker.py +317 -0
  322. package/dist/gaia-security/hooks/modules/context/compact_context_builder.py +218 -0
  323. package/dist/gaia-security/hooks/modules/context/context_freshness.py +145 -0
  324. package/dist/gaia-security/hooks/modules/context/context_injector.py +558 -0
  325. package/dist/gaia-security/hooks/modules/context/context_writer.py +530 -0
  326. package/dist/gaia-security/hooks/modules/context/contracts_loader.py +161 -0
  327. package/dist/gaia-security/hooks/modules/core/__init__.py +40 -0
  328. package/dist/gaia-security/hooks/modules/core/hook_entry.py +78 -0
  329. package/dist/gaia-security/hooks/modules/core/paths.py +160 -0
  330. package/dist/gaia-security/hooks/modules/core/plugin_mode.py +149 -0
  331. package/dist/gaia-security/hooks/modules/core/plugin_setup.py +577 -0
  332. package/dist/gaia-security/hooks/modules/core/state.py +179 -0
  333. package/dist/gaia-security/hooks/modules/core/stdin.py +24 -0
  334. package/dist/gaia-security/hooks/modules/events/__init__.py +1 -0
  335. package/dist/gaia-security/hooks/modules/events/event_writer.py +210 -0
  336. package/dist/gaia-security/hooks/modules/memory/__init__.py +8 -0
  337. package/dist/gaia-security/hooks/modules/memory/episode_writer.py +216 -0
  338. package/dist/gaia-security/hooks/modules/orchestrator/__init__.py +1 -0
  339. package/dist/gaia-security/hooks/modules/orchestrator/delegate_mode.py +122 -0
  340. package/dist/gaia-security/hooks/modules/scanning/__init__.py +8 -0
  341. package/dist/gaia-security/hooks/modules/scanning/scan_trigger.py +84 -0
  342. package/dist/gaia-security/hooks/modules/security/__init__.py +120 -0
  343. package/dist/gaia-security/hooks/modules/security/approval_cleanup.py +87 -0
  344. package/dist/gaia-security/hooks/modules/security/approval_constants.py +23 -0
  345. package/dist/gaia-security/hooks/modules/security/approval_grants.py +1638 -0
  346. package/dist/gaia-security/hooks/modules/security/approval_messages.py +71 -0
  347. package/dist/gaia-security/hooks/modules/security/approval_scopes.py +222 -0
  348. package/dist/gaia-security/hooks/modules/security/blocked_commands.py +595 -0
  349. package/dist/gaia-security/hooks/modules/security/blocked_message_formatter.py +87 -0
  350. package/dist/gaia-security/hooks/modules/security/command_semantics.py +181 -0
  351. package/dist/gaia-security/hooks/modules/security/composition_rules.py +547 -0
  352. package/dist/gaia-security/hooks/modules/security/flag_classifiers.py +873 -0
  353. package/dist/gaia-security/hooks/modules/security/gitops_validator.py +179 -0
  354. package/dist/gaia-security/hooks/modules/security/mutative_verbs.py +1131 -0
  355. package/dist/gaia-security/hooks/modules/security/network_hosts.py +481 -0
  356. package/dist/gaia-security/hooks/modules/security/prompt_validator.py +40 -0
  357. package/dist/gaia-security/hooks/modules/security/shell_unwrapper.py +165 -0
  358. package/dist/gaia-security/hooks/modules/security/tiers.py +196 -0
  359. package/dist/gaia-security/hooks/modules/session/__init__.py +10 -0
  360. package/dist/gaia-security/hooks/modules/session/pending_scanner.py +174 -0
  361. package/dist/gaia-security/hooks/modules/session/session_context_writer.py +100 -0
  362. package/dist/gaia-security/hooks/modules/session/session_event_injector.py +160 -0
  363. package/dist/gaia-security/hooks/modules/session/session_manager.py +31 -0
  364. package/dist/gaia-security/hooks/modules/session/session_registry.py +232 -0
  365. package/dist/gaia-security/hooks/modules/tools/__init__.py +29 -0
  366. package/dist/gaia-security/hooks/modules/tools/bash_validator.py +1008 -0
  367. package/dist/gaia-security/hooks/modules/tools/cloud_pipe_validator.py +231 -0
  368. package/dist/gaia-security/hooks/modules/tools/hook_response.py +55 -0
  369. package/dist/gaia-security/hooks/modules/tools/shell_parser.py +227 -0
  370. package/dist/gaia-security/hooks/modules/tools/stage_decomposer.py +315 -0
  371. package/dist/gaia-security/hooks/modules/tools/task_validator.py +294 -0
  372. package/dist/gaia-security/hooks/modules/validation/__init__.py +23 -0
  373. package/dist/gaia-security/hooks/modules/validation/commit_validator.py +380 -0
  374. package/dist/gaia-security/hooks/post_tool_use.py +54 -0
  375. package/dist/gaia-security/hooks/pre_tool_use.py +413 -0
  376. package/dist/gaia-security/hooks/session_start.py +81 -0
  377. package/dist/gaia-security/hooks/stop_hook.py +82 -0
  378. package/dist/gaia-security/hooks/user_prompt_submit.py +246 -0
  379. package/dist/gaia-security/settings.json +58 -0
  380. package/git-hooks/commit-msg +41 -0
  381. package/hooks/README.md +100 -0
  382. package/hooks/adapters/__init__.py +52 -0
  383. package/hooks/adapters/base.py +219 -0
  384. package/hooks/adapters/channel.py +17 -0
  385. package/hooks/adapters/claude_code.py +1890 -0
  386. package/hooks/adapters/types.py +194 -0
  387. package/hooks/adapters/utils.py +25 -0
  388. package/hooks/elicitation_result.py +179 -0
  389. package/hooks/hooks.json +84 -0
  390. package/hooks/modules/README.md +189 -0
  391. package/hooks/modules/__init__.py +15 -0
  392. package/hooks/modules/agents/__init__.py +29 -0
  393. package/hooks/modules/agents/contract_validator.py +647 -0
  394. package/hooks/modules/agents/response_contract.py +496 -0
  395. package/hooks/modules/agents/skill_injection_verifier.py +120 -0
  396. package/hooks/modules/agents/state_tracker.py +267 -0
  397. package/hooks/modules/agents/task_info_builder.py +74 -0
  398. package/hooks/modules/agents/transcript_analyzer.py +458 -0
  399. package/hooks/modules/agents/transcript_reader.py +152 -0
  400. package/hooks/modules/audit/__init__.py +28 -0
  401. package/hooks/modules/audit/event_detector.py +168 -0
  402. package/hooks/modules/audit/logger.py +131 -0
  403. package/hooks/modules/audit/metrics.py +134 -0
  404. package/hooks/modules/audit/workflow_auditor.py +611 -0
  405. package/hooks/modules/audit/workflow_recorder.py +296 -0
  406. package/hooks/modules/context/__init__.py +11 -0
  407. package/hooks/modules/context/agentic_loop_detector.py +165 -0
  408. package/hooks/modules/context/anchor_tracker.py +317 -0
  409. package/hooks/modules/context/compact_context_builder.py +218 -0
  410. package/hooks/modules/context/context_freshness.py +145 -0
  411. package/hooks/modules/context/context_injector.py +558 -0
  412. package/hooks/modules/context/context_writer.py +530 -0
  413. package/hooks/modules/context/contracts_loader.py +161 -0
  414. package/hooks/modules/core/__init__.py +40 -0
  415. package/hooks/modules/core/hook_entry.py +78 -0
  416. package/hooks/modules/core/paths.py +160 -0
  417. package/hooks/modules/core/plugin_mode.py +149 -0
  418. package/hooks/modules/core/plugin_setup.py +577 -0
  419. package/hooks/modules/core/state.py +179 -0
  420. package/hooks/modules/core/stdin.py +24 -0
  421. package/hooks/modules/events/__init__.py +1 -0
  422. package/hooks/modules/events/event_writer.py +210 -0
  423. package/hooks/modules/evidence/__init__.py +34 -0
  424. package/hooks/modules/evidence/assertions.py +137 -0
  425. package/hooks/modules/evidence/index_writer.py +57 -0
  426. package/hooks/modules/evidence/loader.py +126 -0
  427. package/hooks/modules/evidence/runner.py +241 -0
  428. package/hooks/modules/memory/__init__.py +8 -0
  429. package/hooks/modules/memory/episode_writer.py +216 -0
  430. package/hooks/modules/orchestrator/__init__.py +1 -0
  431. package/hooks/modules/orchestrator/delegate_mode.py +122 -0
  432. package/hooks/modules/scanning/__init__.py +8 -0
  433. package/hooks/modules/scanning/scan_trigger.py +84 -0
  434. package/hooks/modules/security/__init__.py +120 -0
  435. package/hooks/modules/security/approval_cleanup.py +87 -0
  436. package/hooks/modules/security/approval_constants.py +23 -0
  437. package/hooks/modules/security/approval_grants.py +1638 -0
  438. package/hooks/modules/security/approval_messages.py +71 -0
  439. package/hooks/modules/security/approval_scopes.py +222 -0
  440. package/hooks/modules/security/blocked_commands.py +595 -0
  441. package/hooks/modules/security/blocked_message_formatter.py +87 -0
  442. package/hooks/modules/security/command_semantics.py +181 -0
  443. package/hooks/modules/security/composition_rules.py +547 -0
  444. package/hooks/modules/security/flag_classifiers.py +873 -0
  445. package/hooks/modules/security/gitops_validator.py +179 -0
  446. package/hooks/modules/security/mutative_verbs.py +1131 -0
  447. package/hooks/modules/security/network_hosts.py +481 -0
  448. package/hooks/modules/security/prompt_validator.py +40 -0
  449. package/hooks/modules/security/shell_unwrapper.py +165 -0
  450. package/hooks/modules/security/tiers.py +196 -0
  451. package/hooks/modules/session/__init__.py +10 -0
  452. package/hooks/modules/session/pending_scanner.py +174 -0
  453. package/hooks/modules/session/session_context_writer.py +100 -0
  454. package/hooks/modules/session/session_event_injector.py +160 -0
  455. package/hooks/modules/session/session_manager.py +31 -0
  456. package/hooks/modules/session/session_registry.py +232 -0
  457. package/hooks/modules/tools/__init__.py +29 -0
  458. package/hooks/modules/tools/bash_validator.py +1008 -0
  459. package/hooks/modules/tools/cloud_pipe_validator.py +231 -0
  460. package/hooks/modules/tools/hook_response.py +55 -0
  461. package/hooks/modules/tools/shell_parser.py +227 -0
  462. package/hooks/modules/tools/stage_decomposer.py +315 -0
  463. package/hooks/modules/tools/task_validator.py +294 -0
  464. package/hooks/modules/validation/__init__.py +23 -0
  465. package/hooks/modules/validation/commit_validator.py +380 -0
  466. package/hooks/post_compact.py +43 -0
  467. package/hooks/post_tool_use.py +54 -0
  468. package/hooks/pre_compact.py +60 -0
  469. package/hooks/pre_tool_use.py +413 -0
  470. package/hooks/session_start.py +81 -0
  471. package/hooks/stop_hook.py +82 -0
  472. package/hooks/subagent_start.py +71 -0
  473. package/hooks/subagent_stop.py +295 -0
  474. package/hooks/task_completed.py +70 -0
  475. package/hooks/user_prompt_submit.py +246 -0
  476. package/index.js +83 -0
  477. package/package.json +99 -0
  478. package/pyproject.toml +32 -0
  479. package/skills/README.md +154 -0
  480. package/skills/agent-protocol/SKILL.md +93 -0
  481. package/skills/agent-protocol/examples.md +223 -0
  482. package/skills/agent-response/SKILL.md +69 -0
  483. package/skills/agentic-loop/SKILL.md +80 -0
  484. package/skills/agentic-loop/reference.md +378 -0
  485. package/skills/blog-writing/SKILL.md +98 -0
  486. package/skills/blog-writing/reference.md +130 -0
  487. package/skills/brief-spec/SKILL.md +182 -0
  488. package/skills/command-execution/SKILL.md +64 -0
  489. package/skills/command-execution/reference.md +83 -0
  490. package/skills/context-updater/SKILL.md +87 -0
  491. package/skills/context-updater/examples.md +71 -0
  492. package/skills/developer-patterns/SKILL.md +50 -0
  493. package/skills/developer-patterns/reference.md +112 -0
  494. package/skills/execution/SKILL.md +99 -0
  495. package/skills/fast-queries/SKILL.md +43 -0
  496. package/skills/gaia-compact/SKILL.md +74 -0
  497. package/skills/gaia-patterns/SKILL.md +108 -0
  498. package/skills/gaia-patterns/reference.md +395 -0
  499. package/skills/gaia-planner/SKILL.md +37 -0
  500. package/skills/gaia-planner/reference.md +107 -0
  501. package/skills/gaia-release/SKILL.md +82 -0
  502. package/skills/gaia-release/reference.md +102 -0
  503. package/skills/gaia-self-check/SKILL.md +114 -0
  504. package/skills/gaia-self-check/reference.md +453 -0
  505. package/skills/gaia-verify/SKILL.md +77 -0
  506. package/skills/gaia-verify/reference.md +80 -0
  507. package/skills/git-conventions/SKILL.md +47 -0
  508. package/skills/gitops-patterns/SKILL.md +60 -0
  509. package/skills/gitops-patterns/reference.md +183 -0
  510. package/skills/gmail-policy/SKILL.md +200 -0
  511. package/skills/gmail-policy/reference.md +150 -0
  512. package/skills/gmail-triage/SKILL.md +100 -0
  513. package/skills/gws-setup/SKILL.md +99 -0
  514. package/skills/gws-setup/reference.md +73 -0
  515. package/skills/investigation/SKILL.md +100 -0
  516. package/skills/memory-curation/SKILL.md +83 -0
  517. package/skills/memory-search/SKILL.md +88 -0
  518. package/skills/orchestrator-approval/SKILL.md +160 -0
  519. package/skills/orchestrator-approval/reference.md +174 -0
  520. package/skills/pending-approvals/SKILL.md +72 -0
  521. package/skills/pending-approvals/reference.md +214 -0
  522. package/skills/readme-writing/SKILL.md +71 -0
  523. package/skills/readme-writing/reference.md +188 -0
  524. package/skills/reference.md +135 -0
  525. package/skills/request-approval/SKILL.md +140 -0
  526. package/skills/request-approval/examples.md +140 -0
  527. package/skills/request-approval/reference.md +57 -0
  528. package/skills/schedule-task/SKILL.md +64 -0
  529. package/skills/schedule-task/reference.md +233 -0
  530. package/skills/security-tiers/SKILL.md +141 -0
  531. package/skills/security-tiers/destructive-commands-reference.md +623 -0
  532. package/skills/security-tiers/reference.md +39 -0
  533. package/skills/skill-creation/SKILL.md +92 -0
  534. package/skills/skill-creation/reference.md +29 -0
  535. package/skills/terraform-patterns/SKILL.md +89 -0
  536. package/skills/terraform-patterns/reference.md +93 -0
  537. package/templates/README.md +69 -0
  538. package/templates/managed-settings.template.json +43 -0
  539. package/tools/__init__.py +9 -0
  540. package/tools/agentic-loop/decide-status.py +210 -0
  541. package/tools/agentic-loop/parse-metric.py +106 -0
  542. package/tools/agentic-loop/record-iteration.py +221 -0
  543. package/tools/context/README.md +132 -0
  544. package/tools/context/__init__.py +42 -0
  545. package/tools/context/_paths.py +20 -0
  546. package/tools/context/context_provider.py +721 -0
  547. package/tools/context/context_section_reader.py +342 -0
  548. package/tools/context/deep_merge.py +159 -0
  549. package/tools/context/pending_updates.py +760 -0
  550. package/tools/context/surface_router.py +278 -0
  551. package/tools/fast-queries/README.md +65 -0
  552. package/tools/fast-queries/__init__.py +30 -0
  553. package/tools/fast-queries/appservices/quicktriage_devops_developer.sh +75 -0
  554. package/tools/fast-queries/cloud/aws/quicktriage_aws_troubleshooter.sh +32 -0
  555. package/tools/fast-queries/cloud/gcp/quicktriage_gcp_troubleshooter.sh +88 -0
  556. package/tools/fast-queries/gitops/quicktriage_gitops_operator.sh +48 -0
  557. package/tools/fast-queries/run_triage.sh +59 -0
  558. package/tools/fast-queries/terraform/quicktriage_terraform_architect.sh +80 -0
  559. package/tools/gaia_simulator/__init__.py +33 -0
  560. package/tools/gaia_simulator/cli.py +354 -0
  561. package/tools/gaia_simulator/extractor.py +457 -0
  562. package/tools/gaia_simulator/reporter.py +258 -0
  563. package/tools/gaia_simulator/routing_simulator.py +334 -0
  564. package/tools/gaia_simulator/runner.py +539 -0
  565. package/tools/gaia_simulator/skills_mapper.py +264 -0
  566. package/tools/memory/README.md +0 -0
  567. package/tools/memory/__init__.py +20 -0
  568. package/tools/memory/backfill_fts5.py +107 -0
  569. package/tools/memory/conflict_detector.py +295 -0
  570. package/tools/memory/episodic.py +1210 -0
  571. package/tools/memory/git_invalidator.py +262 -0
  572. package/tools/memory/paths.py +102 -0
  573. package/tools/memory/scoring.py +193 -0
  574. package/tools/memory/search_store.py +360 -0
  575. package/tools/persist_transcript_analysis.py +85 -0
  576. package/tools/review/__init__.py +1 -0
  577. package/tools/review/review_engine.py +157 -0
  578. package/tools/scan/__init__.py +35 -0
  579. package/tools/scan/config.py +247 -0
  580. package/tools/scan/merge.py +212 -0
  581. package/tools/scan/orchestrator.py +549 -0
  582. package/tools/scan/registry.py +127 -0
  583. package/tools/scan/scanners/__init__.py +18 -0
  584. package/tools/scan/scanners/base.py +137 -0
  585. package/tools/scan/scanners/environment.py +349 -0
  586. package/tools/scan/scanners/git.py +570 -0
  587. package/tools/scan/scanners/infrastructure.py +875 -0
  588. package/tools/scan/scanners/orchestration.py +600 -0
  589. package/tools/scan/scanners/stack.py +1085 -0
  590. package/tools/scan/scanners/tools.py +260 -0
  591. package/tools/scan/setup.py +686 -0
  592. package/tools/scan/tests/__init__.py +1 -0
  593. package/tools/scan/tests/conftest.py +796 -0
  594. package/tools/scan/tests/test_environment.py +323 -0
  595. package/tools/scan/tests/test_git.py +419 -0
  596. package/tools/scan/tests/test_infrastructure.py +382 -0
  597. package/tools/scan/tests/test_integration.py +920 -0
  598. package/tools/scan/tests/test_merge.py +269 -0
  599. package/tools/scan/tests/test_orchestration.py +304 -0
  600. package/tools/scan/tests/test_stack.py +604 -0
  601. package/tools/scan/tests/test_tools.py +349 -0
  602. package/tools/scan/ui.py +624 -0
  603. package/tools/scan/verify.py +270 -0
  604. package/tools/scan/walk.py +118 -0
  605. package/tools/scan/workspace.py +85 -0
  606. package/tools/validation/README.md +244 -0
  607. package/tools/validation/__init__.py +17 -0
  608. package/tools/validation/approval_gate.py +321 -0
  609. package/tools/validation/validate_skills.py +189 -0
@@ -0,0 +1,539 @@
1
+ """
2
+ Hook executor for gaia-ops replay testing.
3
+
4
+ Runs hooks as subprocesses with ReplayEvent payloads and compares results
5
+ against expected outcomes. Completely decoupled from log parsing.
6
+ """
7
+
8
+ from __future__ import annotations
9
+
10
+ import json
11
+ import os
12
+ import re
13
+ import subprocess
14
+ import sys
15
+ import tempfile
16
+ from dataclasses import dataclass, field
17
+ from pathlib import Path
18
+ from typing import Any, Optional
19
+
20
+ from gaia_simulator.extractor import ReplayEvent
21
+
22
+
23
@dataclass(frozen=True)
class ReplayResult:
    """Immutable outcome of replaying one event through the current hooks.

    Bundles the replayed event with what the hook subprocess actually
    produced and with the verdict of comparing that against the event's
    recorded expectations.
    """

    # The event that was replayed.
    event: ReplayEvent
    # Exit status of the hook subprocess; -1 when the hook could not be run
    # to completion (missing script, timeout, OS error).
    actual_exit_code: int
    # Captured standard output of the hook subprocess.
    actual_stdout: str
    # Captured standard error, or a short failure description when the hook
    # did not run to completion.
    actual_stderr: str
    # Decision label derived for this run: "ALLOW", "BLOCK", "DENY",
    # "ERROR", or "PASS" for hooks that only report success/failure.
    actual_decision: str
    # Security tier attributed to this run; "" when none was found.
    actual_tier: str
    # True when no regression was classified for this run.
    matched: bool
    # None when matched; otherwise a label such as "allow_to_block",
    # "block_to_allow", "tier_change", "exit_code_change", "timeout".
    regression_type: Optional[str]
    # Hook-specific values extracted from the run for metadata comparison.
    actual_metadata: dict[str, Any] = field(default_factory=dict)
36
+
37
+
38
# Matches a security tier label, "T0" through "T3", as a whole word.
_RE_TIER = re.compile(r"\bT[0-3]\b")
39
+
40
+
41
def _parse_decision_from_output(
    exit_code: int, stdout: str
) -> tuple[str, str]:
    """Derive the hook decision from its exit code and JSON stdout.

    The exit code gives the baseline: 0 is "ALLOW", 2 is "BLOCK", anything
    else is "ERROR". Stdout is then scanned from the last line upwards for
    JSON object lines; the first one whose
    ``hookSpecificOutput.permissionDecision`` equals ``"deny"`` overrides
    the baseline with "DENY".

    Args:
        exit_code: Exit status of the hook subprocess.
        stdout: Captured standard output of the hook.

    Returns:
        (decision, tier) tuple. The tier is always "" here; callers that
        need a tier derive it from other artifacts.
    """
    if exit_code == 0:
        decision = "ALLOW"
    elif exit_code == 2:
        decision = "BLOCK"
    else:
        decision = "ERROR"

    # Hook output may have multiple lines; walk JSON lines bottom-up.
    for raw_line in reversed(stdout.strip().splitlines()):
        candidate = raw_line.strip()
        if not candidate.startswith("{"):
            continue
        try:
            data = json.loads(candidate)
        except json.JSONDecodeError:
            continue
        hook_output = data.get("hookSpecificOutput")
        # A null or otherwise non-object hookSpecificOutput carries no
        # decision; skip it instead of failing on a missing .get().
        if not isinstance(hook_output, dict):
            continue
        if hook_output.get("permissionDecision") == "deny":
            decision = "DENY"
            break

    return decision, ""
77
+
78
+
79
def _extract_tier_from_text(*texts: str) -> str:
    """Find the earliest security tier label across the given texts.

    Texts are examined in argument order and empty ones are ignored.

    Returns:
        The matched tier label, or "" when no text contains one.
    """
    hits = (_RE_TIER.search(chunk) for chunk in texts if chunk)
    return next((hit.group(0) for hit in hits if hit), "")
88
+
89
+
90
def _parse_last_json_line(stdout: str) -> Optional[dict[str, Any]]:
    """Decode the final parseable JSON object line found in *stdout*.

    Lines are visited bottom-up; a line qualifies when, after trimming
    surrounding whitespace, it begins with "{" and decodes as JSON.

    Returns:
        The decoded object, or None when no line qualifies.
    """
    trimmed_lines = [ln.strip() for ln in stdout.strip().splitlines()]
    for text in trimmed_lines[::-1]:
        if text.startswith("{"):
            try:
                return json.loads(text)
            except json.JSONDecodeError:
                pass
    return None
101
+
102
+
103
def _classify_regression(
    expected_decision: str,
    actual_decision: str,
    expected_exit_code: int,
    actual_exit_code: int,
    expected_tier: str,
    actual_tier: str,
    expected_metadata: Optional[dict[str, Any]] = None,
    actual_metadata: Optional[dict[str, Any]] = None,
    compare_tier: bool = True,
) -> Optional[str]:
    """Label how an actual hook outcome deviates from the expected one.

    Decision and exit code are compared first. When either differs, the
    label names the decision transition if it is one of the known pairs,
    otherwise "exit_code_change" or "decision_change". When both agree,
    the tier is compared (only if *compare_tier* is set and both tiers are
    non-empty), followed by every key of *expected_metadata*.

    Returns:
        None if no regression, or a string describing the regression type.
    """
    wanted_meta = expected_metadata or {}
    seen_meta = actual_metadata or {}

    exit_codes_differ = expected_exit_code != actual_exit_code
    if expected_decision != actual_decision or exit_codes_differ:
        known_transitions = {
            ("ALLOW", "BLOCK"): "allow_to_block",
            ("ALLOW", "DENY"): "allow_to_t3",
            ("BLOCK", "ALLOW"): "block_to_allow",
            ("DENY", "ALLOW"): "deny_to_allow",
        }
        label = known_transitions.get((expected_decision, actual_decision))
        if label is not None:
            return label
        return "exit_code_change" if exit_codes_differ else "decision_change"

    # Decision and exit code agree: look at the finer-grained signals.
    both_tiers_known = bool(expected_tier) and bool(actual_tier)
    if compare_tier and both_tiers_known and expected_tier != actual_tier:
        return "tier_change"

    for key, expected_value in wanted_meta.items():
        if key not in seen_meta:
            return f"{key}_missing"
        if seen_meta[key] != expected_value:
            return f"{key}_change"

    return None
144
+
145
+
146
class HookRunner:
    """Executes hooks as subprocesses for replay testing.

    Each hook script is run with the replayed event's payload on stdin and
    a simulated project root (holding a minimal ``.claude/`` tree) as its
    working directory. Scratch directories that the runner creates itself
    are removed once the run or batch that needed them has finished.
    """

    # Tools that the orchestrator is allowed to use directly.
    # Payloads for these tools should NOT get agent_id injected, because
    # they are orchestrator-level operations (dispatch, communication).
    _ORCHESTRATOR_TOOLS = frozenset({
        "agent", "task", "sendmessage", "skill",
        "taskcreate", "taskupdate", "tasklist", "taskget",
        "toolsearch", "websearch", "webfetch", "askuserquestion",
        "stop",  # stop_hook payloads are not subject to delegate mode
    })

    def __init__(
        self,
        hooks_dir: Path,
        project_root: Optional[Path] = None,
        *,
        timeout: float = 30,
    ):
        """Initialize the runner.

        Args:
            hooks_dir: Path to the directory containing hook .py files.
            project_root: Optional path to use as the simulated project root.
                If None, a temporary directory is created per run or batch.
            timeout: Seconds a single hook subprocess may run before the
                replay is recorded as a timeout.
        """
        self.hooks_dir = hooks_dir
        self.project_root = project_root
        self._timeout = timeout

    @staticmethod
    def _discard_scratch_dir(path: Path) -> None:
        """Best-effort removal of a scratch directory created by the runner."""
        # Function-scope import: the module's import block has no shutil.
        import shutil

        shutil.rmtree(path, ignore_errors=True)

    def _failure_result(
        self, event: ReplayEvent, stderr: str, regression_type: str
    ) -> ReplayResult:
        """Build the result recorded when a hook could not run to completion."""
        return ReplayResult(
            event=event,
            actual_exit_code=-1,
            actual_stdout="",
            actual_stderr=stderr,
            actual_decision="ERROR",
            actual_tier="",
            matched=False,
            regression_type=regression_type,
        )

    def _state_file_path(self, work_dir: Path) -> Path:
        """Return the hook state file path for a replay work directory."""
        return work_dir / ".claude" / ".hooks_state.json"

    def _load_hook_state(self, work_dir: Path) -> dict[str, Any]:
        """Load the hook state file, if present and well-formed.

        Returns:
            The decoded state object, or {} when the file is missing,
            unreadable, not valid JSON, or not a JSON object.
        """
        try:
            state = json.loads(
                self._state_file_path(work_dir).read_text(encoding="utf-8")
            )
        except (OSError, ValueError):
            # ValueError covers both JSONDecodeError and UnicodeDecodeError.
            return {}
        return state if isinstance(state, dict) else {}

    def _prime_post_tool_use_state(self, event: ReplayEvent, work_dir: Path) -> None:
        """Seed the pre-hook state so post_tool_use can replay faithfully.

        Writes a state file describing the event's tool call, with fixed
        timestamps and a result of "allowed", creating the ``.claude``
        directory first when it does not exist yet.
        """
        tool_input = event.stdin_payload.get("tool_input", {})
        command = ""
        if isinstance(tool_input, dict):
            command = str(tool_input.get("command", ""))

        state = {
            "tool_name": event.tool_name,
            "command": command,
            "tier": event.expected_tier or "unknown",
            "start_time": "2026-01-01T00:00:00",
            "start_time_epoch": 0.0,
            "session_id": event.stdin_payload.get("session_id", "replay"),
            "pre_hook_result": "allowed",
            "metadata": {},
        }
        state_path = self._state_file_path(work_dir)
        # run() may be handed a directory that was never set up.
        state_path.parent.mkdir(parents=True, exist_ok=True)
        state_path.write_text(json.dumps(state), encoding="utf-8")

    def _read_latest_audit_record(self, work_dir: Path) -> dict[str, Any]:
        """Read the most recent audit record emitted during replay, if any.

        Picks the lexicographically last ``audit-*.jsonl`` file under
        ``.claude/logs`` and returns its last line that decodes to a JSON
        object.

        Returns:
            The decoded record, or {} when no such file or line exists.
        """
        logs_dir = work_dir / ".claude" / "logs"
        audit_files = sorted(logs_dir.glob("audit-*.jsonl"))
        if not audit_files:
            return {}
        try:
            content = audit_files[-1].read_text(encoding="utf-8", errors="replace")
        except OSError:
            return {}
        for line in reversed(content.splitlines()):
            if not line.strip():
                continue
            try:
                record = json.loads(line)
            except json.JSONDecodeError:
                continue
            # Callers use .get() on the record, so only objects qualify.
            if isinstance(record, dict):
                return record
        return {}

    def _parse_pre_tool_use_result(
        self,
        exit_code: int,
        stdout: str,
        stderr: str,
        work_dir: Path,
    ) -> tuple[str, str, dict[str, Any]]:
        """Parse pre_tool_use results, including tier from hook state/log artifacts.

        The tier falls back, in order, to the hook state file and then to
        the first tier label found in the permission reason, stdout or
        stderr.

        Returns:
            (decision, tier, metadata) where metadata may hold
            "updated_input" and "permission_reason".
        """
        decision, tier = _parse_decision_from_output(exit_code, stdout)
        payload = _parse_last_json_line(stdout) or {}
        hook_output = payload.get("hookSpecificOutput") if isinstance(payload, dict) else None
        if not isinstance(hook_output, dict):
            # Missing, null or malformed hookSpecificOutput: treat as empty.
            hook_output = {}

        # NOTE(review): in a shared batch directory this file may have been
        # written for an earlier event if the current hook wrote none.
        state = self._load_hook_state(work_dir)
        if not tier:
            tier = str(state.get("tier", "") or "")
        if not tier:
            tier = _extract_tier_from_text(
                str(hook_output.get("permissionDecisionReason", "")),
                stdout,
                stderr,
            )

        actual_metadata: dict[str, Any] = {}
        if "updatedInput" in hook_output:
            actual_metadata["updated_input"] = hook_output["updatedInput"]
        if "permissionDecisionReason" in hook_output:
            actual_metadata["permission_reason"] = hook_output["permissionDecisionReason"]
        return decision, tier, actual_metadata

    def _parse_post_tool_use_result(
        self,
        exit_code: int,
        stdout: str,
        work_dir: Path,
    ) -> tuple[str, str, dict[str, Any]]:
        """Parse post_tool_use results using the latest audit record.

        Returns:
            (decision, tier, metadata): decision is "PASS" for exit code 0
            and "ERROR" otherwise; tier and metadata come from the audit
            record and are empty when there is none.
        """
        decision = "PASS" if exit_code == 0 else "ERROR"
        audit_record = self._read_latest_audit_record(work_dir)
        actual_tier = str(audit_record.get("tier", "") or "")
        actual_metadata: dict[str, Any] = {}
        if audit_record:
            actual_metadata["tool_exit_code"] = audit_record.get("exit_code")
            actual_metadata["duration_ms"] = audit_record.get("duration_ms")
        return decision, actual_tier, actual_metadata

    def _parse_stop_hook_result(
        self,
        exit_code: int,
        stdout: str,
    ) -> tuple[str, str, dict[str, Any]]:
        """Parse stop_hook results from its JSON stdout payload.

        Returns:
            (decision, "", metadata) where metadata holds whichever of
            "quality_sufficient", "score" and "recommendation" the payload
            contains.
        """
        decision = "PASS" if exit_code == 0 else "ERROR"
        payload = _parse_last_json_line(stdout) or {}
        actual_metadata: dict[str, Any] = {
            key: payload[key]
            for key in ("quality_sufficient", "score", "recommendation")
            if key in payload
        }
        return decision, "", actual_metadata

    def _parse_result(
        self,
        event: ReplayEvent,
        exit_code: int,
        stdout: str,
        stderr: str,
        work_dir: Path,
    ) -> tuple[str, str, dict[str, Any]]:
        """Dispatch hook-specific result parsing.

        Hooks without a dedicated parser are reported as "PASS" or "ERROR"
        from the exit code alone, with no tier and no metadata.
        """
        if event.hook_name == "pre_tool_use":
            return self._parse_pre_tool_use_result(exit_code, stdout, stderr, work_dir)
        if event.hook_name == "post_tool_use":
            return self._parse_post_tool_use_result(exit_code, stdout, work_dir)
        if event.hook_name == "stop_hook":
            return self._parse_stop_hook_result(exit_code, stdout)
        return ("PASS" if exit_code == 0 else "ERROR", "", {})

    def _setup_project_dir(self, base_dir: Path) -> Path:
        """Create a minimal .claude/ directory structure for hooks.

        Existing directories are kept; ``project-context.json`` and
        ``settings.json`` are (re)written on every call.

        Args:
            base_dir: Directory to set up as the project root.

        Returns:
            The base_dir path.
        """
        claude_dir = base_dir / ".claude"
        pc_dir = claude_dir / "project-context"

        # parents=True also creates .claude/, session/, project-context/
        # and workflow-episodic-memory/ along the way.
        for directory in (
            claude_dir / "logs",
            claude_dir / "session" / "active",
            pc_dir / "workflow-episodic-memory" / "signals",
            claude_dir / "config",
            claude_dir / "memory",
            claude_dir / "metrics",
        ):
            directory.mkdir(parents=True, exist_ok=True)

        # Minimal project-context.json
        minimal_context = {
            "metadata": {
                "version": "2.0",
                "last_updated": "2026-01-01T00:00:00Z",
                "scan_config": {
                    "last_scan": "2026-01-01T00:00:00Z",
                    "scanner_version": "0.1.0",
                    "staleness_hours": 24,
                },
            },
            "paths": {},
            "sections": {
                "project_identity": {
                    "name": "replay-test",
                    "type": "application",
                },
            },
        }
        (pc_dir / "project-context.json").write_text(
            json.dumps(minimal_context, indent=2), encoding="utf-8"
        )

        # Settings.json
        settings = {
            "permissions": {"allow": ["Bash(*)"], "deny": []},
        }
        (claude_dir / "settings.json").write_text(
            json.dumps(settings, indent=2), encoding="utf-8"
        )

        return base_dir

    def _prepare_payload(self, event: ReplayEvent) -> str:
        """Serialize the event payload for the hook subprocess.

        Injects ``agent_id`` into tool-call payloads that lack one, so
        delegate mode recognises them as subagent context instead of
        blocking them as orchestrator calls. Payloads for tools listed in
        ``_ORCHESTRATOR_TOOLS`` are left untouched since the orchestrator
        context is correct for those. The event's own payload is never
        mutated.

        Args:
            event: The ReplayEvent being replayed.

        Returns:
            JSON string to feed to the hook subprocess via stdin.
        """
        payload = event.stdin_payload
        tool_name = (payload.get("tool_name") or event.tool_name or "").lower()

        if not payload.get("agent_id") and tool_name not in self._ORCHESTRATOR_TOOLS:
            payload = {**payload, "agent_id": "replay-simulator"}

        return json.dumps(payload)

    def _resolve_hook_script(self, hook_name: str) -> Path:
        """Resolve hook name to script path.

        Args:
            hook_name: Hook name like "pre_tool_use" or "subagent_stop".

        Returns:
            Path to the hook script.
        """
        return self.hooks_dir / f"{hook_name}.py"

    def _run_in_dir(self, event: ReplayEvent, work_dir: Path) -> ReplayResult:
        """Replay one event with *work_dir* as the hook's working directory."""
        script_path = self._resolve_hook_script(event.hook_name)
        if not script_path.exists():
            return self._failure_result(
                event, f"Hook script not found: {script_path}", "missing_hook"
            )

        env = os.environ.copy()
        # NOTE(review): presumably dropped so hooks resolve their root from
        # the replay directory rather than an installed plugin - confirm.
        env.pop("CLAUDE_PLUGIN_ROOT", None)

        if event.hook_name == "post_tool_use":
            self._prime_post_tool_use_state(event, work_dir)

        try:
            completed = subprocess.run(
                [sys.executable, str(script_path)],
                input=self._prepare_payload(event),
                capture_output=True,
                text=True,
                env=env,
                timeout=self._timeout,
                cwd=str(work_dir),
            )
        except subprocess.TimeoutExpired:
            return self._failure_result(event, "Timeout", "timeout")
        except OSError as exc:
            return self._failure_result(event, str(exc), "os_error")

        actual_decision, actual_tier, actual_metadata = self._parse_result(
            event,
            completed.returncode,
            completed.stdout,
            completed.stderr,
            work_dir,
        )

        regression = _classify_regression(
            event.expected_decision,
            actual_decision,
            event.expected_exit_code,
            completed.returncode,
            event.expected_tier,
            actual_tier,
            expected_metadata=event.expected_metadata,
            actual_metadata=actual_metadata,
            compare_tier=event.compare_tier,
        )

        return ReplayResult(
            event=event,
            actual_exit_code=completed.returncode,
            actual_stdout=completed.stdout,
            actual_stderr=completed.stderr,
            actual_decision=actual_decision,
            actual_tier=actual_tier,
            matched=regression is None,
            regression_type=regression,
            actual_metadata=actual_metadata,
        )

    def run(self, event: ReplayEvent, project_dir: Optional[Path] = None) -> ReplayResult:
        """Run the hook with the event's stdin_payload and compare results.

        Args:
            event: The ReplayEvent to replay.
            project_dir: Optional project directory to use. If None, uses
                self.project_root or creates a temporary one, which is
                set up, used for this single run and then removed.

        Returns:
            ReplayResult with actual vs expected comparison.
        """
        work_dir = project_dir or self.project_root
        if work_dir is not None:
            return self._run_in_dir(event, work_dir)

        scratch = Path(tempfile.mkdtemp(prefix="replay_"))
        try:
            self._setup_project_dir(scratch)
            return self._run_in_dir(event, scratch)
        finally:
            # The path is not exposed to callers, so nothing can still
            # need it once the result has been built.
            self._discard_scratch_dir(scratch)

    def run_batch(
        self,
        events: list[ReplayEvent],
        progress_callback=None,
    ) -> list[ReplayResult]:
        """Run all events and return all results.

        Uses one project directory for the whole batch so that sequential
        hook calls share state: self.project_root when set, otherwise a
        temporary directory that is removed after the batch.

        Args:
            events: List of ReplayEvents to replay.
            progress_callback: Optional callable(current, total) for progress.

        Returns:
            List of ReplayResult instances in the same order as events.
        """
        results: list[ReplayResult] = []

        owns_work_dir = not self.project_root
        if owns_work_dir:
            work_dir = Path(tempfile.mkdtemp(prefix="replay_batch_"))
        else:
            work_dir = self.project_root

        try:
            self._setup_project_dir(work_dir)

            total = len(events)
            for position, event in enumerate(events, start=1):
                results.append(self.run(event, project_dir=work_dir))
                if progress_callback:
                    progress_callback(position, total)
        finally:
            if owns_work_dir:
                self._discard_scratch_dir(work_dir)

        return results