devflow-engine 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (393) hide show
  1. devflow_engine/__init__.py +3 -0
  2. devflow_engine/agentic_prompts.py +100 -0
  3. devflow_engine/agentic_runtime.py +398 -0
  4. devflow_engine/api_key_flow_harness.py +539 -0
  5. devflow_engine/api_keys.py +357 -0
  6. devflow_engine/bootstrap/__init__.py +2 -0
  7. devflow_engine/bootstrap/provision_from_template.py +84 -0
  8. devflow_engine/cli/__init__.py +0 -0
  9. devflow_engine/cli/app.py +7270 -0
  10. devflow_engine/core/__init__.py +0 -0
  11. devflow_engine/core/config.py +86 -0
  12. devflow_engine/core/logging.py +29 -0
  13. devflow_engine/core/paths.py +45 -0
  14. devflow_engine/core/toml_kv.py +33 -0
  15. devflow_engine/devflow_event_worker.py +1292 -0
  16. devflow_engine/devflow_state.py +201 -0
  17. devflow_engine/devin2/__init__.py +9 -0
  18. devflow_engine/devin2/agent_definition.py +120 -0
  19. devflow_engine/devin2/pi_runner.py +204 -0
  20. devflow_engine/devin_orchestration.py +69 -0
  21. devflow_engine/docs/prompts/anti-patterns.md +42 -0
  22. devflow_engine/docs/prompts/devin-agent-prompt.md +55 -0
  23. devflow_engine/docs/prompts/devin2-agent-prompt.md +81 -0
  24. devflow_engine/docs/prompts/examples/devin-vapi-clone-reference-exchange.json +85 -0
  25. devflow_engine/doctor/__init__.py +2 -0
  26. devflow_engine/doctor/triage.py +140 -0
  27. devflow_engine/error/__init__.py +0 -0
  28. devflow_engine/error/remediation.py +21 -0
  29. devflow_engine/errors/error_solver_dag.py +522 -0
  30. devflow_engine/errors/runtime_observability.py +67 -0
  31. devflow_engine/idea/__init__.py +4 -0
  32. devflow_engine/idea/actors.py +481 -0
  33. devflow_engine/idea/agentic.py +465 -0
  34. devflow_engine/idea/analyze.py +93 -0
  35. devflow_engine/idea/devin_chat_dag.py +1 -0
  36. devflow_engine/idea/diff.py +99 -0
  37. devflow_engine/idea/drafts.py +446 -0
  38. devflow_engine/idea/idea_creation_dag.py +643 -0
  39. devflow_engine/idea/ideation_enrichment.py +355 -0
  40. devflow_engine/idea/ideation_enrichment_worker.py +19 -0
  41. devflow_engine/idea/paths.py +28 -0
  42. devflow_engine/idea/promote.py +53 -0
  43. devflow_engine/idea/redaction.py +27 -0
  44. devflow_engine/idea/repo_tools.py +1277 -0
  45. devflow_engine/idea/response_mode.py +30 -0
  46. devflow_engine/idea/story_pipeline.py +1585 -0
  47. devflow_engine/idea/sufficiency.py +376 -0
  48. devflow_engine/idea/traditional_stories.py +1257 -0
  49. devflow_engine/implementation/__init__.py +0 -0
  50. devflow_engine/implementation/alembic_preflight.py +700 -0
  51. devflow_engine/implementation/dag.py +8450 -0
  52. devflow_engine/implementation/green_gate.py +93 -0
  53. devflow_engine/implementation/prompts.py +108 -0
  54. devflow_engine/implementation/test_runtime.py +623 -0
  55. devflow_engine/integration/__init__.py +19 -0
  56. devflow_engine/integration/agentic.py +66 -0
  57. devflow_engine/integration/dag.py +3539 -0
  58. devflow_engine/integration/prompts.py +114 -0
  59. devflow_engine/integration/supabase_schema.sql +31 -0
  60. devflow_engine/integration/supabase_sync.py +177 -0
  61. devflow_engine/llm/__init__.py +1 -0
  62. devflow_engine/llm/cli_one_shot.py +84 -0
  63. devflow_engine/llm/cli_stream.py +371 -0
  64. devflow_engine/llm/execution_context.py +26 -0
  65. devflow_engine/llm/invoke.py +1322 -0
  66. devflow_engine/llm/provider_api.py +304 -0
  67. devflow_engine/llm/repo_knowledge.py +588 -0
  68. devflow_engine/llm_primitives.py +315 -0
  69. devflow_engine/orchestration.py +62 -0
  70. devflow_engine/planning/__init__.py +0 -0
  71. devflow_engine/planning/analyze_repo.py +92 -0
  72. devflow_engine/planning/render_drafts.py +133 -0
  73. devflow_engine/playground/__init__.py +0 -0
  74. devflow_engine/playground/hooks.py +26 -0
  75. devflow_engine/playwright_workflow/__init__.py +5 -0
  76. devflow_engine/playwright_workflow/dag.py +1317 -0
  77. devflow_engine/process/__init__.py +5 -0
  78. devflow_engine/process/dag.py +59 -0
  79. devflow_engine/project_registration/__init__.py +3 -0
  80. devflow_engine/project_registration/dag.py +1581 -0
  81. devflow_engine/project_registry.py +109 -0
  82. devflow_engine/prompts/devin/generic/prompt.md +6 -0
  83. devflow_engine/prompts/devin/ideation/prompt.md +263 -0
  84. devflow_engine/prompts/devin/ideation/scenarios.md +5 -0
  85. devflow_engine/prompts/devin/ideation_loop/prompt.md +6 -0
  86. devflow_engine/prompts/devin/insight/prompt.md +11 -0
  87. devflow_engine/prompts/devin/insight/scenarios.md +5 -0
  88. devflow_engine/prompts/devin/intake/prompt.md +15 -0
  89. devflow_engine/prompts/devin/iterate/prompt.md +12 -0
  90. devflow_engine/prompts/devin/shared/eval_doctrine.md +9 -0
  91. devflow_engine/prompts/devin/shared/principles.md +246 -0
  92. devflow_engine/prompts/devin_eval/assessment/prompt.md +18 -0
  93. devflow_engine/prompts/idea/api_ideation_agent/prompt.md +8 -0
  94. devflow_engine/prompts/idea/api_insight_agent/prompt.md +8 -0
  95. devflow_engine/prompts/idea/response_doctrine/prompt.md +18 -0
  96. devflow_engine/prompts/implementation/dependency_assessment/prompt.md +12 -0
  97. devflow_engine/prompts/implementation/green/green/prompt.md +11 -0
  98. devflow_engine/prompts/implementation/green/node_config/prompt.md +3 -0
  99. devflow_engine/prompts/implementation/green_review/outcome_review/prompt.md +5 -0
  100. devflow_engine/prompts/implementation/green_review/prior_run_review/prompt.md +5 -0
  101. devflow_engine/prompts/implementation/red/prompt.md +27 -0
  102. devflow_engine/prompts/implementation/redreview/prompt.md +23 -0
  103. devflow_engine/prompts/implementation/redreview_repair/prompt.md +16 -0
  104. devflow_engine/prompts/implementation/setupdoc/prompt.md +10 -0
  105. devflow_engine/prompts/implementation/story_planning/prompt.md +13 -0
  106. devflow_engine/prompts/implementation/test_design/prompt.md +27 -0
  107. devflow_engine/prompts/integration/README.md +185 -0
  108. devflow_engine/prompts/integration/green/example.md +67 -0
  109. devflow_engine/prompts/integration/green/green/prompt.md +10 -0
  110. devflow_engine/prompts/integration/green/node_config/prompt.md +42 -0
  111. devflow_engine/prompts/integration/green/past_prompts/20260417T212300/green/prompt.md +15 -0
  112. devflow_engine/prompts/integration/green/past_prompts/20260417T212300/node_config/prompt.md +42 -0
  113. devflow_engine/prompts/integration/green_enrich/example.md +79 -0
  114. devflow_engine/prompts/integration/green_enrich/green_enrich/prompt.md +9 -0
  115. devflow_engine/prompts/integration/green_enrich/node_config/prompt.md +41 -0
  116. devflow_engine/prompts/integration/green_enrich/past_prompts/20260417T212300/green_enrich/prompt.md +14 -0
  117. devflow_engine/prompts/integration/green_enrich/past_prompts/20260417T212300/node_config/prompt.md +41 -0
  118. devflow_engine/prompts/integration/red/code_repair/prompt.md +12 -0
  119. devflow_engine/prompts/integration/red/example.md +152 -0
  120. devflow_engine/prompts/integration/red/node_config/prompt.md +86 -0
  121. devflow_engine/prompts/integration/red/past_prompts/20260417T212300/code_repair/prompt.md +19 -0
  122. devflow_engine/prompts/integration/red/past_prompts/20260417T212300/node_config/prompt.md +84 -0
  123. devflow_engine/prompts/integration/red/past_prompts/20260417T212300/red/prompt.md +16 -0
  124. devflow_engine/prompts/integration/red/past_prompts/20260417T212300/red_repair/prompt.md +15 -0
  125. devflow_engine/prompts/integration/red/past_prompts/20260417T215032/code_repair/prompt.md +10 -0
  126. devflow_engine/prompts/integration/red/past_prompts/20260417T215032/node_config/prompt.md +84 -0
  127. devflow_engine/prompts/integration/red/past_prompts/20260417T215032/red_repair/prompt.md +11 -0
  128. devflow_engine/prompts/integration/red/red/prompt.md +11 -0
  129. devflow_engine/prompts/integration/red/red_repair/prompt.md +12 -0
  130. devflow_engine/prompts/integration/red_review/example.md +71 -0
  131. devflow_engine/prompts/integration/red_review/node_config/prompt.md +41 -0
  132. devflow_engine/prompts/integration/red_review/past_prompts/20260417T212300/node_config/prompt.md +41 -0
  133. devflow_engine/prompts/integration/red_review/past_prompts/20260417T212300/red_review/prompt.md +15 -0
  134. devflow_engine/prompts/integration/red_review/red_review/prompt.md +9 -0
  135. devflow_engine/prompts/integration/resolve/example.md +111 -0
  136. devflow_engine/prompts/integration/resolve/node_config/prompt.md +64 -0
  137. devflow_engine/prompts/integration/resolve/past_prompts/20260417T212300/node_config/prompt.md +64 -0
  138. devflow_engine/prompts/integration/resolve/past_prompts/20260417T212300/resolve_implicated_users/prompt.md +15 -0
  139. devflow_engine/prompts/integration/resolve/past_prompts/20260417T212300/resolve_side_effects/prompt.md +15 -0
  140. devflow_engine/prompts/integration/resolve/resolve_implicated_users/prompt.md +10 -0
  141. devflow_engine/prompts/integration/resolve/resolve_side_effects/prompt.md +10 -0
  142. devflow_engine/prompts/integration/validate/build_idea_acceptance_coverage/prompt.md +12 -0
  143. devflow_engine/prompts/integration/validate/code_repair/prompt.md +13 -0
  144. devflow_engine/prompts/integration/validate/example.md +143 -0
  145. devflow_engine/prompts/integration/validate/node_config/prompt.md +87 -0
  146. devflow_engine/prompts/integration/validate/past_prompts/20260417T212300/code_repair/prompt.md +19 -0
  147. devflow_engine/prompts/integration/validate/past_prompts/20260417T212300/node_config/prompt.md +67 -0
  148. devflow_engine/prompts/integration/validate/past_prompts/20260417T212300/validate_enrich_gate/prompt.md +17 -0
  149. devflow_engine/prompts/integration/validate/past_prompts/20260417T212300/validate_repair/prompt.md +16 -0
  150. devflow_engine/prompts/integration/validate/past_prompts/20260417T215032/code_repair/prompt.md +10 -0
  151. devflow_engine/prompts/integration/validate/past_prompts/20260417T215032/node_config/prompt.md +67 -0
  152. devflow_engine/prompts/integration/validate/past_prompts/20260417T215032/validate_repair/prompt.md +9 -0
  153. devflow_engine/prompts/integration/validate/validate_enrich_gate/prompt.md +10 -0
  154. devflow_engine/prompts/integration/validate/validate_repair/prompt.md +20 -0
  155. devflow_engine/prompts/integration/write_workflows/example.md +100 -0
  156. devflow_engine/prompts/integration/write_workflows/node_config/prompt.md +44 -0
  157. devflow_engine/prompts/integration/write_workflows/past_prompts/20260417T212300/node_config/prompt.md +44 -0
  158. devflow_engine/prompts/integration/write_workflows/past_prompts/20260417T212300/write_workflows/prompt.md +17 -0
  159. devflow_engine/prompts/integration/write_workflows/write_workflows/prompt.md +11 -0
  160. devflow_engine/prompts/iterate/README.md +7 -0
  161. devflow_engine/prompts/iterate/coder/prompt.md +11 -0
  162. devflow_engine/prompts/iterate/framer/prompt.md +11 -0
  163. devflow_engine/prompts/iterate/iterator/prompt.md +13 -0
  164. devflow_engine/prompts/iterate/observer/prompt.md +11 -0
  165. devflow_engine/prompts/recovery/diagnosis/prompt.md +7 -0
  166. devflow_engine/prompts/recovery/execution/prompt.md +8 -0
  167. devflow_engine/prompts/recovery/execution_verification/prompt.md +7 -0
  168. devflow_engine/prompts/recovery/failure_investigation/prompt.md +10 -0
  169. devflow_engine/prompts/recovery/preflight_health_repo_repair/prompt.md +8 -0
  170. devflow_engine/prompts/recovery/remediation_execution/prompt.md +11 -0
  171. devflow_engine/prompts/recovery/root_cause_investigation/prompt.md +12 -0
  172. devflow_engine/prompts/scope_idea/doctrine/prompt.md +7 -0
  173. devflow_engine/prompts/source_doc_eval/document/prompt.md +6 -0
  174. devflow_engine/prompts/source_doc_eval/targeted_mutation/prompt.md +9 -0
  175. devflow_engine/prompts/source_doc_mutation/domain_entities/prompt.md +6 -0
  176. devflow_engine/prompts/source_doc_mutation/product_brief/prompt.md +6 -0
  177. devflow_engine/prompts/source_doc_mutation/project_doc_coherence/prompt.md +7 -0
  178. devflow_engine/prompts/source_doc_mutation/project_doc_render/prompt.md +9 -0
  179. devflow_engine/prompts/source_doc_mutation/source_doc_coherence/prompt.md +5 -0
  180. devflow_engine/prompts/source_doc_mutation/source_doc_enrichment_coherence/prompt.md +6 -0
  181. devflow_engine/prompts/source_doc_mutation/user_workflows/prompt.md +6 -0
  182. devflow_engine/prompts/source_scope/doctrine/prompt.md +10 -0
  183. devflow_engine/prompts/ui_grounding/doctrine/prompt.md +7 -0
  184. devflow_engine/recovery/__init__.py +3 -0
  185. devflow_engine/recovery/dag.py +2609 -0
  186. devflow_engine/recovery/models.py +220 -0
  187. devflow_engine/refactor.py +93 -0
  188. devflow_engine/registry/__init__.py +1 -0
  189. devflow_engine/registry/cards.py +238 -0
  190. devflow_engine/registry/domain_normalize.py +60 -0
  191. devflow_engine/registry/effects.py +65 -0
  192. devflow_engine/registry/enforce_report.py +150 -0
  193. devflow_engine/registry/module_cards_classify.py +164 -0
  194. devflow_engine/registry/module_cards_draft.py +184 -0
  195. devflow_engine/registry/module_cards_gate.py +59 -0
  196. devflow_engine/registry/packages.py +347 -0
  197. devflow_engine/registry/pathways.py +323 -0
  198. devflow_engine/review/__init__.py +11 -0
  199. devflow_engine/review/dag.py +588 -0
  200. devflow_engine/review/review_story.py +67 -0
  201. devflow_engine/scope_idea/__init__.py +3 -0
  202. devflow_engine/scope_idea/agentic.py +39 -0
  203. devflow_engine/scope_idea/dag.py +1069 -0
  204. devflow_engine/scope_idea/models.py +175 -0
  205. devflow_engine/skills/builtins/devflow/queue_failure_investigation/SKILL.md +112 -0
  206. devflow_engine/skills/builtins/devflow/queue_idea_to_story/SKILL.md +120 -0
  207. devflow_engine/skills/builtins/devflow/queue_integration/SKILL.md +105 -0
  208. devflow_engine/skills/builtins/devflow/queue_recovery/SKILL.md +108 -0
  209. devflow_engine/skills/builtins/devflow/queue_runtime_core/SKILL.md +155 -0
  210. devflow_engine/skills/builtins/devflow/queue_story_implementation/SKILL.md +122 -0
  211. devflow_engine/skills/builtins/devin/idea_to_story_handoff/SKILL.md +120 -0
  212. devflow_engine/skills/builtins/devin/ideation/SKILL.md +168 -0
  213. devflow_engine/skills/builtins/devin/ideation/state-and-phrasing-reference.md +18 -0
  214. devflow_engine/skills/builtins/devin/insight/SKILL.md +22 -0
  215. devflow_engine/skills/registry.example.yaml +42 -0
  216. devflow_engine/source_doc_assumptions.py +291 -0
  217. devflow_engine/source_doc_mutation_dag.py +1606 -0
  218. devflow_engine/source_doc_mutation_eval.py +417 -0
  219. devflow_engine/source_doc_mutation_worker.py +25 -0
  220. devflow_engine/source_docs_schema.py +207 -0
  221. devflow_engine/source_docs_updater.py +309 -0
  222. devflow_engine/source_scope/__init__.py +15 -0
  223. devflow_engine/source_scope/agentic.py +45 -0
  224. devflow_engine/source_scope/dag.py +1626 -0
  225. devflow_engine/source_scope/models.py +177 -0
  226. devflow_engine/stores/__init__.py +0 -0
  227. devflow_engine/stores/execution_store.py +3534 -0
  228. devflow_engine/story/__init__.py +0 -0
  229. devflow_engine/story/contracts.py +160 -0
  230. devflow_engine/story/discovery.py +47 -0
  231. devflow_engine/story/evidence.py +118 -0
  232. devflow_engine/story/hashing.py +27 -0
  233. devflow_engine/story/implemented_queue_purge.py +148 -0
  234. devflow_engine/story/indexer.py +105 -0
  235. devflow_engine/story/io.py +20 -0
  236. devflow_engine/story/markdown_contracts.py +298 -0
  237. devflow_engine/story/reconciliation.py +408 -0
  238. devflow_engine/story/validate_stories.py +149 -0
  239. devflow_engine/story/validate_tests_story.py +512 -0
  240. devflow_engine/story/validation.py +133 -0
  241. devflow_engine/ui_grounding/__init__.py +11 -0
  242. devflow_engine/ui_grounding/agentic.py +31 -0
  243. devflow_engine/ui_grounding/dag.py +874 -0
  244. devflow_engine/ui_grounding/models.py +224 -0
  245. devflow_engine/ui_grounding/pencil_bridge.py +247 -0
  246. devflow_engine/vendor/__init__.py +0 -0
  247. devflow_engine/vendor/datalumina_genai/__init__.py +11 -0
  248. devflow_engine/vendor/datalumina_genai/core/__init__.py +0 -0
  249. devflow_engine/vendor/datalumina_genai/core/exceptions.py +9 -0
  250. devflow_engine/vendor/datalumina_genai/core/nodes/__init__.py +0 -0
  251. devflow_engine/vendor/datalumina_genai/core/nodes/agent.py +48 -0
  252. devflow_engine/vendor/datalumina_genai/core/nodes/agent_streaming_node.py +26 -0
  253. devflow_engine/vendor/datalumina_genai/core/nodes/base.py +89 -0
  254. devflow_engine/vendor/datalumina_genai/core/nodes/concurrent.py +30 -0
  255. devflow_engine/vendor/datalumina_genai/core/nodes/router.py +69 -0
  256. devflow_engine/vendor/datalumina_genai/core/schema.py +72 -0
  257. devflow_engine/vendor/datalumina_genai/core/task.py +52 -0
  258. devflow_engine/vendor/datalumina_genai/core/validate.py +139 -0
  259. devflow_engine/vendor/datalumina_genai/core/workflow.py +200 -0
  260. devflow_engine/worker.py +1086 -0
  261. devflow_engine/worker_guard.py +233 -0
  262. devflow_engine-1.0.0.dist-info/METADATA +235 -0
  263. devflow_engine-1.0.0.dist-info/RECORD +393 -0
  264. devflow_engine-1.0.0.dist-info/WHEEL +4 -0
  265. devflow_engine-1.0.0.dist-info/entry_points.txt +3 -0
  266. devin/__init__.py +6 -0
  267. devin/dag.py +58 -0
  268. devin/dag_two_arm.py +138 -0
  269. devin/devin_chat_scenario_catalog.json +588 -0
  270. devin/devin_eval.py +677 -0
  271. devin/nodes/__init__.py +0 -0
  272. devin/nodes/ideation/__init__.py +0 -0
  273. devin/nodes/ideation/node.py +195 -0
  274. devin/nodes/ideation/playground.py +267 -0
  275. devin/nodes/ideation/prompt.md +65 -0
  276. devin/nodes/ideation/scenarios/continue_refinement.py +13 -0
  277. devin/nodes/ideation/scenarios/continue_refinement_evals.py +18 -0
  278. devin/nodes/ideation/scenarios/idea_fits_existing_patterns.py +17 -0
  279. devin/nodes/ideation/scenarios/idea_fits_existing_patterns_evals.py +16 -0
  280. devin/nodes/ideation/scenarios/large_idea_split.py +4 -0
  281. devin/nodes/ideation/scenarios/large_idea_split_evals.py +17 -0
  282. devin/nodes/ideation/scenarios/source_documentation_added.py +4 -0
  283. devin/nodes/ideation/scenarios/source_documentation_added_evals.py +16 -0
  284. devin/nodes/ideation/scenarios/user_says_create_it.py +30 -0
  285. devin/nodes/ideation/scenarios/user_says_create_it_evals.py +23 -0
  286. devin/nodes/ideation/scenarios/vague_idea.py +16 -0
  287. devin/nodes/ideation/scenarios/vague_idea_evals.py +47 -0
  288. devin/nodes/ideation/tools.json +312 -0
  289. devin/nodes/insight/__init__.py +0 -0
  290. devin/nodes/insight/node.py +49 -0
  291. devin/nodes/insight/playground.py +154 -0
  292. devin/nodes/insight/prompt.md +61 -0
  293. devin/nodes/insight/scenarios/architecture_pattern_query.py +15 -0
  294. devin/nodes/insight/scenarios/architecture_pattern_query_evals.py +25 -0
  295. devin/nodes/insight/scenarios/codebase_exploration.py +15 -0
  296. devin/nodes/insight/scenarios/codebase_exploration_evals.py +23 -0
  297. devin/nodes/insight/scenarios/devin_ideation_routing.py +19 -0
  298. devin/nodes/insight/scenarios/devin_ideation_routing_evals.py +39 -0
  299. devin/nodes/insight/scenarios/devin_insight_routing.py +20 -0
  300. devin/nodes/insight/scenarios/devin_insight_routing_evals.py +40 -0
  301. devin/nodes/insight/scenarios/operational_debugging.py +15 -0
  302. devin/nodes/insight/scenarios/operational_debugging_evals.py +23 -0
  303. devin/nodes/insight/scenarios/operational_question.py +9 -0
  304. devin/nodes/insight/scenarios/operational_question_evals.py +8 -0
  305. devin/nodes/insight/scenarios/queue_status.py +15 -0
  306. devin/nodes/insight/scenarios/queue_status_evals.py +23 -0
  307. devin/nodes/insight/scenarios/source_doc_explanation.py +14 -0
  308. devin/nodes/insight/scenarios/source_doc_explanation_evals.py +21 -0
  309. devin/nodes/insight/scenarios/worker_state_check.py +15 -0
  310. devin/nodes/insight/scenarios/worker_state_check_evals.py +22 -0
  311. devin/nodes/insight/tools.json +126 -0
  312. devin/nodes/intake/__init__.py +0 -0
  313. devin/nodes/intake/node.py +27 -0
  314. devin/nodes/intake/playground.py +47 -0
  315. devin/nodes/intake/prompt.md +12 -0
  316. devin/nodes/intake/scenarios/ideation_routing.py +4 -0
  317. devin/nodes/intake/scenarios/ideation_routing_evals.py +5 -0
  318. devin/nodes/intake/scenarios/insight_routing.py +4 -0
  319. devin/nodes/intake/scenarios/insight_routing_evals.py +5 -0
  320. devin/nodes/iterate/README.md +44 -0
  321. devin/nodes/iterate/__init__.py +1 -0
  322. devin/nodes/iterate/_archived_design_stages/01-objectives-requirements.md +112 -0
  323. devin/nodes/iterate/_archived_design_stages/02-evals.md +131 -0
  324. devin/nodes/iterate/_archived_design_stages/03-tools-and-boundaries.md +110 -0
  325. devin/nodes/iterate/_archived_design_stages/04-harness-and-playground.md +32 -0
  326. devin/nodes/iterate/_archived_design_stages/05-prompt-deferred.md +11 -0
  327. devin/nodes/iterate/_archived_design_stages/coder_agent_design/01-objectives-requirements.md +20 -0
  328. devin/nodes/iterate/_archived_design_stages/coder_agent_design/02-evals.md +8 -0
  329. devin/nodes/iterate/_archived_design_stages/coder_agent_design/03-tools-and-boundaries.md +14 -0
  330. devin/nodes/iterate/_archived_design_stages/coder_agent_design/04-harness-and-playground.md +12 -0
  331. devin/nodes/iterate/_archived_design_stages/framer_agent_design/01-objectives-requirements.md +20 -0
  332. devin/nodes/iterate/_archived_design_stages/framer_agent_design/02-evals.md +8 -0
  333. devin/nodes/iterate/_archived_design_stages/framer_agent_design/03-tools-and-boundaries.md +13 -0
  334. devin/nodes/iterate/_archived_design_stages/framer_agent_design/04-harness-and-playground.md +12 -0
  335. devin/nodes/iterate/_archived_design_stages/iterator_agent_design/01-objectives-requirements.md +25 -0
  336. devin/nodes/iterate/_archived_design_stages/iterator_agent_design/02-evals.md +9 -0
  337. devin/nodes/iterate/_archived_design_stages/iterator_agent_design/03-tools-and-boundaries.md +14 -0
  338. devin/nodes/iterate/_archived_design_stages/iterator_agent_design/04-harness-and-playground.md +12 -0
  339. devin/nodes/iterate/_archived_design_stages/observer_agent_design/01-objectives-requirements.md +20 -0
  340. devin/nodes/iterate/_archived_design_stages/observer_agent_design/02-evals.md +8 -0
  341. devin/nodes/iterate/_archived_design_stages/observer_agent_design/03-tools-and-boundaries.md +14 -0
  342. devin/nodes/iterate/_archived_design_stages/observer_agent_design/04-harness-and-playground.md +13 -0
  343. devin/nodes/iterate/agent-roles.md +89 -0
  344. devin/nodes/iterate/agents/README.md +10 -0
  345. devin/nodes/iterate/artifacts.md +504 -0
  346. devin/nodes/iterate/contract.md +100 -0
  347. devin/nodes/iterate/eval-plan.md +74 -0
  348. devin/nodes/iterate/node.py +100 -0
  349. devin/nodes/iterate/pipeline/README.md +13 -0
  350. devin/nodes/iterate/playground-contract.md +76 -0
  351. devin/nodes/iterate/prompt.md +11 -0
  352. devin/nodes/iterate/scenarios/README.md +38 -0
  353. devin/nodes/iterate/scenarios/artifact-and-loop-scenarios.md +101 -0
  354. devin/nodes/iterate/scenarios/coder_artifact_alignment.py +32 -0
  355. devin/nodes/iterate/scenarios/coder_artifact_alignment_evals.py +45 -0
  356. devin/nodes/iterate/scenarios/coder_bounded_fix.py +27 -0
  357. devin/nodes/iterate/scenarios/coder_bounded_fix_evals.py +45 -0
  358. devin/nodes/iterate/scenarios/devin_iterate_routing.py +21 -0
  359. devin/nodes/iterate/scenarios/devin_iterate_routing_evals.py +36 -0
  360. devin/nodes/iterate/scenarios/framer_scope_boundary.py +25 -0
  361. devin/nodes/iterate/scenarios/framer_scope_boundary_evals.py +57 -0
  362. devin/nodes/iterate/scenarios/framer_task_framing.py +25 -0
  363. devin/nodes/iterate/scenarios/framer_task_framing_evals.py +58 -0
  364. devin/nodes/iterate/scenarios/iterate_error_fix.py +21 -0
  365. devin/nodes/iterate/scenarios/iterate_error_fix_evals.py +39 -0
  366. devin/nodes/iterate/scenarios/iterate_quick_change.py +21 -0
  367. devin/nodes/iterate/scenarios/iterate_quick_change_evals.py +35 -0
  368. devin/nodes/iterate/scenarios/iterate_to_idea_promotion.py +23 -0
  369. devin/nodes/iterate/scenarios/iterate_to_idea_promotion_evals.py +53 -0
  370. devin/nodes/iterate/scenarios/iterate_to_insight_reroute.py +23 -0
  371. devin/nodes/iterate/scenarios/iterate_to_insight_reroute_evals.py +53 -0
  372. devin/nodes/iterate/scenarios/observer_evidence_seam.py +28 -0
  373. devin/nodes/iterate/scenarios/observer_evidence_seam_evals.py +55 -0
  374. devin/nodes/iterate/scenarios/observer_repro_creation.py +28 -0
  375. devin/nodes/iterate/scenarios/observer_repro_creation_evals.py +45 -0
  376. devin/nodes/iterate/scenarios/routing-matrix.md +45 -0
  377. devin/nodes/shared/__init__.py +0 -0
  378. devin/nodes/shared/filemaker_expert.md +80 -0
  379. devin/nodes/shared/filemaker_expert.py +354 -0
  380. devin/nodes/shared/filemaker_expert_eval/runner.py +176 -0
  381. devin/nodes/shared/filemaker_expert_eval/scenarios.json +65 -0
  382. devin/nodes/shared/goldilocks_advisor_eval/runner.py +214 -0
  383. devin/nodes/shared/goldilocks_advisor_eval/scenarios.json +58 -0
  384. devin/nodes/shared/helpers.py +156 -0
  385. devin/nodes/shared/idea_compliance_advisor_eval/runner.py +252 -0
  386. devin/nodes/shared/idea_compliance_advisor_eval/scenarios.json +75 -0
  387. devin/nodes/shared/models.py +44 -0
  388. devin/nodes/shared/post.py +40 -0
  389. devin/nodes/shared/router.py +107 -0
  390. devin/nodes/shared/tools.py +191 -0
  391. devin/shared/devin-chat-rubric.md +237 -0
  392. devin/shared/devin-chat-scenario-suite.md +90 -0
  393. devin/shared/eval_doctrine.md +9 -0
@@ -0,0 +1,539 @@
1
+ from __future__ import annotations
2
+
3
+ import base64
4
+ import json
5
+ import os
6
+ import threading
7
+ import uuid
8
+ from dataclasses import asdict, dataclass, field
9
+ from datetime import UTC, datetime, timedelta
10
+ from hashlib import sha256
11
+ from http.server import BaseHTTPRequestHandler, ThreadingHTTPServer
12
+ from typing import Any, Literal
13
+ from urllib.parse import parse_qs, urlparse
14
+
15
+ from cryptography.hazmat.primitives.ciphers.aead import AESGCM
16
+
17
+ from . import api_keys
18
+ from .devflow_event_worker import DevflowEventWorkerService
19
+ import devflow_engine.devflow_event_worker as worker_module
20
+
21
# Closed set of outcomes a smoke scenario can be configured with; "success" is
# the dataclass default, the remaining values name a failure seam.
FailureMode = Literal[
    "success",
    "caller_contract",
    "grant_resolution",
    "decrypt",
    "storage",
]

# Storage backend selector for a scenario: "mock" or "real".
StorageMode = Literal[
    "mock",
    "real",
]
23
+
24
+
25
+ @dataclass(frozen=True)
26
+ class ApiKeyTransportSmokeScenario:
27
+ provider: str = "openai"
28
+ api_key: str = "smoke-openai-key-12345678"
29
+ tier: str = "light"
30
+ storage_mode: StorageMode = "mock"
31
+ failure_mode: FailureMode = "success"
32
+ worker_id: str = "devflow-api-key-smoke"
33
+ project_id: str = field(default_factory=lambda: str(uuid.uuid4()))
34
+ event_id: str = field(default_factory=lambda: str(uuid.uuid4()))
35
+ grant_id: str = field(default_factory=lambda: str(uuid.uuid4()))
36
+ grant_token: str = "temporary-transport-secret"
37
+ occurred_at: str = field(default_factory=lambda: datetime.now(UTC).isoformat())
38
+
39
+
40
@dataclass(frozen=True)
class ApiKeyTransportSmokeResult:
    """Immutable record of what a smoke run produced.

    All fields are required and are supplied by whoever builds the result;
    this class only stores them and can render itself as a plain dict.
    """

    # Overall verdict, plus the failing seam name and a message when available.
    ok: bool
    failure_seam: str | None
    message: str | None
    # Dict form of the scenario that was run.
    scenario: dict[str, Any]
    dispatch_result: dict[str, Any] | None
    final_event: dict[str, Any] | None
    # Rows and request logs captured during the run.
    execution_runs: list[dict[str, Any]]
    execution_step_runs: list[dict[str, Any]]
    grant_requests: list[dict[str, Any]]
    supabase_requests: list[dict[str, Any]]
    # Snapshot of the storage backend state.
    storage: dict[str, Any]

    def to_dict(self) -> dict[str, Any]:
        """Return this result as a plain dict built by ``dataclasses.asdict``."""
        as_mapping = asdict(self)
        return as_mapping
56
+
57
+
58
class _MockStorageRecorder:
    """Records would-be credential writes instead of performing them.

    Each write is validated through ``api_keys`` and then logged as a small
    summary (provider, length, last four characters); the full key is never
    stored on the recorder.
    """

    def __init__(self) -> None:
        # Parallel logs: keychain writes, runtime writes, and the env var
        # names returned by the runtime writes (in call order).
        self.keychain_writes: list[dict[str, Any]] = []
        self.runtime_writes: list[dict[str, Any]] = []
        self.runtime_env_vars: list[str] = []

    def store_provider_api_key(self, provider: str, api_key: str) -> None:
        """Validate ``api_key`` for ``provider`` and log a keychain-write summary."""
        resolved = api_keys._resolve_provider_spec(provider)
        validated = api_keys.validate_provider_api_key(provider=resolved.provider, api_key=api_key)
        entry: dict[str, Any] = {
            "provider": resolved.provider,
            "length": len(validated),
            "last4": validated[-4:],
        }
        self.keychain_writes.append(entry)

    def set_runtime_provider_api_key(self, provider: str, api_key: str) -> str:
        """Validate ``api_key``, log a runtime-write summary, and return the env var name."""
        resolved = api_keys._resolve_provider_spec(provider)
        validated = api_keys.validate_provider_api_key(provider=resolved.provider, api_key=api_key)
        entry: dict[str, Any] = {
            "provider": resolved.provider,
            "env_var": resolved.env_var,
            "length": len(validated),
            "last4": validated[-4:],
        }
        self.runtime_writes.append(entry)
        env_var_name = resolved.env_var
        self.runtime_env_vars.append(env_var_name)
        return env_var_name

    def snapshot(self) -> dict[str, Any]:
        """Return the recorded writes as a dict holding shallow copies of each log."""
        captured: dict[str, Any] = {"mode": "mock"}
        captured["keychain_writes"] = [*self.keychain_writes]
        captured["runtime_writes"] = [*self.runtime_writes]
        captured["runtime_env_vars"] = [*self.runtime_env_vars]
        return captured
96
+
97
+
98
class _InMemorySupabase:
    """In-memory stand-in for the Supabase-style REST tables used by the harness.

    Requests are addressed as ``/rest/v1/<table>`` and support ``GET``
    (select), ``PATCH`` (update matching rows) and ``POST`` (insert one row).
    Filtering understands only ``eq.<value>`` and ``is.null``; any other
    filter expression is ignored, i.e. treated as matching. Every request is
    appended to ``self.requests`` for later inspection.
    """

    def __init__(self, *, scenario: ApiKeyTransportSmokeScenario, event_payload: dict[str, Any]) -> None:
        """Seed one project row and one queued ``devflow_API_KEY`` event.

        Args:
            scenario: Supplies ``project_id``, ``event_id`` and ``occurred_at``
                for the seeded rows.
            event_payload: Stored as the seeded event's ``payload``.
        """
        # Held for the whole of handle(), so concurrent requests are serialized.
        self._lock = threading.Lock()
        # Auto-increment counters for ids of inserted run / step-run rows.
        self.next_run_id = 1
        self.next_step_id = 1
        self.requests: list[dict[str, Any]] = []
        self.tables: dict[str, list[dict[str, Any]]] = {
            "devflow_projects": [
                {
                    "id": scenario.project_id,
                    "name": "API Key Smoke Project",
                    "environment": "development",
                    "metadata": {},
                    "devflow_repo_root": None,
                }
            ],
            "devflow_execution_events": [
                {
                    "id": scenario.event_id,
                    "project_id": scenario.project_id,
                    "event_type": "devflow_API_KEY",
                    "status": "queued",
                    "stage": None,
                    "error": None,
                    "run_id": None,
                    "producer": None,
                    "occurred_at": scenario.occurred_at,
                    "payload": event_payload,
                }
            ],
            "devflow_execution_runs": [],
            "devflow_execution_step_runs": [],
        }

    def handle(self, *, method: str, path: str, headers: dict[str, str], body: Any | None) -> tuple[int, Any]:
        """Record and serve one request.

        Args:
            method: HTTP verb; ``GET``, ``PATCH`` and ``POST`` are served.
            path: Request target including the query string.
            headers: Request headers; only ``Prefer`` is consulted.
            body: Decoded request body (fields for PATCH, the row for POST).

        Returns:
            ``(status, payload)``: 200 with rows for GET; 200 (PATCH) or
            201 (POST) with the affected rows when ``Prefer`` contains
            ``return=representation`` and ``[]`` otherwise; 404 for an
            unknown table; 405 for any other method.
        """
        parsed = urlparse(path)
        table = parsed.path.removeprefix("/rest/v1/")
        query = parse_qs(parsed.query, keep_blank_values=True)
        with self._lock:
            # Log first so that rejected requests (404/405) are recorded too.
            self.requests.append(
                {
                    "method": method,
                    "path": parsed.path,
                    "query": {key: list(values) for key, values in query.items()},
                    "body": body,
                }
            )
            if table not in self.tables:
                return 404, {"detail": f"Unknown table: {table}"}
            if method == "GET":
                return 200, self._select(table=table, query=query)
            if method == "PATCH":
                rows = self._patch(table=table, query=query, fields=body or {})
                prefer = str(headers.get("Prefer") or "")
                return 200, rows if "return=representation" in prefer else []
            if method == "POST":
                row = self._insert(table=table, payload=body or {})
                prefer = str(headers.get("Prefer") or "")
                return 201, [row] if "return=representation" in prefer else []
            return 405, {"detail": f"Unsupported method: {method}"}

    def _select(self, *, table: str, query: dict[str, list[str]]) -> list[dict[str, Any]]:
        """Return shallow copies of the matching rows, honouring ``order`` and ``limit``.

        ``order`` is ``<column>`` or ``<column>.<direction>``; only a direction
        of ``desc`` (case-insensitive) reverses the ascending sort. Rows whose
        value is ``None`` or missing sort after all other rows when ascending
        and therefore first when descending.
        """
        rows = [dict(row) for row in self.tables[table] if self._matches(row=row, query=query)]
        order = self._single_value(query, "order")
        if order:
            column, _, direction = order.partition(".")

            def sort_key(item: dict[str, Any]) -> tuple[bool, Any]:
                # None cannot be compared with str/int values; leading with the
                # is-None flag decides the order before the values themselves
                # would ever be compared against None.
                value = item.get(column)
                return (value is None, value)

            rows.sort(key=sort_key)
            if direction.lower() == "desc":
                rows.reverse()
        limit = self._single_value(query, "limit")
        if limit and limit.isdigit():
            rows = rows[: int(limit)]
        return rows

    def _patch(self, *, table: str, query: dict[str, list[str]], fields: dict[str, Any]) -> list[dict[str, Any]]:
        """Apply ``fields`` in place to every matching row; return copies of the updated rows."""
        rows: list[dict[str, Any]] = []
        for row in self.tables[table]:
            if not self._matches(row=row, query=query):
                continue
            row.update(fields)
            rows.append(dict(row))
        return rows

    def _insert(self, *, table: str, payload: dict[str, Any]) -> dict[str, Any]:
        """Append a copy of ``payload`` to ``table`` and return a copy of the stored row.

        Run and step-run rows get an auto-increment ``id`` when the payload has
        none; the matching counter advances on every insert either way.
        """
        row = dict(payload)
        if table == "devflow_execution_runs":
            row.setdefault("id", self.next_run_id)
            self.next_run_id += 1
        elif table == "devflow_execution_step_runs":
            row.setdefault("id", self.next_step_id)
            self.next_step_id += 1
        self.tables[table].append(row)
        return dict(row)

    def _matches(self, *, row: dict[str, Any], query: dict[str, list[str]]) -> bool:
        """Return True when ``row`` satisfies every supported filter in ``query``.

        ``select``, ``order`` and ``limit`` are not filters and are skipped.
        When a key is repeated only its last value is used. ``eq.<v>``
        compares ``<v>`` with ``str(row.get(key))``; ``is.null`` requires the
        value to be ``None`` (or the key to be absent). Any other expression
        is ignored.
        """
        for key, values in query.items():
            if key in {"select", "order", "limit"}:
                continue
            if not values:
                continue
            raw = values[-1]
            if raw.startswith("eq."):
                expected = raw[3:]
                if str(row.get(key)) != expected:
                    return False
                continue
            if raw == "is.null":
                if row.get(key) is not None:
                    return False
                continue
        return True

    @staticmethod
    def _single_value(query: dict[str, list[str]], key: str) -> str | None:
        """Return the last value given for ``key``, or ``None`` when it is absent or empty."""
        values = query.get(key)
        if not values:
            return None
        return values[-1]
216
+
217
+
218
+ class _SupabaseHandler(BaseHTTPRequestHandler):
219
+ server: "_HarnessHttpServer"
220
+
221
+ def do_GET(self) -> None: # noqa: N802
222
+ self._handle()
223
+
224
+ def do_PATCH(self) -> None: # noqa: N802
225
+ self._handle()
226
+
227
+ def do_POST(self) -> None: # noqa: N802
228
+ self._handle()
229
+
230
+ def _handle(self) -> None:
231
+ length = int(self.headers.get("Content-Length") or "0")
232
+ raw = self.rfile.read(length) if length else b""
233
+ body = json.loads(raw.decode("utf-8")) if raw else None
234
+ status, payload = self.server.dispatch(method=self.command, path=self.path, headers=dict(self.headers), body=body)
235
+ encoded = json.dumps(payload).encode("utf-8")
236
+ self.send_response(status)
237
+ self.send_header("Content-Type", "application/json")
238
+ self.send_header("Content-Length", str(len(encoded)))
239
+ self.end_headers()
240
+ self.wfile.write(encoded)
241
+
242
+ def log_message(self, format: str, *args: object) -> None:
243
+ return None
244
+
245
+
246
+ class _GrantResolutionServer:
247
+ def __init__(self, *, scenario: ApiKeyTransportSmokeScenario) -> None:
248
+ self.scenario = scenario
249
+ self.secret = "smoke-grant-secret"
250
+ self.requests: list[dict[str, Any]] = []
251
+ self.base_url: str = ""
252
+
253
+ def handle(self, *, method: str, path: str, headers: dict[str, str], body: Any | None) -> tuple[int, Any]:
254
+ parsed = urlparse(path)
255
+ request = {
256
+ "method": method,
257
+ "path": parsed.path,
258
+ "authorization": headers.get("Authorization"),
259
+ }
260
+ self.requests.append(request)
261
+
262
+ canonical_path = f"/api/devflow/settings/transport-grant/{self.scenario.grant_id}"
263
+ legacy_resolve_path = "/api/devflow/settings/transport-grant/resolve"
264
+
265
+ if self.scenario.failure_mode == "caller_contract":
266
+ if method == "POST" and parsed.path == legacy_resolve_path:
267
+ return 200, {"detail": "legacy endpoint available"}
268
+ request["response_status"] = 404
269
+ return 404, {"detail": "Not Found"}
270
+
271
+ if method != "GET" or parsed.path != canonical_path:
272
+ request["response_status"] = 404
273
+ return 404, {"detail": "Not Found"}
274
+
275
+ if self.scenario.failure_mode == "grant_resolution":
276
+ request["response_status"] = 404
277
+ return 404, {"detail": "DevFlow transport grant not found or expired"}
278
+
279
+ grant_token = self.scenario.grant_token
280
+ if self.scenario.failure_mode == "decrypt":
281
+ grant_token = "wrong-transport-secret"
282
+
283
+ payload = {
284
+ "grantId": self.scenario.grant_id,
285
+ "grantToken": grant_token,
286
+ "wrappedKey": "ciphertext",
287
+ "wrappingAlgorithm": "AES-GCM",
288
+ "wrappingKeyId": "kid-smoke-123",
289
+ "iv": "nonce-smoke",
290
+ "metadata": {
291
+ "algorithm": "AES-GCM",
292
+ "version": "devflow.api_key.v1",
293
+ },
294
+ "expiresAt": (datetime.now(UTC) + timedelta(minutes=5)).isoformat(),
295
+ }
296
+ request["response_status"] = 200
297
+ return 200, payload
298
+
299
+
300
+ class _GrantHandler(BaseHTTPRequestHandler):
301
+ server: "_HarnessHttpServer"
302
+
303
+ def do_GET(self) -> None: # noqa: N802
304
+ self._handle()
305
+
306
+ def do_POST(self) -> None: # noqa: N802
307
+ self._handle()
308
+
309
+ def _handle(self) -> None:
310
+ length = int(self.headers.get("Content-Length") or "0")
311
+ raw = self.rfile.read(length) if length else b""
312
+ body = json.loads(raw.decode("utf-8")) if raw else None
313
+ status, payload = self.server.dispatch(method=self.command, path=self.path, headers=dict(self.headers), body=body)
314
+ encoded = json.dumps(payload).encode("utf-8")
315
+ self.send_response(status)
316
+ self.send_header("Content-Type", "application/json")
317
+ self.send_header("Content-Length", str(len(encoded)))
318
+ self.end_headers()
319
+ self.wfile.write(encoded)
320
+
321
+ def log_message(self, format: str, *args: object) -> None:
322
+ return None
323
+
324
+
325
+ class _HarnessHttpServer(ThreadingHTTPServer):
326
+ def __init__(self, server_address: tuple[str, int], handler_class: type[BaseHTTPRequestHandler], dispatcher) -> None:
327
+ super().__init__(server_address, handler_class)
328
+ self._dispatcher = dispatcher
329
+
330
+ def dispatch(self, *, method: str, path: str, headers: dict[str, str], body: Any | None) -> tuple[int, Any]:
331
+ return self._dispatcher(method=method, path=path, headers=headers, body=body)
332
+
333
+
334
+ class _ServerThread:
335
+ def __init__(self, server: _HarnessHttpServer) -> None:
336
+ self.server = server
337
+ self.thread = threading.Thread(target=self.server.serve_forever, daemon=True)
338
+
339
+ def __enter__(self) -> "_ServerThread":
340
+ self.thread.start()
341
+ return self
342
+
343
+ def __exit__(self, exc_type, exc, tb) -> None:
344
+ self.server.shutdown()
345
+ self.server.server_close()
346
+ self.thread.join(timeout=5)
347
+
348
+
349
def _encrypt_transport_payload(*, grant_token: str, provider: str, credential: str, tier: str) -> dict[str, Any]:
    """Encrypt a single credential into a ``devflow.api_key.v1`` transport payload.

    The plaintext is a JSON document holding the submission time and the
    secret (tier, provider, credential). It is sealed with AES-GCM under
    the SHA-256 digest of ``grant_token``, with no associated data.

    Returns:
        A dict with the base64 ``ciphertext``, the base64 ``iv`` and a
        ``metadata`` block describing how the payload was produced.
    """
    envelope = {
        "submitted_at": datetime.now(UTC).isoformat(),
        "secret": {
            "tier": tier,
            "provider": provider,
            "credential": credential,
        },
    }
    plaintext = json.dumps(envelope).encode("utf-8")
    # NOTE(review): the nonce is a fixed constant, so it repeats for every
    # payload sealed under the same grant token - confirm this stays test-only.
    nonce = b"0123456789ab"
    derived_key = sha256(grant_token.encode("utf-8")).digest()
    sealed = AESGCM(derived_key).encrypt(nonce, plaintext, None)
    metadata = {
        "algorithm": "AES-GCM",
        "key_derivation": "SHA-256",
        "key_material": "transport-grant-token",
        "content_type": "application/json",
        "content_encoding": "utf-8",
        "version": "devflow.api_key.v1",
    }
    return {
        "ciphertext": base64.b64encode(sealed).decode("ascii"),
        "iv": base64.b64encode(nonce).decode("ascii"),
        "metadata": metadata,
    }
375
+
376
+
377
def _build_event_payload(scenario: ApiKeyTransportSmokeScenario) -> dict[str, Any]:
    """Assemble the event payload for ``scenario``.

    The payload has three parts: ``transport`` (format, grant id, an expiry
    five minutes from now, secret count, wrapping key id),
    ``secret_descriptor`` (tier, provider, last four characters and length
    of the API key) and ``transport_payload`` (the encrypted credential).
    """
    expires_at = (datetime.now(UTC) + timedelta(minutes=5)).isoformat()
    transport = {
        "format": "devflow.api_key.v1",
        "grant_id": scenario.grant_id,
        "expires_at": expires_at,
        "secret_count": 1,
        "wrapping_key_id": "kid-smoke-123",
    }
    api_key = scenario.api_key
    descriptor = {
        "tier": scenario.tier,
        "provider": scenario.provider,
        "last4": api_key[-4:],
        "length": len(api_key),
    }
    encrypted = _encrypt_transport_payload(
        grant_token=scenario.grant_token,
        provider=scenario.provider,
        credential=scenario.api_key,
        tier=scenario.tier,
    )
    return {
        "transport": transport,
        "secret_descriptor": descriptor,
        "transport_payload": encrypted,
    }
399
+
400
+
401
+ def _classify_failure(*, exc: Exception, scenario: ApiKeyTransportSmokeScenario, grant_requests: list[dict[str, Any]]) -> str:
402
+ message = str(exc)
403
+ if scenario.failure_mode == "caller_contract":
404
+ return "dfe_caller_contract"
405
+ if scenario.failure_mode == "grant_resolution":
406
+ return "clarity_grant_resolution"
407
+ if scenario.failure_mode == "decrypt":
408
+ return "decrypt_logic"
409
+ if scenario.failure_mode == "storage":
410
+ return "keychain_env_setting"
411
+ if "transport grant resolution request failed" in message:
412
+ last_status = None if not grant_requests else grant_requests[-1].get("response_status")
413
+ if last_status in {404, 405}:
414
+ return "dfe_caller_contract"
415
+ return "clarity_grant_resolution"
416
+ if "transport grant" in message or "unwrap material" in message:
417
+ return "clarity_grant_resolution"
418
+ if "decrypt" in message or "transport payload" in message:
419
+ return "decrypt_logic"
420
+ if "keychain" in message or "storage" in message:
421
+ return "keychain_env_setting"
422
+ return "worker_runtime"
423
+
424
+
425
+ def _restore_environ(previous: dict[str, str | None]) -> None:
426
+ for key, value in previous.items():
427
+ if value is None:
428
+ os.environ.pop(key, None)
429
+ else:
430
+ os.environ[key] = value
431
+
432
+
433
def run_api_key_transport_smoke(
    scenario: ApiKeyTransportSmokeScenario | None = None,
) -> ApiKeyTransportSmokeResult:
    """Dispatch one queued ``devflow_API_KEY`` event through the worker against local fakes.

    Two loopback HTTP servers are started (an in-memory REST store and the
    grant-resolution stub). The worker module is temporarily patched to
    point at them, and with ``storage_mode == "mock"`` its storage
    functions are replaced by a recorder. One event is dispatched, the
    outcome is checked, and every patch and environment variable is
    restored afterwards.

    Any exception raised along the way is caught, classified into a failure
    seam, and reported in the result instead of propagating.

    Args:
        scenario: Scenario to run; a default-constructed one is used when
            omitted.

    Returns:
        The smoke result, with ``ok`` true only when nothing raised.
    """
    scenario = scenario or ApiKeyTransportSmokeScenario()
    supabase = _InMemorySupabase(scenario=scenario, event_payload=_build_event_payload(scenario))
    grant_server = _GrantResolutionServer(scenario=scenario)
    storage = _MockStorageRecorder()

    # Port 0 is requested; the port actually bound is read back below.
    loopback = ("127.0.0.1", 0)
    supabase_http = _HarnessHttpServer(loopback, _SupabaseHandler, supabase.handle)
    grant_http = _HarnessHttpServer(loopback, _GrantHandler, grant_server.handle)
    grant_port = grant_http.server_address[1]
    supabase_port = supabase_http.server_address[1]
    grant_server.base_url = f"http://127.0.0.1:{grant_port}/api/devflow/settings/transport-grant"
    supabase_url = f"http://127.0.0.1:{supabase_port}"

    # Snapshot everything that is about to be overwritten.
    env_previous: dict[str, str | None] = {}
    for env_name in (
        "DEVFLOW_TRANSPORT_GRANT_RESOLUTION_URL",
        "DEVFLOW_TRANSPORT_GRANT_RESOLUTION_SECRET",
    ):
        env_previous[env_name] = os.environ.get(env_name)
    saved_attributes = {
        attribute: getattr(worker_module, attribute)
        for attribute in (
            "bootstrap_provider_api_keys",
            "_resolve_supabase_rest_config",
            "store_provider_api_key",
            "set_runtime_provider_api_key",
        )
    }

    dispatch_result: dict[str, Any] | None = None
    failure_seam: str | None = None
    message: str | None = None

    def _failing_store(provider, api_key):
        raise RuntimeError("Failed to write macOS keychain entry for provider smoke")

    try:
        os.environ["DEVFLOW_TRANSPORT_GRANT_RESOLUTION_URL"] = grant_server.base_url
        os.environ["DEVFLOW_TRANSPORT_GRANT_RESOLUTION_SECRET"] = grant_server.secret
        worker_module.bootstrap_provider_api_keys = lambda env=None: {}
        worker_module._resolve_supabase_rest_config = lambda: (supabase_url, "svc-key")

        if scenario.storage_mode == "mock":
            worker_module.store_provider_api_key = storage.store_provider_api_key
            worker_module.set_runtime_provider_api_key = storage.set_runtime_provider_api_key
        if scenario.failure_mode == "storage":
            # Overrides the recorder (if installed) so that storing always fails.
            worker_module.store_provider_api_key = _failing_store

        with _ServerThread(supabase_http), _ServerThread(grant_http):
            service = DevflowEventWorkerService(worker_id=scenario.worker_id)
            result = service.dispatch_next_event()
            if result is None:
                raise RuntimeError("No queued devflow_API_KEY event was dispatched")

            dispatch_result = {
                "event_id": result.event_id,
                "execution_run_id": result.execution_run_id,
                "workflow_key": result.workflow_key,
                "command": result.command,
                "result": result.result,
            }
            if result.workflow_key != "api_key":
                raise RuntimeError(f"Unexpected workflow_key: {result.workflow_key}")
            if result.result.get("provider") != scenario.provider:
                raise RuntimeError("Worker reported an unexpected provider")
            if not grant_server.requests:
                raise RuntimeError("Worker never requested transport grant resolution")
            last_request = grant_server.requests[-1]
            if last_request.get("method") != "GET":
                raise RuntimeError("Worker did not use GET for transport grant resolution")
            # Only the "Bearer " prefix is checked, not the credential itself.
            if not str(last_request.get("authorization") or "").startswith("Bearer "):
                raise RuntimeError("Worker omitted HMAC auth for transport grant resolution")
    except Exception as exc:
        failure_seam = _classify_failure(exc=exc, scenario=scenario, grant_requests=grant_server.requests)
        message = str(exc)
    finally:
        for attribute, original in saved_attributes.items():
            setattr(worker_module, attribute, original)
        _restore_environ(env_previous)

    final_event = next(
        (
            dict(row)
            for row in supabase.tables["devflow_execution_events"]
            if str(row.get("id")) == scenario.event_id
        ),
        None,
    )

    if scenario.storage_mode == "mock":
        storage_snapshot = storage.snapshot()
    else:
        storage_snapshot = {"mode": "real"}

    scenario_summary = {
        "provider": scenario.provider,
        "tier": scenario.tier,
        "storage_mode": scenario.storage_mode,
        "failure_mode": scenario.failure_mode,
        "project_id": scenario.project_id,
        "event_id": scenario.event_id,
        "grant_id": scenario.grant_id,
    }
    return ApiKeyTransportSmokeResult(
        ok=failure_seam is None,
        failure_seam=failure_seam,
        message=message,
        scenario=scenario_summary,
        dispatch_result=dispatch_result,
        final_event=final_event,
        execution_runs=[dict(row) for row in supabase.tables["devflow_execution_runs"]],
        execution_step_runs=[dict(row) for row in supabase.tables["devflow_execution_step_runs"]],
        grant_requests=list(grant_server.requests),
        supabase_requests=list(supabase.requests),
        storage=storage_snapshot,
    )