PyPI - devflow-engine - Versions diffs - 1.0.0__py3-none-any.whl - Mend

devflow-engine 1.0.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (393)

devflow_engine/__init__.py +3 -0
devflow_engine/agentic_prompts.py +100 -0
devflow_engine/agentic_runtime.py +398 -0
devflow_engine/api_key_flow_harness.py +539 -0
devflow_engine/api_keys.py +357 -0
devflow_engine/bootstrap/__init__.py +2 -0
devflow_engine/bootstrap/provision_from_template.py +84 -0
devflow_engine/cli/__init__.py +0 -0
devflow_engine/cli/app.py +7270 -0
devflow_engine/core/__init__.py +0 -0
devflow_engine/core/config.py +86 -0
devflow_engine/core/logging.py +29 -0
devflow_engine/core/paths.py +45 -0
devflow_engine/core/toml_kv.py +33 -0
devflow_engine/devflow_event_worker.py +1292 -0
devflow_engine/devflow_state.py +201 -0
devflow_engine/devin2/__init__.py +9 -0
devflow_engine/devin2/agent_definition.py +120 -0
devflow_engine/devin2/pi_runner.py +204 -0
devflow_engine/devin_orchestration.py +69 -0
devflow_engine/docs/prompts/anti-patterns.md +42 -0
devflow_engine/docs/prompts/devin-agent-prompt.md +55 -0
devflow_engine/docs/prompts/devin2-agent-prompt.md +81 -0
devflow_engine/docs/prompts/examples/devin-vapi-clone-reference-exchange.json +85 -0
devflow_engine/doctor/__init__.py +2 -0
devflow_engine/doctor/triage.py +140 -0
devflow_engine/error/__init__.py +0 -0
devflow_engine/error/remediation.py +21 -0
devflow_engine/errors/error_solver_dag.py +522 -0
devflow_engine/errors/runtime_observability.py +67 -0
devflow_engine/idea/__init__.py +4 -0
devflow_engine/idea/actors.py +481 -0
devflow_engine/idea/agentic.py +465 -0
devflow_engine/idea/analyze.py +93 -0
devflow_engine/idea/devin_chat_dag.py +1 -0
devflow_engine/idea/diff.py +99 -0
devflow_engine/idea/drafts.py +446 -0
devflow_engine/idea/idea_creation_dag.py +643 -0
devflow_engine/idea/ideation_enrichment.py +355 -0
devflow_engine/idea/ideation_enrichment_worker.py +19 -0
devflow_engine/idea/paths.py +28 -0
devflow_engine/idea/promote.py +53 -0
devflow_engine/idea/redaction.py +27 -0
devflow_engine/idea/repo_tools.py +1277 -0
devflow_engine/idea/response_mode.py +30 -0
devflow_engine/idea/story_pipeline.py +1585 -0
devflow_engine/idea/sufficiency.py +376 -0
devflow_engine/idea/traditional_stories.py +1257 -0
devflow_engine/implementation/__init__.py +0 -0
devflow_engine/implementation/alembic_preflight.py +700 -0
devflow_engine/implementation/dag.py +8450 -0
devflow_engine/implementation/green_gate.py +93 -0
devflow_engine/implementation/prompts.py +108 -0
devflow_engine/implementation/test_runtime.py +623 -0
devflow_engine/integration/__init__.py +19 -0
devflow_engine/integration/agentic.py +66 -0
devflow_engine/integration/dag.py +3539 -0
devflow_engine/integration/prompts.py +114 -0
devflow_engine/integration/supabase_schema.sql +31 -0
devflow_engine/integration/supabase_sync.py +177 -0
devflow_engine/llm/__init__.py +1 -0
devflow_engine/llm/cli_one_shot.py +84 -0
devflow_engine/llm/cli_stream.py +371 -0
devflow_engine/llm/execution_context.py +26 -0
devflow_engine/llm/invoke.py +1322 -0
devflow_engine/llm/provider_api.py +304 -0
devflow_engine/llm/repo_knowledge.py +588 -0
devflow_engine/llm_primitives.py +315 -0
devflow_engine/orchestration.py +62 -0
devflow_engine/planning/__init__.py +0 -0
devflow_engine/planning/analyze_repo.py +92 -0
devflow_engine/planning/render_drafts.py +133 -0
devflow_engine/playground/__init__.py +0 -0
devflow_engine/playground/hooks.py +26 -0
devflow_engine/playwright_workflow/__init__.py +5 -0
devflow_engine/playwright_workflow/dag.py +1317 -0
devflow_engine/process/__init__.py +5 -0
devflow_engine/process/dag.py +59 -0
devflow_engine/project_registration/__init__.py +3 -0
devflow_engine/project_registration/dag.py +1581 -0
devflow_engine/project_registry.py +109 -0
devflow_engine/prompts/devin/generic/prompt.md +6 -0
devflow_engine/prompts/devin/ideation/prompt.md +263 -0
devflow_engine/prompts/devin/ideation/scenarios.md +5 -0
devflow_engine/prompts/devin/ideation_loop/prompt.md +6 -0
devflow_engine/prompts/devin/insight/prompt.md +11 -0
devflow_engine/prompts/devin/insight/scenarios.md +5 -0
devflow_engine/prompts/devin/intake/prompt.md +15 -0
devflow_engine/prompts/devin/iterate/prompt.md +12 -0
devflow_engine/prompts/devin/shared/eval_doctrine.md +9 -0
devflow_engine/prompts/devin/shared/principles.md +246 -0
devflow_engine/prompts/devin_eval/assessment/prompt.md +18 -0
devflow_engine/prompts/idea/api_ideation_agent/prompt.md +8 -0
devflow_engine/prompts/idea/api_insight_agent/prompt.md +8 -0
devflow_engine/prompts/idea/response_doctrine/prompt.md +18 -0
devflow_engine/prompts/implementation/dependency_assessment/prompt.md +12 -0
devflow_engine/prompts/implementation/green/green/prompt.md +11 -0
devflow_engine/prompts/implementation/green/node_config/prompt.md +3 -0
devflow_engine/prompts/implementation/green_review/outcome_review/prompt.md +5 -0
devflow_engine/prompts/implementation/green_review/prior_run_review/prompt.md +5 -0
devflow_engine/prompts/implementation/red/prompt.md +27 -0
devflow_engine/prompts/implementation/redreview/prompt.md +23 -0
devflow_engine/prompts/implementation/redreview_repair/prompt.md +16 -0
devflow_engine/prompts/implementation/setupdoc/prompt.md +10 -0
devflow_engine/prompts/implementation/story_planning/prompt.md +13 -0
devflow_engine/prompts/implementation/test_design/prompt.md +27 -0
devflow_engine/prompts/integration/README.md +185 -0
devflow_engine/prompts/integration/green/example.md +67 -0
devflow_engine/prompts/integration/green/green/prompt.md +10 -0
devflow_engine/prompts/integration/green/node_config/prompt.md +42 -0
devflow_engine/prompts/integration/green/past_prompts/20260417T212300/green/prompt.md +15 -0
devflow_engine/prompts/integration/green/past_prompts/20260417T212300/node_config/prompt.md +42 -0
devflow_engine/prompts/integration/green_enrich/example.md +79 -0
devflow_engine/prompts/integration/green_enrich/green_enrich/prompt.md +9 -0
devflow_engine/prompts/integration/green_enrich/node_config/prompt.md +41 -0
devflow_engine/prompts/integration/green_enrich/past_prompts/20260417T212300/green_enrich/prompt.md +14 -0
devflow_engine/prompts/integration/green_enrich/past_prompts/20260417T212300/node_config/prompt.md +41 -0
devflow_engine/prompts/integration/red/code_repair/prompt.md +12 -0
devflow_engine/prompts/integration/red/example.md +152 -0
devflow_engine/prompts/integration/red/node_config/prompt.md +86 -0
devflow_engine/prompts/integration/red/past_prompts/20260417T212300/code_repair/prompt.md +19 -0
devflow_engine/prompts/integration/red/past_prompts/20260417T212300/node_config/prompt.md +84 -0
devflow_engine/prompts/integration/red/past_prompts/20260417T212300/red/prompt.md +16 -0
devflow_engine/prompts/integration/red/past_prompts/20260417T212300/red_repair/prompt.md +15 -0
devflow_engine/prompts/integration/red/past_prompts/20260417T215032/code_repair/prompt.md +10 -0
devflow_engine/prompts/integration/red/past_prompts/20260417T215032/node_config/prompt.md +84 -0
devflow_engine/prompts/integration/red/past_prompts/20260417T215032/red_repair/prompt.md +11 -0
devflow_engine/prompts/integration/red/red/prompt.md +11 -0
devflow_engine/prompts/integration/red/red_repair/prompt.md +12 -0
devflow_engine/prompts/integration/red_review/example.md +71 -0
devflow_engine/prompts/integration/red_review/node_config/prompt.md +41 -0
devflow_engine/prompts/integration/red_review/past_prompts/20260417T212300/node_config/prompt.md +41 -0
devflow_engine/prompts/integration/red_review/past_prompts/20260417T212300/red_review/prompt.md +15 -0
devflow_engine/prompts/integration/red_review/red_review/prompt.md +9 -0
devflow_engine/prompts/integration/resolve/example.md +111 -0
devflow_engine/prompts/integration/resolve/node_config/prompt.md +64 -0
devflow_engine/prompts/integration/resolve/past_prompts/20260417T212300/node_config/prompt.md +64 -0
devflow_engine/prompts/integration/resolve/past_prompts/20260417T212300/resolve_implicated_users/prompt.md +15 -0
devflow_engine/prompts/integration/resolve/past_prompts/20260417T212300/resolve_side_effects/prompt.md +15 -0
devflow_engine/prompts/integration/resolve/resolve_implicated_users/prompt.md +10 -0
devflow_engine/prompts/integration/resolve/resolve_side_effects/prompt.md +10 -0
devflow_engine/prompts/integration/validate/build_idea_acceptance_coverage/prompt.md +12 -0
devflow_engine/prompts/integration/validate/code_repair/prompt.md +13 -0
devflow_engine/prompts/integration/validate/example.md +143 -0
devflow_engine/prompts/integration/validate/node_config/prompt.md +87 -0
devflow_engine/prompts/integration/validate/past_prompts/20260417T212300/code_repair/prompt.md +19 -0
devflow_engine/prompts/integration/validate/past_prompts/20260417T212300/node_config/prompt.md +67 -0
devflow_engine/prompts/integration/validate/past_prompts/20260417T212300/validate_enrich_gate/prompt.md +17 -0
devflow_engine/prompts/integration/validate/past_prompts/20260417T212300/validate_repair/prompt.md +16 -0
devflow_engine/prompts/integration/validate/past_prompts/20260417T215032/code_repair/prompt.md +10 -0
devflow_engine/prompts/integration/validate/past_prompts/20260417T215032/node_config/prompt.md +67 -0
devflow_engine/prompts/integration/validate/past_prompts/20260417T215032/validate_repair/prompt.md +9 -0
devflow_engine/prompts/integration/validate/validate_enrich_gate/prompt.md +10 -0
devflow_engine/prompts/integration/validate/validate_repair/prompt.md +20 -0
devflow_engine/prompts/integration/write_workflows/example.md +100 -0
devflow_engine/prompts/integration/write_workflows/node_config/prompt.md +44 -0
devflow_engine/prompts/integration/write_workflows/past_prompts/20260417T212300/node_config/prompt.md +44 -0
devflow_engine/prompts/integration/write_workflows/past_prompts/20260417T212300/write_workflows/prompt.md +17 -0
devflow_engine/prompts/integration/write_workflows/write_workflows/prompt.md +11 -0
devflow_engine/prompts/iterate/README.md +7 -0
devflow_engine/prompts/iterate/coder/prompt.md +11 -0
devflow_engine/prompts/iterate/framer/prompt.md +11 -0
devflow_engine/prompts/iterate/iterator/prompt.md +13 -0
devflow_engine/prompts/iterate/observer/prompt.md +11 -0
devflow_engine/prompts/recovery/diagnosis/prompt.md +7 -0
devflow_engine/prompts/recovery/execution/prompt.md +8 -0
devflow_engine/prompts/recovery/execution_verification/prompt.md +7 -0
devflow_engine/prompts/recovery/failure_investigation/prompt.md +10 -0
devflow_engine/prompts/recovery/preflight_health_repo_repair/prompt.md +8 -0
devflow_engine/prompts/recovery/remediation_execution/prompt.md +11 -0
devflow_engine/prompts/recovery/root_cause_investigation/prompt.md +12 -0
devflow_engine/prompts/scope_idea/doctrine/prompt.md +7 -0
devflow_engine/prompts/source_doc_eval/document/prompt.md +6 -0
devflow_engine/prompts/source_doc_eval/targeted_mutation/prompt.md +9 -0
devflow_engine/prompts/source_doc_mutation/domain_entities/prompt.md +6 -0
devflow_engine/prompts/source_doc_mutation/product_brief/prompt.md +6 -0
devflow_engine/prompts/source_doc_mutation/project_doc_coherence/prompt.md +7 -0
devflow_engine/prompts/source_doc_mutation/project_doc_render/prompt.md +9 -0
devflow_engine/prompts/source_doc_mutation/source_doc_coherence/prompt.md +5 -0
devflow_engine/prompts/source_doc_mutation/source_doc_enrichment_coherence/prompt.md +6 -0
devflow_engine/prompts/source_doc_mutation/user_workflows/prompt.md +6 -0
devflow_engine/prompts/source_scope/doctrine/prompt.md +10 -0
devflow_engine/prompts/ui_grounding/doctrine/prompt.md +7 -0
devflow_engine/recovery/__init__.py +3 -0
devflow_engine/recovery/dag.py +2609 -0
devflow_engine/recovery/models.py +220 -0
devflow_engine/refactor.py +93 -0
devflow_engine/registry/__init__.py +1 -0
devflow_engine/registry/cards.py +238 -0
devflow_engine/registry/domain_normalize.py +60 -0
devflow_engine/registry/effects.py +65 -0
devflow_engine/registry/enforce_report.py +150 -0
devflow_engine/registry/module_cards_classify.py +164 -0
devflow_engine/registry/module_cards_draft.py +184 -0
devflow_engine/registry/module_cards_gate.py +59 -0
devflow_engine/registry/packages.py +347 -0
devflow_engine/registry/pathways.py +323 -0
devflow_engine/review/__init__.py +11 -0
devflow_engine/review/dag.py +588 -0
devflow_engine/review/review_story.py +67 -0
devflow_engine/scope_idea/__init__.py +3 -0
devflow_engine/scope_idea/agentic.py +39 -0
devflow_engine/scope_idea/dag.py +1069 -0
devflow_engine/scope_idea/models.py +175 -0
devflow_engine/skills/builtins/devflow/queue_failure_investigation/SKILL.md +112 -0
devflow_engine/skills/builtins/devflow/queue_idea_to_story/SKILL.md +120 -0
devflow_engine/skills/builtins/devflow/queue_integration/SKILL.md +105 -0
devflow_engine/skills/builtins/devflow/queue_recovery/SKILL.md +108 -0
devflow_engine/skills/builtins/devflow/queue_runtime_core/SKILL.md +155 -0
devflow_engine/skills/builtins/devflow/queue_story_implementation/SKILL.md +122 -0
devflow_engine/skills/builtins/devin/idea_to_story_handoff/SKILL.md +120 -0
devflow_engine/skills/builtins/devin/ideation/SKILL.md +168 -0
devflow_engine/skills/builtins/devin/ideation/state-and-phrasing-reference.md +18 -0
devflow_engine/skills/builtins/devin/insight/SKILL.md +22 -0
devflow_engine/skills/registry.example.yaml +42 -0
devflow_engine/source_doc_assumptions.py +291 -0
devflow_engine/source_doc_mutation_dag.py +1606 -0
devflow_engine/source_doc_mutation_eval.py +417 -0
devflow_engine/source_doc_mutation_worker.py +25 -0
devflow_engine/source_docs_schema.py +207 -0
devflow_engine/source_docs_updater.py +309 -0
devflow_engine/source_scope/__init__.py +15 -0
devflow_engine/source_scope/agentic.py +45 -0
devflow_engine/source_scope/dag.py +1626 -0
devflow_engine/source_scope/models.py +177 -0
devflow_engine/stores/__init__.py +0 -0
devflow_engine/stores/execution_store.py +3534 -0
devflow_engine/story/__init__.py +0 -0
devflow_engine/story/contracts.py +160 -0
devflow_engine/story/discovery.py +47 -0
devflow_engine/story/evidence.py +118 -0
devflow_engine/story/hashing.py +27 -0
devflow_engine/story/implemented_queue_purge.py +148 -0
devflow_engine/story/indexer.py +105 -0
devflow_engine/story/io.py +20 -0
devflow_engine/story/markdown_contracts.py +298 -0
devflow_engine/story/reconciliation.py +408 -0
devflow_engine/story/validate_stories.py +149 -0
devflow_engine/story/validate_tests_story.py +512 -0
devflow_engine/story/validation.py +133 -0
devflow_engine/ui_grounding/__init__.py +11 -0
devflow_engine/ui_grounding/agentic.py +31 -0
devflow_engine/ui_grounding/dag.py +874 -0
devflow_engine/ui_grounding/models.py +224 -0
devflow_engine/ui_grounding/pencil_bridge.py +247 -0
devflow_engine/vendor/__init__.py +0 -0
devflow_engine/vendor/datalumina_genai/__init__.py +11 -0
devflow_engine/vendor/datalumina_genai/core/__init__.py +0 -0
devflow_engine/vendor/datalumina_genai/core/exceptions.py +9 -0
devflow_engine/vendor/datalumina_genai/core/nodes/__init__.py +0 -0
devflow_engine/vendor/datalumina_genai/core/nodes/agent.py +48 -0
devflow_engine/vendor/datalumina_genai/core/nodes/agent_streaming_node.py +26 -0
devflow_engine/vendor/datalumina_genai/core/nodes/base.py +89 -0
devflow_engine/vendor/datalumina_genai/core/nodes/concurrent.py +30 -0
devflow_engine/vendor/datalumina_genai/core/nodes/router.py +69 -0
devflow_engine/vendor/datalumina_genai/core/schema.py +72 -0
devflow_engine/vendor/datalumina_genai/core/task.py +52 -0
devflow_engine/vendor/datalumina_genai/core/validate.py +139 -0
devflow_engine/vendor/datalumina_genai/core/workflow.py +200 -0
devflow_engine/worker.py +1086 -0
devflow_engine/worker_guard.py +233 -0
devflow_engine-1.0.0.dist-info/METADATA +235 -0
devflow_engine-1.0.0.dist-info/RECORD +393 -0
devflow_engine-1.0.0.dist-info/WHEEL +4 -0
devflow_engine-1.0.0.dist-info/entry_points.txt +3 -0
devin/__init__.py +6 -0
devin/dag.py +58 -0
devin/dag_two_arm.py +138 -0
devin/devin_chat_scenario_catalog.json +588 -0
devin/devin_eval.py +677 -0
devin/nodes/__init__.py +0 -0
devin/nodes/ideation/__init__.py +0 -0
devin/nodes/ideation/node.py +195 -0
devin/nodes/ideation/playground.py +267 -0
devin/nodes/ideation/prompt.md +65 -0
devin/nodes/ideation/scenarios/continue_refinement.py +13 -0
devin/nodes/ideation/scenarios/continue_refinement_evals.py +18 -0
devin/nodes/ideation/scenarios/idea_fits_existing_patterns.py +17 -0
devin/nodes/ideation/scenarios/idea_fits_existing_patterns_evals.py +16 -0
devin/nodes/ideation/scenarios/large_idea_split.py +4 -0
devin/nodes/ideation/scenarios/large_idea_split_evals.py +17 -0
devin/nodes/ideation/scenarios/source_documentation_added.py +4 -0
devin/nodes/ideation/scenarios/source_documentation_added_evals.py +16 -0
devin/nodes/ideation/scenarios/user_says_create_it.py +30 -0
devin/nodes/ideation/scenarios/user_says_create_it_evals.py +23 -0
devin/nodes/ideation/scenarios/vague_idea.py +16 -0
devin/nodes/ideation/scenarios/vague_idea_evals.py +47 -0
devin/nodes/ideation/tools.json +312 -0
devin/nodes/insight/__init__.py +0 -0
devin/nodes/insight/node.py +49 -0
devin/nodes/insight/playground.py +154 -0
devin/nodes/insight/prompt.md +61 -0
devin/nodes/insight/scenarios/architecture_pattern_query.py +15 -0
devin/nodes/insight/scenarios/architecture_pattern_query_evals.py +25 -0
devin/nodes/insight/scenarios/codebase_exploration.py +15 -0
devin/nodes/insight/scenarios/codebase_exploration_evals.py +23 -0
devin/nodes/insight/scenarios/devin_ideation_routing.py +19 -0
devin/nodes/insight/scenarios/devin_ideation_routing_evals.py +39 -0
devin/nodes/insight/scenarios/devin_insight_routing.py +20 -0
devin/nodes/insight/scenarios/devin_insight_routing_evals.py +40 -0
devin/nodes/insight/scenarios/operational_debugging.py +15 -0
devin/nodes/insight/scenarios/operational_debugging_evals.py +23 -0
devin/nodes/insight/scenarios/operational_question.py +9 -0
devin/nodes/insight/scenarios/operational_question_evals.py +8 -0
devin/nodes/insight/scenarios/queue_status.py +15 -0
devin/nodes/insight/scenarios/queue_status_evals.py +23 -0
devin/nodes/insight/scenarios/source_doc_explanation.py +14 -0
devin/nodes/insight/scenarios/source_doc_explanation_evals.py +21 -0
devin/nodes/insight/scenarios/worker_state_check.py +15 -0
devin/nodes/insight/scenarios/worker_state_check_evals.py +22 -0
devin/nodes/insight/tools.json +126 -0
devin/nodes/intake/__init__.py +0 -0
devin/nodes/intake/node.py +27 -0
devin/nodes/intake/playground.py +47 -0
devin/nodes/intake/prompt.md +12 -0
devin/nodes/intake/scenarios/ideation_routing.py +4 -0
devin/nodes/intake/scenarios/ideation_routing_evals.py +5 -0
devin/nodes/intake/scenarios/insight_routing.py +4 -0
devin/nodes/intake/scenarios/insight_routing_evals.py +5 -0
devin/nodes/iterate/README.md +44 -0
devin/nodes/iterate/__init__.py +1 -0
devin/nodes/iterate/_archived_design_stages/01-objectives-requirements.md +112 -0
devin/nodes/iterate/_archived_design_stages/02-evals.md +131 -0
devin/nodes/iterate/_archived_design_stages/03-tools-and-boundaries.md +110 -0
devin/nodes/iterate/_archived_design_stages/04-harness-and-playground.md +32 -0
devin/nodes/iterate/_archived_design_stages/05-prompt-deferred.md +11 -0
devin/nodes/iterate/_archived_design_stages/coder_agent_design/01-objectives-requirements.md +20 -0
devin/nodes/iterate/_archived_design_stages/coder_agent_design/02-evals.md +8 -0
devin/nodes/iterate/_archived_design_stages/coder_agent_design/03-tools-and-boundaries.md +14 -0
devin/nodes/iterate/_archived_design_stages/coder_agent_design/04-harness-and-playground.md +12 -0
devin/nodes/iterate/_archived_design_stages/framer_agent_design/01-objectives-requirements.md +20 -0
devin/nodes/iterate/_archived_design_stages/framer_agent_design/02-evals.md +8 -0
devin/nodes/iterate/_archived_design_stages/framer_agent_design/03-tools-and-boundaries.md +13 -0
devin/nodes/iterate/_archived_design_stages/framer_agent_design/04-harness-and-playground.md +12 -0
devin/nodes/iterate/_archived_design_stages/iterator_agent_design/01-objectives-requirements.md +25 -0
devin/nodes/iterate/_archived_design_stages/iterator_agent_design/02-evals.md +9 -0
devin/nodes/iterate/_archived_design_stages/iterator_agent_design/03-tools-and-boundaries.md +14 -0
devin/nodes/iterate/_archived_design_stages/iterator_agent_design/04-harness-and-playground.md +12 -0
devin/nodes/iterate/_archived_design_stages/observer_agent_design/01-objectives-requirements.md +20 -0
devin/nodes/iterate/_archived_design_stages/observer_agent_design/02-evals.md +8 -0
devin/nodes/iterate/_archived_design_stages/observer_agent_design/03-tools-and-boundaries.md +14 -0
devin/nodes/iterate/_archived_design_stages/observer_agent_design/04-harness-and-playground.md +13 -0
devin/nodes/iterate/agent-roles.md +89 -0
devin/nodes/iterate/agents/README.md +10 -0
devin/nodes/iterate/artifacts.md +504 -0
devin/nodes/iterate/contract.md +100 -0
devin/nodes/iterate/eval-plan.md +74 -0
devin/nodes/iterate/node.py +100 -0
devin/nodes/iterate/pipeline/README.md +13 -0
devin/nodes/iterate/playground-contract.md +76 -0
devin/nodes/iterate/prompt.md +11 -0
devin/nodes/iterate/scenarios/README.md +38 -0
devin/nodes/iterate/scenarios/artifact-and-loop-scenarios.md +101 -0
devin/nodes/iterate/scenarios/coder_artifact_alignment.py +32 -0
devin/nodes/iterate/scenarios/coder_artifact_alignment_evals.py +45 -0
devin/nodes/iterate/scenarios/coder_bounded_fix.py +27 -0
devin/nodes/iterate/scenarios/coder_bounded_fix_evals.py +45 -0
devin/nodes/iterate/scenarios/devin_iterate_routing.py +21 -0
devin/nodes/iterate/scenarios/devin_iterate_routing_evals.py +36 -0
devin/nodes/iterate/scenarios/framer_scope_boundary.py +25 -0
devin/nodes/iterate/scenarios/framer_scope_boundary_evals.py +57 -0
devin/nodes/iterate/scenarios/framer_task_framing.py +25 -0
devin/nodes/iterate/scenarios/framer_task_framing_evals.py +58 -0
devin/nodes/iterate/scenarios/iterate_error_fix.py +21 -0
devin/nodes/iterate/scenarios/iterate_error_fix_evals.py +39 -0
devin/nodes/iterate/scenarios/iterate_quick_change.py +21 -0
devin/nodes/iterate/scenarios/iterate_quick_change_evals.py +35 -0
devin/nodes/iterate/scenarios/iterate_to_idea_promotion.py +23 -0
devin/nodes/iterate/scenarios/iterate_to_idea_promotion_evals.py +53 -0
devin/nodes/iterate/scenarios/iterate_to_insight_reroute.py +23 -0
devin/nodes/iterate/scenarios/iterate_to_insight_reroute_evals.py +53 -0
devin/nodes/iterate/scenarios/observer_evidence_seam.py +28 -0
devin/nodes/iterate/scenarios/observer_evidence_seam_evals.py +55 -0
devin/nodes/iterate/scenarios/observer_repro_creation.py +28 -0
devin/nodes/iterate/scenarios/observer_repro_creation_evals.py +45 -0
devin/nodes/iterate/scenarios/routing-matrix.md +45 -0
devin/nodes/shared/__init__.py +0 -0
devin/nodes/shared/filemaker_expert.md +80 -0
devin/nodes/shared/filemaker_expert.py +354 -0
devin/nodes/shared/filemaker_expert_eval/runner.py +176 -0
devin/nodes/shared/filemaker_expert_eval/scenarios.json +65 -0
devin/nodes/shared/goldilocks_advisor_eval/runner.py +214 -0
devin/nodes/shared/goldilocks_advisor_eval/scenarios.json +58 -0
devin/nodes/shared/helpers.py +156 -0
devin/nodes/shared/idea_compliance_advisor_eval/runner.py +252 -0
devin/nodes/shared/idea_compliance_advisor_eval/scenarios.json +75 -0
devin/nodes/shared/models.py +44 -0
devin/nodes/shared/post.py +40 -0
devin/nodes/shared/router.py +107 -0
devin/nodes/shared/tools.py +191 -0
devin/shared/devin-chat-rubric.md +237 -0
devin/shared/devin-chat-scenario-suite.md +90 -0
devin/shared/eval_doctrine.md +9 -0

devflow_engine/scope_idea/models.py ADDED Viewed

@@ -0,0 +1,175 @@
+from __future__ import annotations
+from typing import Any, Literal
+from pydantic import BaseModel, Field
+ScopeShape = Literal["too_broad", "just_right", "too_narrow"]  # Closed set of scope-size labels used by the `scope_shape` / `decision` fields in this module.
+ResolutionStatus = Literal["ideas_registered", "narrow_scope_review_required"]  # Closed set of values accepted by `IdeaResolutionPackageArtifact.resolution_status`.
+class SourceEvidenceRef(BaseModel):  # Pydantic model pairing a required reference string with an optional summary.
+    ref: str  # Required; the reference format is not constrained here.
+    summary: str | None = None  # Optional; defaults to None.
+class ArtifactLineage(BaseModel):  # Pydantic model of lineage fields for an artifact: stage, origin, mode, and optional path/run references.
+    stage: str
+    origin: Literal["model", "fallback", "deterministic"]  # Restricted to exactly these three values.
+    mode: str  # Plain str; allowed values are not constrained here.
+    artifact_path: str | None = None  # Optional; defaults to None.
+    agent_run_ref: str | None = None  # Optional; defaults to None.
+    generated_from: list[str] = Field(default_factory=list)  # default_factory gives each instance its own empty list.
+    notes: list[str] = Field(default_factory=list)
+    metadata: dict[str, Any] = Field(default_factory=dict)  # Free-form mapping; defaults to a fresh empty dict per instance.
+class ScopeContextArtifact(BaseModel):  # Pydantic model identifying a scope (project/scope-set/scope ids, title, description) plus optional supporting lists.
+    project_id: str
+    scope_set_id: str
+    scope_id: str
+    scope_title: str
+    scope_description: str
+    source_support: list[SourceEvidenceRef] = Field(default_factory=list)  # Nested SourceEvidenceRef models; empty list by default.
+    assumptions: list[str] = Field(default_factory=list)
+    cross_cutting_constraints: list[str] = Field(default_factory=list)
+    neighbor_scope_refs: list[str] = Field(default_factory=list)
+    approval_status: str = "approved"  # Defaults to "approved" when not supplied; other values are not constrained here.
+class GoldilocksAssessmentArtifact(BaseModel):  # Pydantic model for a scope-size assessment: required scope_shape and reasoning, plus optional signal lists and flags.
+    execution_lineage: ArtifactLineage | None = None  # Optional lineage record; None when absent.
+    scope_shape: ScopeShape  # Required; one of the ScopeShape literals.
+    reasoning: str  # Required.
+    dominant_outcomes: list[str] = Field(default_factory=list)
+    workflow_clusters: list[str] = Field(default_factory=list)
+    actor_clusters: list[str] = Field(default_factory=list)
+    outcome_coherence_summary: str | None = None
+    business_outcome_signals: list[str] = Field(default_factory=list)
+    implementation_detail_signals: list[str] = Field(default_factory=list)
+    breadth_signals: list[str] = Field(default_factory=list)
+    cohesion_notes: list[str] = Field(default_factory=list)
+    split_recommended: bool = False  # Defaults to False.
+    recommended_child_idea_count: int = 1  # Defaults to 1; no range validation is declared here.
+    merge_review_recommended: bool = False  # Defaults to False.
+    notes: list[str] = Field(default_factory=list)
+class GoldilocksDecisionArtifact(BaseModel):  # Pydantic model holding a ScopeShape decision, its reason, and the name of the next node.
+    decision: ScopeShape  # One of the ScopeShape literals.
+    reason: str
+    next_node: str  # NOTE(review): presumably a DAG node identifier - confirm against the DAG that consumes this.
+class IdeaCandidateArtifact(BaseModel):  # Pydantic model for one idea candidate; only execution_lineage, refs, and split_rationale have defaults.
+    execution_lineage: ArtifactLineage | None = None  # Optional lineage record; None when absent.
+    idea_candidate_id: str
+    project_id: str
+    scope_set_id: str
+    scope_id: str
+    parent_scope_id: str
+    refs: list[str] = Field(default_factory=list)  # Optional; fresh empty list per instance.
+    title: str
+    problem: str
+    users: list[str]  # Required list (no default), unlike `refs`.
+    goal: str
+    scope: list[str]  # Required list (no default).
+    constraints: list[str]  # Required list (no default).
+    acceptance_criteria: list[str]  # Required list (no default).
+    assumptions: list[str]  # Required list (no default).
+    traceability: list[str]  # Required list (no default).
+    split_rationale: str | None = None  # Optional; defaults to None.
+class IdeaSplitPlanArtifact(BaseModel):  # Pydantic model for a split plan: scope identifiers, a split_required flag with rationale, and child idea candidates.
+    execution_lineage: ArtifactLineage | None = None  # Optional lineage record; None when absent.
+    project_id: str
+    scope_set_id: str
+    scope_id: str
+    parent_scope_id: str
+    refs: list[str] = Field(default_factory=list)
+    split_required: bool  # Required (no default).
+    split_rationale: str  # Required here, whereas IdeaCandidateArtifact.split_rationale is optional.
+    child_ideas: list[IdeaCandidateArtifact]  # Required list of nested IdeaCandidateArtifact models.
+    coverage_of_parent_scope: list[str] = Field(default_factory=list)
+    remaining_risks: list[str] = Field(default_factory=list)
+class IdeaCandidateSetArtifact(BaseModel):  # Pydantic model bundling the idea candidates for a scope with a count and a split flag.
+    lineage: list[ArtifactLineage] = Field(default_factory=list)  # A list of lineage records here, vs. the single optional `execution_lineage` on other models.
+    project_id: str
+    scope_set_id: str
+    scope_id: str
+    parent_scope_id: str
+    refs: list[str] = Field(default_factory=list)
+    idea_candidates: list[IdeaCandidateArtifact]  # Required list of nested IdeaCandidateArtifact models.
+    candidate_count: int  # Supplied by the caller; no validator in this class ties it to len(idea_candidates).
+    split_applied: bool  # Required (no default).
+    split_rationale: str | None = None  # Optional; defaults to None.
+class RegisteredIdeaArtifact(BaseModel):  # Pydantic model for one registered idea; every field except execution_lineage is a required str.
+    execution_lineage: ArtifactLineage | None = None  # Optional lineage record; None when absent.
+    idea_id: str
+    source_scope_id: str
+    parent_scope_id: str
+    idea_candidate_id: str
+    title: str
+    summary: str
+    registry_ref: str
+    idea_ref: str
+    status: str  # Plain str; allowed values are not constrained here.
+class IdeaRegistryRecordArtifact(BaseModel):  # Pydantic model for a registry record: scope identifiers, scope_shape, and the registered ideas.
+    lineage: list[ArtifactLineage] = Field(default_factory=list)  # List of lineage records; empty by default.
+    project_id: str
+    scope_set_id: str
+    scope_id: str
+    parent_scope_id: str
+    refs: list[str] = Field(default_factory=list)
+    scope_shape: ScopeShape  # One of the ScopeShape literals.
+    registered_ideas: list[RegisteredIdeaArtifact]  # Required list (no default).
+    registration_timestamp: str  # Stored as a str; no timestamp format is enforced here.
+    registry_root: str
+class NarrowScopeReviewArtifact(BaseModel):  # Pydantic model for a too-narrow scope review: reason, suggested merge targets, and next action.
+    execution_lineage: ArtifactLineage | None = None  # Optional lineage record; None when absent.
+    project_id: str
+    scope_set_id: str
+    scope_id: str
+    parent_scope_id: str
+    refs: list[str] = Field(default_factory=list)
+    reason_too_narrow: str  # Required.
+    suggested_merge_targets: list[str] = Field(default_factory=list)
+    human_review_required: bool = True  # Defaults to True.
+    recommended_next_action: str  # Required.
+class IdeaResolutionPackageArtifact(BaseModel):  # Pydantic model summarizing a scope's resolution: status, registered ideas, risks, and review flags.
+    lineage: list[ArtifactLineage] = Field(default_factory=list)  # List of lineage records; empty by default.
+    project_id: str
+    scope_set_id: str
+    scope_id: str
+    parent_scope_id: str
+    refs: list[str] = Field(default_factory=list)
+    scope_shape: ScopeShape  # One of the ScopeShape literals.
+    split_applied: bool
+    resolution_status: ResolutionStatus  # One of the ResolutionStatus literals.
+    registered_idea_count: int  # Supplied by the caller; no validator in this class ties it to len(registered_ideas).
+    registered_ideas: list[RegisteredIdeaArtifact] = Field(default_factory=list)  # Optional here (empty by default), unlike IdeaRegistryRecordArtifact.registered_ideas.
+    assumptions_added: list[str] = Field(default_factory=list)
+    remaining_risks: list[str] = Field(default_factory=list)
+    recommended_next_action: str
+    review_required: bool = False  # Defaults to False.
+    review_package_ref: str | None = None  # Optional; defaults to None.
+class ScopeIdeaDagSummary(BaseModel):  # Pydantic model summarizing a run: exit code, run id, pipeline directory, message, and an outcome mapping.
+    exit_code: int
+    run_id: str
+    pipeline_dir: str  # Stored as a str path, not a pathlib.Path.
+    message: str
+    outcome: dict[str, object]  # Values typed as `object` (ArtifactLineage.metadata uses `Any` instead); required, no default.

devflow_engine/skills/builtins/devflow/queue_failure_investigation/SKILL.md ADDED Viewed

@@ -0,0 +1,112 @@
+---
+name: devflow-queue-failure-investigation
+description: Cross-cutting DevFlow skill for failure/log investigation across queue lanes, with log-first evidence order and run-correlation doctrine.
+owner: devflow
+scope: built-in
+version: 1
+---
+# DevFlow queue: failure investigation / logs
+Use this skill when the task is to answer:
+- what failed
+- where it failed
+- whether the queue state matches the real failure
+- whether recovery is acting on the correct seam
+- whether a run is actually stuck, stale, or merely mis-correlated
+This is the cross-cutting investigation module for all queue lanes.
+## Core doctrine
+Do not start from summary rows alone when richer evidence exists.
+Prefer this evidence order:
+1. **Primary:** streamed LLM / agent logs and session evidence
+   - `/Users/devflow/.devflow/llm_logs/*.jsonl`
+   - `/Users/devflow/.devflow/llm_sessions.sqlite`
+2. **Secondary:** node-level artifacts and errors
+   - `artifacts`
+   - `errors`
+   - `nodes`
+3. **Tertiary:** queue rows and worker summary state
+   - `idea_queue`
+   - `story_queue`
+   - `integration_queue`
+   - `recovery_queue`
+   - `project_workers`
+## Standard investigation loop
+1. Identify the lane and durable item id.
+2. Read the queue row and current worker state.
+3. Correlate to the wrapper/orchestration run.
+4. Search for the real child DAG run if the wrapper is thin.
+5. Read logs/artifacts for the failing stage.
+6. Classify the failure as one of:
+   - real code/runtime failure
+   - stale worker / reconciliation failure
+   - wrong-run investigation
+   - repeated churn with no material change
+   - blocked by prerequisite/state boundary
+## Wrapper-vs-child run rule
+Never assume the user-facing wrapper run id is the same as the actual child DAG run id.
+Check for mismatch explicitly.
+Correlate on:
+- queue item id
+- `story_id` or `idea_id` when relevant
+- repo root
+- created-at time window
+- artifact paths
+- node sequence
+A wrapper run can look stranded even while the child DAG succeeded correctly.
+Do not call the whole flow failed until both layers are checked.
+## First inspection targets
+### For any failed lane
+- queue row `failure_message`
+- queue row `failure_context_json`
+- matching run(s) in `runs`
+- matching node rows in `nodes`
+- matching `errors`
+- high-value `artifacts`
+### For story churn
+- `actual_failed_node`
+- `churn_state`
+- streamed transcripts for Green/Refactor/Security/etc.
+- whether the edits hit the correct seam
+### For recovery churn
+- recovery diagnosis/execution artifacts
+- durable churn-gate evidence
+- whether the same failure signature repeated without material repo/state change
+## What counts as success
+A failure investigation is successful when it produces a grounded answer to:
+- the failing boundary
+- the best primary evidence
+- whether the state is real failure vs stale/mis-correlated state
+- the next correct lane: retry, recovery, escalate, or declare blocked
+## What counts as blockage
+Treat the investigation itself as blocked when:
+- the queue item cannot be correlated to any relevant run or artifact
+- logs are missing and DB evidence is internally inconsistent
+- the worker/report state is stale and must be reconciled first
+- the operator is still looking at the wrong wrapper run
+## Strong future tool candidates
+- log-first failure packet reader
+- queue item -> run/artifact/session correlation helper
+- wrapper-child mismatch detector
+- churn explainer for story/recovery lanes
+- lane-specific first-evidence summary helper

devflow_engine/skills/builtins/devflow/queue_idea_to_story/SKILL.md ADDED Viewed

@@ -0,0 +1,120 @@
+---
+name: devflow-queue-idea-to-story
+description: Operational DevFlow skill for starting, observing, and investigating the idea-to-story queue lane.
+owner: devflow
+scope: built-in
+version: 1
+---
+# DevFlow queue: idea -> story
+Use this skill when the task is about the **runtime lane that turns an already-approved idea into story outputs**.
+This skill starts at the queue/runtime boundary.
+It does **not** replace:
+- `devin/ideation`
+- `devin/idea_to_story_handoff`
+Those own conversational approval truth.
+This skill owns operational inspection after the idea payload exists or the queue lane is being discussed.
+## Core job
+Determine whether an idea has:
+- been queued for story generation
+- been claimed and started
+- produced durable story outputs
+- failed, blocked, or stalled
+## How to start / kick the lane
+Primary runtime path:
+- ensure an `idea_queue` item exists for the `idea_id`
+- run `devflow worker start --project <project_id> --once` for one-step pickup
+- or `devflow worker start --project <project_id>` to drain the queue
+Supabase/control-plane path in this repo:
+- `devflow worker supabase-events`
+- supported request event: `devflow.idea.stories.generate.request`
+Do not say story generation started just because the idea was approved in conversation.
+Runtime start begins when the queue item is claimed and the worker starts `worker.idea_to_story`.
+## Observe status
+Check in this order:
+1. `devflow worker report --project <project_id>`
+2. `idea_queue` row in `<repo_root>/.devflow/execution.sqlite`
+3. correlated run in `runs` of kind `worker.idea_to_story`
+4. generated idea/story artifacts under `.devflow/ideas/<idea_id>/...`
+5. canonical story outputs under `ai_docs/context/v2/project_docs/user_stories/`
+Good first SQL snapshot:
+```sql
+select idea_queue_id, idea_id, status, started_run_id, finished_run_id, failure_message, updated_at
+from idea_queue
+where project_id = '<project_id>'
+order by updated_at desc;
+```
+High-value artifact locations:
+- `.devflow/ideas/<idea_id>/traditional_user_stories/<story_set_id>/`
+- `.devflow/ideas/<idea_id>/devflow_story_sets/<devflow_story_set_id>/`
+- `ai_docs/context/v2/project_docs/user_stories/`
+## Investigate failures
+Look first at:
+1. `idea_queue.failure_message`
+2. `idea_queue.failure_context_json`
+3. `runs` / `nodes` / `artifacts` for the correlated run
+4. any `resume_cursor` recorded in failure context
+5. story-generation artifacts in the idea directory
+Helpful current commands:
+- `devflow worker failed-ideas --project <project_id>`
+- `devflow worker retry-idea --project <project_id> --latest`
+- `devflow worker retry-idea --project <project_id> --latest --run-now`
+If the lane failed after partial output, verify whether the failure happened in:
+- traditional story decomposition
+- story-plane adjudication
+- DevFlow story compilation
+- downstream sync/publication after story artifacts already exist
+## Primary evidence to inspect first
+1. `idea_queue` row
+2. run + node records
+3. `.devflow/ideas/<idea_id>/traditional_user_stories/...`
+4. `.devflow/ideas/<idea_id>/devflow_story_sets/...`
+5. canonical generated story docs
+If richer agent logs exist for the failure, prefer those over summary fields.
+## What counts as success
+Only treat the lane as successful when:
+- the `idea_queue` row is terminal-complete
+- the run finished successfully
+- durable story outputs exist for the idea
+- the canonical generated story surface was updated when that step belongs to the run
+## What counts as blockage
+Treat these as blocked/problem states:
+- `idea_queue.status = failed`
+- repeated retries with the same `resume_cursor` and no new durable outputs
+- story artifacts exist but queue/run reconciliation is inconsistent
+- the idea payload is missing or stale for the referenced `idea_id`
+- recovery has taken over the lane
+## Strong future tool candidates
+- latest `idea_queue` summary for an `idea_id`
+- `resume_cursor` explainer
+- story-output locator for an `idea_id`
+- latest failed idea retry helper
+- queue-row -> run/artifact correlation helper

devflow_engine/skills/builtins/devflow/queue_integration/SKILL.md ADDED Viewed

@@ -0,0 +1,105 @@
+---
+name: devflow-queue-integration
+description: Operational DevFlow skill for kicking, observing, and investigating integration_queue work and integration DAG outputs.
+owner: devflow
+scope: built-in
+version: 1
+---
+# DevFlow queue: integration
+Use this skill when the task is about **integration follow-through for an implemented idea**.
+## Core job
+Determine whether integration work for an `idea_id` has:
+- had a payload prepared
+- been enqueued
+- started via worker execution
+- completed with durable current artifacts
+- failed and handed off to recovery
+## How to start / kick the lane
+Current repo surfaces:
+- `devflow integration prepare <idea_id>`
+- `devflow integration enqueue <idea_id> --project <project_id>`
+- `devflow worker start --project <project_id> --once`
+Manual direct run exists but is not the queue path:
+- `devflow integration run <idea_id>`
+When operating the queue lane, prefer enqueue + worker over claiming queue progress from a manual run.
+## Observe status
+Check in this order:
+1. `devflow integration status <idea_id>`
+2. `devflow worker report --project <project_id>`
+3. `integration_queue` row in `<repo_root>/.devflow/execution.sqlite`
+4. correlated run of kind `worker.integration`
+5. idea-local integration artifacts
+High-value artifact locations:
+- `.devflow/ideas/<idea_id>/integration_payload.json`
+- `.devflow/ideas/<idea_id>/integration/current/`
+- `.devflow/ideas/<idea_id>/integration/runs/`
+- legacy fallback location: `.devflow/ideas/<idea_id>/pipelines/integration_dag/`
+Good first SQL snapshot:
+```sql
+select integration_queue_id, idea_id, status, started_run_id, finished_run_id, failure_message, updated_at
+from integration_queue
+where project_id = '<project_id>'
+order by updated_at desc;
+```
+## Investigate failures
+Look first at:
+1. `integration_queue.failure_message`
+2. `integration_queue.failure_context_json`
+3. `integration_payload.json`
+4. latest pipeline run directory
+5. run/node/artifact/error rows for `worker.integration`
+6. recovery queue state if the failure already escalated
+Common real failure shapes:
+- payload missing or stale for the `idea_id`
+- implemented-story evidence incomplete
+- integration DAG failed after starting
+- queue row failed but current artifacts partially exist
+## Primary evidence to inspect first
+1. `integration_queue` row
+2. `devflow integration status <idea_id>` output
+3. payload path
+4. latest integration run dir
+5. correlated DB run/artifact/error records
+## What counts as success
+Only treat the lane as successful when:
+- `integration_queue.status = completed`
+- the integration run succeeded
+- `.devflow/ideas/<idea_id>/integration/current/` exists, or an equivalent latest durable current state exists
+- any registered-project sync side effects completed when expected
+## What counts as blockage
+Treat these as blocked/problem states:
+- queue row failed
+- payload cannot be prepared/resolved
+- latest run exists but current durable integration state was not updated
+- recovery is now the active owner of the failed integration item
+## Strong future tool candidates
+- `idea_id` -> integration status summary
+- integration payload validator/locator
+- latest integration run summary
+- integration queue retry / inspect helper
+- queue-to-artifact correlation helper

devflow_engine/skills/builtins/devflow/queue_recovery/SKILL.md ADDED Viewed

@@ -0,0 +1,108 @@
+---
+name: devflow-queue-recovery
+description: Operational DevFlow skill for recovery_queue execution, recovery outcome classification, and recovery handoff inspection.
+owner: devflow
+scope: built-in
+version: 1
+---
+# DevFlow queue: recovery
+Use this skill when the task is about **post-failure recovery work** in `recovery_queue`.
+This skill complements `docs/recovery-dag-contract.md`.
+That doc explains the DAG contract.
+This skill explains how to operate and inspect the recovery lane concretely.
+## Core job
+Determine whether a failed queue item has:
+- been handed off into `recovery_queue`
+- started a real recovery run
+- been re-enqueued, delegated, blocked, or fully recovered
+- produced the expected recovery handoff artifact
+## How to start / kick the lane
+Normal path:
+- recovery items are enqueued automatically when a queue lane fails
+- run `devflow worker start --project <project_id> --once` for one-step pickup, or omit `--once` to drain the queue
+Separate command with different purpose:
+- `devflow worker recover --project <project_id>` repairs **stale worker ownership state**
+- it does **not** itself run the business recovery DAG for a fresh failure
+Do not bypass recovery state with direct SQL edits unless the task is explicitly DB repair.
+## Observe status
+Check in this order:
+1. `devflow worker report --project <project_id>`
+2. `recovery_queue` row in `<repo_root>/.devflow/execution.sqlite`
+3. correlated recovery run, usually `post_queue_failure_recovery_dag`
+4. recovery execution metadata / artifacts
+5. recovery handoff artifact on disk
+6. source queue row after recovery action
+Good first SQL snapshot:
+```sql
+select recovery_queue_id, source_queue_type, source_item_id, status, started_run_id, finished_run_id, failure_message, updated_at
+from recovery_queue
+where project_id = '<project_id>'
+order by updated_at desc;
+```
+High-value handoff artifact locations:
+- story-scoped: `.devflow/stories/<story_id>/recovery_handoff.json`
+- non-story fallback: `.devflow/recovery_handoffs/<queue_type>/<item_id>.json`
+## Investigate failures
+Look first at:
+1. `recovery_queue` row
+2. correlated recovery run + node/artifact/error records
+3. recovery handoff artifact
+4. source queue item state after attempted recovery
+5. rich logs gathered during recovery investigation/execution
+Important recovery outcomes to classify correctly:
+- `reenqueued`
+- `delegated`
+- `blocked`
+- `recovered`
+Do not compress those into a generic "fixed" claim.
+## Primary evidence to inspect first
+1. `recovery_queue.status`
+2. recovery run status
+3. published recovery summary / handoff artifact
+4. source queue row reconciliation
+5. churn/no-material-change evidence if retries repeat
+## What counts as success
+Only treat recovery as successful when the durable result matches the declared outcome:
+- `reenqueued` -> source queue row was actually reset/re-queued
+- `delegated` -> the handoff/delegation artifact exists and the target lane is explicit
+- `recovered` -> the recovery row completed and the source item is reconciled as intended
+## What counts as blockage
+Treat these as blocked/problem states:
+- `recovery_queue.status = failed` or `blocked`
+- durable churn gate fired for repeated no-material-change recovery
+- recovery kept acting on the wrong seam
+- handoff artifact is missing despite a claimed publish step
+- source queue row did not reconcile to the declared outcome
+## Strong future tool candidates
+- latest recovery queue item summary
+- source queue item -> recovery chain reader
+- recovery handoff locator
+- recovery outcome explainer
+- durable churn-gate state reader