RubyGems - aidp - Versions diffs - 0.33.0 → 0.34.0 - Mend

aidp 0.33.0 → 0.34.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (83)

checksums.yaml +4 -4
data/README.md +35 -0
data/lib/aidp/analyze/tree_sitter_scan.rb +3 -0
data/lib/aidp/cli/eval_command.rb +399 -0
data/lib/aidp/cli/harness_command.rb +1 -1
data/lib/aidp/cli/security_command.rb +416 -0
data/lib/aidp/cli/tools_command.rb +6 -4
data/lib/aidp/cli.rb +170 -3
data/lib/aidp/concurrency/exec.rb +3 -0
data/lib/aidp/config.rb +113 -0
data/lib/aidp/config_paths.rb +20 -0
data/lib/aidp/daemon/runner.rb +8 -4
data/lib/aidp/errors.rb +134 -0
data/lib/aidp/evaluations/context_capture.rb +205 -0
data/lib/aidp/evaluations/evaluation_record.rb +114 -0
data/lib/aidp/evaluations/evaluation_storage.rb +250 -0
data/lib/aidp/evaluations.rb +23 -0
data/lib/aidp/execute/async_work_loop_runner.rb +4 -1
data/lib/aidp/execute/interactive_repl.rb +6 -2
data/lib/aidp/execute/prompt_evaluator.rb +359 -0
data/lib/aidp/execute/repl_macros.rb +100 -1
data/lib/aidp/execute/work_loop_runner.rb +399 -47
data/lib/aidp/execute/work_loop_state.rb +4 -1
data/lib/aidp/execute/workflow_selector.rb +3 -0
data/lib/aidp/harness/ai_decision_engine.rb +79 -0
data/lib/aidp/harness/capability_registry.rb +2 -0
data/lib/aidp/harness/condition_detector.rb +3 -0
data/lib/aidp/harness/config_loader.rb +3 -0
data/lib/aidp/harness/enhanced_runner.rb +14 -11
data/lib/aidp/harness/error_handler.rb +3 -0
data/lib/aidp/harness/provider_factory.rb +3 -0
data/lib/aidp/harness/provider_manager.rb +6 -0
data/lib/aidp/harness/runner.rb +5 -1
data/lib/aidp/harness/state/persistence.rb +3 -0
data/lib/aidp/harness/state_manager.rb +3 -0
data/lib/aidp/harness/status_display.rb +28 -20
data/lib/aidp/harness/thinking_depth_manager.rb +32 -32
data/lib/aidp/harness/ui/enhanced_tui.rb +4 -0
data/lib/aidp/harness/ui/enhanced_workflow_selector.rb +4 -0
data/lib/aidp/harness/ui/error_handler.rb +3 -0
data/lib/aidp/harness/ui/job_monitor.rb +4 -0
data/lib/aidp/harness/ui/navigation/submenu.rb +2 -0
data/lib/aidp/harness/ui/navigation/workflow_selector.rb +6 -0
data/lib/aidp/harness/ui/spinner_helper.rb +3 -0
data/lib/aidp/harness/ui/workflow_controller.rb +3 -0
data/lib/aidp/harness/user_interface.rb +3 -0
data/lib/aidp/loader.rb +2 -2
data/lib/aidp/logger.rb +3 -0
data/lib/aidp/message_display.rb +31 -0
data/lib/aidp/pr_worktree_manager.rb +18 -6
data/lib/aidp/provider_manager.rb +3 -0
data/lib/aidp/providers/base.rb +2 -0
data/lib/aidp/security/rule_of_two_enforcer.rb +210 -0
data/lib/aidp/security/secrets_proxy.rb +328 -0
data/lib/aidp/security/secrets_registry.rb +227 -0
data/lib/aidp/security/trifecta_state.rb +220 -0
data/lib/aidp/security/watch_mode_handler.rb +306 -0
data/lib/aidp/security/work_loop_adapter.rb +277 -0
data/lib/aidp/security.rb +56 -0
data/lib/aidp/setup/wizard.rb +4 -2
data/lib/aidp/version.rb +1 -1
data/lib/aidp/watch/auto_merger.rb +274 -0
data/lib/aidp/watch/auto_pr_processor.rb +125 -7
data/lib/aidp/watch/build_processor.rb +16 -1
data/lib/aidp/watch/change_request_processor.rb +680 -286
data/lib/aidp/watch/ci_fix_processor.rb +262 -4
data/lib/aidp/watch/feedback_collector.rb +191 -0
data/lib/aidp/watch/hierarchical_pr_strategy.rb +256 -0
data/lib/aidp/watch/implementation_verifier.rb +142 -1
data/lib/aidp/watch/plan_generator.rb +70 -13
data/lib/aidp/watch/plan_processor.rb +12 -5
data/lib/aidp/watch/projects_processor.rb +286 -0
data/lib/aidp/watch/repository_client.rb +861 -53
data/lib/aidp/watch/review_processor.rb +33 -6
data/lib/aidp/watch/runner.rb +51 -11
data/lib/aidp/watch/state_store.rb +233 -0
data/lib/aidp/watch/sub_issue_creator.rb +221 -0
data/lib/aidp/workflows/guided_agent.rb +4 -0
data/lib/aidp/workstream_executor.rb +3 -0
data/lib/aidp/worktree.rb +61 -11
data/lib/aidp/worktree_branch_manager.rb +347 -101
data/templates/implementation/iterative_implementation.md +46 -3
metadata +20 -1

data/lib/aidp/execute/work_loop_runner.rb CHANGED

@@ -1,6 +1,7 @@
 # frozen_string_literal: true
 require_relative "prompt_manager"
+require_relative "prompt_evaluator"
 require_relative "checkpoint"
 require_relative "checkpoint_display"
 require_relative "guard_policy"
@@ -11,6 +12,7 @@ require_relative "steps"
 require_relative "../harness/test_runner"
 require_relative "../errors"
 require_relative "../style_guide/selector"
+require_relative "../security"
 module Aidp
   module Execute
@@ -39,7 +41,10 @@ module Aidp
       }.freeze
       include Aidp::MessageDisplay
-      attr_reader :iteration_count, :project_dir, :current_state
+      # Expose state for testability
+      attr_accessor :iteration_count, :step_name, :options, :persistent_tasklist
+      attr_reader :project_dir, :current_state, :state_history, :test_runner, :prompt_manager, :checkpoint
+      attr_writer :guard_policy, :prompt_manager, :style_guide_selector
       MAX_ITERATIONS = 50 # Safety limit
       CHECKPOINT_INTERVAL = 5 # Record checkpoint every N iterations
@@ -67,12 +72,18 @@ module Aidp
         # Initialize thinking depth manager for intelligent model selection
         require_relative "../harness/thinking_depth_manager"
-        @thinking_depth_manager = options[:thinking_depth_manager] || Aidp::Harness::ThinkingDepthManager.new(config)
+        @thinking_depth_manager = options[:thinking_depth_manager] || Aidp::Harness::ThinkingDepthManager.new(config, root_dir: @project_dir)
         @consecutive_failures = 0
         @last_tier = nil
         # Initialize style guide selector for intelligent section selection
         @style_guide_selector = options[:style_guide_selector] || Aidp::StyleGuide::Selector.new(project_dir: project_dir)
+        # FIX for issue #391: Initialize prompt evaluator for iteration threshold assessment
+        @prompt_evaluator = options[:prompt_evaluator] || PromptEvaluator.new(config)
+        # Initialize security adapter for Rule of Two enforcement
+        @security_adapter = options[:security_adapter] || Aidp::Security::WorkLoopAdapter.new(project_dir: project_dir)
       end
       # Execute a step using fix-forward work loop pattern
@@ -143,6 +154,11 @@ module Aidp
         @current_state = :ready
         @state_history.clear
+        # Begin security tracking for this agentic work unit
+        work_unit_id = "agentic_#{@step_name}_#{SecureRandom.hex(4)}"
+        @security_adapter.begin_work_unit(work_unit_id: work_unit_id, context: context)
+        display_security_status
         create_initial_prompt(step_spec, context)
         loop do
@@ -154,6 +170,10 @@ module Aidp
             display_message("⚠️  Max iterations (#{MAX_ITERATIONS}) reached for #{@step_name}", type: :warning)
             display_state_summary
             archive_and_cleanup
+            # End security tracking for this work unit
+            @security_adapter.end_work_unit
             return build_agentic_payload(
               agent_result: nil,
               response: build_max_iterations_result,
@@ -178,6 +198,30 @@ module Aidp
             prompt_length: prompt_length,
             checks: checks_summary)
+          # Check security policy before agent call (Rule of Two enforcement)
+          # Agent calls enable egress capability
+          begin
+            @security_adapter.check_agent_call_allowed!(operation: :agent_execution)
+          rescue Aidp::Security::PolicyViolation => e
+            # Security policy violation - cannot proceed with agent call
+            Aidp.logger.error("work_loop", "Security policy violation",
+              step: @step_name,
+              iteration: @iteration_count,
+              error: e.message)
+            display_message("  🛡️  Security policy violation: #{e.message}", type: :error)
+            display_message("  Cannot proceed - Rule of Two would be violated", type: :error)
+            # End security tracking and return error
+            @security_adapter.end_work_unit
+            return build_agentic_payload(
+              agent_result: nil,
+              response: {status: "error", message: "Security policy violation: #{e.message}"},
+              summary: nil,
+              completed: false,
+              terminate: true
+            )
+          end
           # Wrap agent call in exception handling for true fix-forward
           begin
             agent_result = apply_patch(preview_provider, preview_model)
@@ -185,6 +229,15 @@ module Aidp
             # Configuration errors should crash immediately (crash-early principle)
             # Re-raise without catching
             raise
+          rescue Aidp::Security::PolicyViolation => e
+            # Security violations should not continue - they are policy failures
+            Aidp.logger.error("work_loop", "Security policy violation during agent call",
+              step: @step_name,
+              iteration: @iteration_count,
+              error: e.message)
+            display_message("  🛡️  Security violation: #{e.message}", type: :error)
+            @security_adapter.end_work_unit
+            raise
           rescue => e
             # Convert exception to error result for fix-forward handling
             Aidp.logger.error("work_loop", "Exception during agent call",
@@ -263,13 +316,31 @@ module Aidp
           # Check task completion status
           task_completion_result = check_task_completion
+          agent_completed = agent_marked_complete?(agent_result)
+          # FIX for issue #391: Comprehensive logging at completion decision point
+          Aidp.log_debug("work_loop", "completion_decision_point",
+            iteration: @iteration_count,
+            all_checks_pass: all_checks_pass,
+            agent_marked_complete: agent_completed,
+            task_completion_complete: task_completion_result[:complete],
+            task_completion_reason: task_completion_result[:reason],
+            test_success: test_results[:success],
+            lint_success: lint_results[:success],
+            formatter_success: formatter_results[:success],
+            build_success: build_results[:success],
+            doc_success: doc_results[:success])
           if all_checks_pass
             transition_to(:pass)
-            if agent_marked_complete?(agent_result)
+            if agent_completed
               # Check if tasks are complete
               if task_completion_result[:complete]
+                Aidp.log_debug("work_loop", "completion_approved",
+                  iteration: @iteration_count,
+                  reason: task_completion_result[:reason])
                 transition_to(:done)
                 record_final_checkpoint(all_results)
                 display_task_summary
@@ -280,9 +351,13 @@ module Aidp
                   model: preview_model,
                   prompt_length: prompt_length,
                   checks: checks_summary,
-                  task_status: "complete")
+                  task_status: "complete",
+                  completion_reason: task_completion_result[:reason])
                 archive_and_cleanup
+                # End security tracking for this work unit
+                @security_adapter.end_work_unit
                 return build_agentic_payload(
                   agent_result: agent_result,
                   response: build_success_result(agent_result),
@@ -292,6 +367,11 @@ module Aidp
                 )
               else
                 # All checks passed but tasks not complete
+                Aidp.log_debug("work_loop", "completion_blocked_tasks_incomplete",
+                  iteration: @iteration_count,
+                  reason: task_completion_result[:reason],
+                  message: task_completion_result[:message])
                 display_message("  All checks passed but tasks not complete", type: :warning)
                 display_message("  #{task_completion_result[:message]}", type: :warning)
                 display_task_summary
@@ -300,13 +380,17 @@ module Aidp
                   model: preview_model,
                   prompt_length: prompt_length,
                   checks: checks_summary,
-                  task_status: "incomplete")
+                  task_status: "incomplete",
+                  task_completion_reason: task_completion_result[:reason])
                 transition_to(:next_patch)
                 # Append task completion requirement to PROMPT.md
                 append_task_requirement_to_prompt(task_completion_result[:message])
               end
             else
+              Aidp.log_debug("work_loop", "completion_blocked_agent_not_complete",
+                iteration: @iteration_count)
               display_message("  All checks passed but work not marked complete", type: :info)
               log_iteration_status("checks_passed_waiting_agent_completion",
                 provider: preview_provider,
@@ -331,7 +415,146 @@ module Aidp
               failures: failure_summary_for_log(all_results))
             prepare_next_iteration(all_results, diagnostic)
           end
+          # FIX for issue #391: Evaluate prompt effectiveness at iteration thresholds
+          # After 10+ iterations, assess whether the prompt is leading to progress
+          evaluate_prompt_effectiveness(all_results)
+        end
+      end
+      # Evaluate prompt effectiveness at iteration thresholds
+      # FIX for issue #391: Provides feedback when work loop is stuck
+      # Note: Errors during evaluation are logged but don't fail the work loop
+      def evaluate_prompt_effectiveness(all_results)
+        return unless @prompt_evaluator.should_evaluate?(@iteration_count)
+        Aidp.log_debug("work_loop", "evaluating_prompt_effectiveness",
+          iteration: @iteration_count)
+        display_message("📊 Evaluating prompt effectiveness (iteration #{@iteration_count})...", type: :info)
+        task_summary = build_task_summary_for_evaluation
+        prompt_content = @prompt_manager.read
+        evaluation = @prompt_evaluator.evaluate(
+          prompt_content: prompt_content,
+          iteration_count: @iteration_count,
+          task_summary: task_summary,
+          recent_failures: all_results,
+          step_name: @step_name
+        )
+        display_prompt_evaluation_results(evaluation)
+        # If prompt is deemed ineffective, append suggestions to PROMPT.md
+        unless evaluation[:effective]
+          append_evaluation_feedback_to_prompt(evaluation)
+        end
+        Aidp.log_info("work_loop", "prompt_evaluation_complete",
+          iteration: @iteration_count,
+          effective: evaluation[:effective],
+          confidence: evaluation[:confidence])
+      rescue => e
+        # Don't let evaluation errors break the work loop
+        Aidp.log_warn("work_loop", "prompt_evaluation_error",
+          iteration: @iteration_count,
+          error: e.message,
+          error_class: e.class.name)
+        display_message("  ⚠️  Prompt evaluation skipped due to error: #{e.message}", type: :muted)
+      end
+      def build_task_summary_for_evaluation
+        all_tasks = @persistent_tasklist.all
+        return {} if all_tasks.empty?
+        {
+          total: all_tasks.size,
+          done: all_tasks.count { |t| t.status == :done },
+          in_progress: all_tasks.count { |t| t.status == :in_progress },
+          pending: all_tasks.count { |t| t.status == :pending },
+          abandoned: all_tasks.count { |t| t.status == :abandoned }
+        }
+      end
+      def display_prompt_evaluation_results(evaluation)
+        # Skip display if evaluation was skipped
+        if evaluation[:skipped]
+          display_message("  ℹ️  Prompt evaluation skipped: #{evaluation[:skip_reason]}", type: :muted)
+          return
+        end
+        if evaluation[:effective]
+          display_message("  ✅ Prompt appears effective, continuing...", type: :success)
+        else
+          display_message("  ⚠️  Prompt may need improvement:", type: :warning)
+          if evaluation[:issues]&.any?
+            display_message("  Issues identified:", type: :info)
+            evaluation[:issues].each { |issue| display_message("    - #{issue}", type: :warning) }
+          end
+          if evaluation[:suggestions]&.any?
+            display_message("  Suggestions:", type: :info)
+            evaluation[:suggestions].take(3).each { |s| display_message("    - #{s}", type: :info) }
+          end
+          if evaluation[:likely_blockers]&.any?
+            display_message("  Likely blockers:", type: :warning)
+            evaluation[:likely_blockers].each { |b| display_message("    - #{b}", type: :error) }
+          end
+        end
+        display_message("  Confidence: #{(evaluation[:confidence] * 100).round}%", type: :muted)
+      end
+      def append_evaluation_feedback_to_prompt(evaluation)
+        feedback_section = build_evaluation_feedback_section(evaluation)
+        @prompt_manager.append(feedback_section)
+        Aidp.log_debug("work_loop", "appended_evaluation_feedback",
+          iteration: @iteration_count,
+          feedback_size: feedback_section.length)
+      end
+      def build_evaluation_feedback_section(evaluation)
+        parts = []
+        parts << "\n\n## ⚠️ Work Loop Progress Assessment (Iteration #{@iteration_count})"
+        parts << ""
+        parts << "The work loop has been running for #{@iteration_count} iterations without completion."
+        parts << "An automated assessment identified the following:"
+        parts << ""
+        if evaluation[:issues]&.any?
+          parts << "### Issues Identified"
+          evaluation[:issues].each { |i| parts << "- #{i}" }
+          parts << ""
+        end
+        if evaluation[:suggestions]&.any?
+          parts << "### Suggestions for Progress"
+          evaluation[:suggestions].each { |s| parts << "- #{s}" }
+          parts << ""
+        end
+        if evaluation[:recommended_actions]&.any?
+          parts << "### Recommended Actions"
+          evaluation[:recommended_actions].each do |action|
+            parts << "- [#{action[:priority]&.upcase || "MEDIUM"}] #{action[:action]}"
+            parts << "  Rationale: #{action[:rationale]}" if action[:rationale]
+          end
+          parts << ""
         end
+        parts << "### Next Steps"
+        parts << "Please address the above issues and either:"
+        parts << "1. Complete the remaining work and mark STATUS: COMPLETE"
+        parts << "2. File tasks for remaining work and complete them systematically"
+        parts << "3. If blocked, explain the blocker clearly in your response"
+        parts << ""
+        parts.join("\n")
       end
       def run_decider_agentic_unit(context)
@@ -802,18 +1025,27 @@ module Aidp
         # CRITICAL: Change to project directory before calling provider
         # This ensures Claude CLI runs in the correct directory and can create files
         Dir.chdir(@project_dir) do
-          # Send to provider via provider_manager with selected model
-          @provider_manager.execute_with_provider(
-            provider_name,
-            full_prompt,
-            {
-              step_name: @step_name,
-              iteration: @iteration_count,
-              project_dir: @project_dir,
-              model: model_name,
-              tier: @thinking_depth_manager.current_tier
-            }
-          )
+          # Execute with sanitized environment (secrets stripped) when security is enabled
+          # This ensures agent processes cannot access registered secrets directly
+          execute_block = lambda do
+            @provider_manager.execute_with_provider(
+              provider_name,
+              full_prompt,
+              {
+                step_name: @step_name,
+                iteration: @iteration_count,
+                project_dir: @project_dir,
+                model: model_name,
+                tier: @thinking_depth_manager.current_tier
+              }
+            )
+          end
+          if @security_adapter.enabled?
+            @security_adapter.with_sanitized_environment(&execute_block)
+          else
+            execute_block.call
+          end
         end
       end
@@ -947,7 +1179,9 @@ module Aidp
         []
       end
-      def log_iteration_status(status, provider:, model:, prompt_length:, checks: nil, failures: nil, task_status: nil)
+      # FIX for issue #391: Added completion_reason and task_completion_reason parameters for better logging
+      def log_iteration_status(status, provider:, model:, prompt_length:, checks: nil, failures: nil, task_status: nil,
+        completion_reason: nil, task_completion_reason: nil)
         context_labels = iteration_context_labels
         metadata = {
           step: @step_name,
@@ -959,7 +1193,9 @@ module Aidp
           prompt_length: prompt_length,
           checks: checks,
           failures: failures,
-          task_status: task_status
+          task_status: task_status,
+          completion_reason: completion_reason,
+          task_completion_reason: task_completion_reason
         }
         metadata.merge!(iteration_context_metadata)
@@ -975,17 +1211,19 @@ module Aidp
         Aidp.log_warn("work_loop", "failed_to_log_iteration_status", error: e.message)
       end
+      # FIX for issue #391: Enhanced work loop header with upfront task filing requirements
       def build_work_loop_header(step_name, iteration)
         parts = []
         parts << "# Work Loop: #{step_name} (Iteration #{iteration})"
         parts << ""
         parts << "## Instructions"
         parts << "You are working in a work loop. Your responsibilities:"
-        parts << "1. Read the task description below to understand what needs to be done"
-        parts << "2. **Write/edit code files** to implement the required changes"
-        parts << "3. Run tests to verify your changes work correctly"
-        parts << "4. Update the task list in PROMPT.md as you complete items"
-        parts << "5. When ALL tasks are complete and tests pass, mark the step COMPLETE"
+        parts << "1. **FIRST**: File tasks for all work items (see Task Filing section below)"
+        parts << "2. Read the task description below to understand what needs to be done"
+        parts << "3. **Write/edit CODE files** to implement the required changes"
+        parts << "4. Run tests to verify your changes work correctly"
+        parts << "5. Update task status as you complete items"
+        parts << "6. When ALL tasks are complete and tests pass, mark the step COMPLETE"
         parts << ""
         parts << "## Important Notes"
         parts << "- You have full file system access - create and edit files as needed"
@@ -993,29 +1231,53 @@ module Aidp
         parts << "- After you finish, tests and linters will run automatically"
         parts << "- If tests/linters fail, you'll see the errors in the next iteration and can fix them"
         parts << ""
+        parts << "## ⚠️  Code Changes Required"
+        parts << "**IMPORTANT**: This implementation requires actual code changes."
+        parts << "- Documentation-only changes will NOT be accepted as complete"
+        parts << "- Configuration-only changes will NOT be accepted as complete"
+        parts << "- You must modify/create code files (.rb, .py, .js, etc.) to implement the feature/fix"
+        parts << "- Tests should accompany code changes"
+        parts << ""
         if @config.task_completion_required?
-          parts << "## Task Tracking (REQUIRED)"
-          parts << "**CRITICAL**: This work loop requires task tracking for completion."
+          parts << "## Task Filing (REQUIRED - DO THIS FIRST)"
+          parts << "**CRITICAL**: This work loop requires task tracking. You MUST file tasks before implementation."
+          parts << ""
+          parts << "### Step 1: File Tasks Immediately"
+          parts << "In your FIRST iteration, analyze the requirements and file tasks for ALL work:"
           parts << ""
-          parts << "You must:"
-          parts << "1. Create at least one task for this session using: `File task: \"description\"`"
-          parts << "2. Track all work items as tasks"
-          parts << "3. Update task status as you progress"
-          parts << "4. All tasks must be DONE or ABANDONED (with reason) before completion"
-          parts << "5. **IMPORTANT**: When you write STATUS: COMPLETE, also mark all your tasks as done!"
+          parts << "```text"
+          parts << "File task: \"Implement [feature/fix description]\" priority: high tags: implementation"
+          parts << "File task: \"Add unit tests for [feature]\" priority: high tags: testing"
+          parts << "File task: \"Add integration tests if needed\" priority: medium tags: testing"
+          parts << "```"
           parts << ""
-          parts << "**Important**: Tasks in the list exist due to careful planning and requirements analysis."
-          parts << "Do NOT abandon tasks due to perceived complexity or scope concerns - these factors were"
-          parts << "considered during planning. Only abandon tasks when truly obsolete (requirements changed,"
-          parts << "duplicate work, external blockers). When in doubt, mark in_progress and implement."
+          parts << "### Step 2: Work Through Tasks"
+          parts << "- Pick the highest priority pending task"
+          parts << "- Implement it completely"
+          parts << "- Mark it done: `Update task: task_id status: done`"
+          parts << "- Repeat until all tasks are complete"
           parts << ""
-          parts << "Task filing examples:"
+          parts << "### Step 3: Complete the Work Loop"
+          parts << "Only after ALL tasks are done:"
+          parts << "- Verify tests pass"
+          parts << "- Add STATUS: COMPLETE to PROMPT.md"
+          parts << ""
+          parts << "### Task Rules"
+          parts << "- **At least ONE task must be filed** - completion blocked without tasks"
+          parts << "- **At least ONE task must be DONE** - completion blocked if all abandoned"
+          parts << "- **Substantive work required** - doc-only changes rejected"
+          parts << ""
+          parts << "**Important**: Tasks exist due to careful planning. Do NOT abandon tasks due to"
+          parts << "perceived complexity - these factors were considered during planning. Only abandon"
+          parts << "when truly obsolete (requirements changed, duplicate, external blockers)."
+          parts << ""
+          parts << "### Task Filing Examples"
           parts << "- `File task: \"Implement user authentication\" priority: high tags: security,auth`"
           parts << "- `File task: \"Add tests for login flow\" priority: medium tags: testing`"
           parts << "- `File task: \"Update documentation\" priority: low tags: docs`"
           parts << ""
-          parts << "Task status update examples:"
+          parts << "### Task Status Update Examples"
           parts << "- `Update task: task_123_abc status: in_progress`"
           parts << "- `Update task: task_456_def status: done`"
           parts << "- `Update task: task_789_ghi status: abandoned reason: \"Requirements changed\"`"
@@ -1454,6 +1716,29 @@ module Aidp
         display_message("")
       end
+      # Display security status for Rule of Two enforcement
+      def display_security_status
+        status = @security_adapter.status
+        return unless status[:enabled]
+        display_message("\n🔒 Security (Rule of Two):", type: :info)
+        display_message("  #{status[:status_string]}", type: :info)
+        if status[:state]
+          state = status[:state]
+          flags = []
+          flags << "untrusted_input (#{state[:untrusted_input_source]})" if state[:untrusted_input]
+          flags << "private_data (#{state[:private_data_source]})" if state[:private_data]
+          flags << "egress (#{state[:egress_source]})" if state[:egress]
+          if flags.any?
+            display_message("  Active flags: #{flags.join(", ")}", type: :info)
+          end
+        end
+        display_message("")
+      end
       # Display pending tasks from persistent tasklist
       def display_pending_tasks
         pending_tasks = @persistent_tasklist.pending
@@ -1530,46 +1815,113 @@ module Aidp
       end
       # Check if tasks are required and all are completed or abandoned
-      # Returns {complete: boolean, message: string}
+      # Returns {complete: boolean, message: string, reason: string}
       # Note: Tasks are project-scoped, not session-scoped. This allows tasks created
       # in planning phases to be completed in build phases.
+      #
+      # FIX for issue #391: Prevent premature completion when tasks haven't been created
+      # The previous logic allowed completion with empty task list, which enabled
+      # the work loop to complete before actually implementing anything.
       def check_task_completion
-        return {complete: true, message: nil} unless @config.task_completion_required?
+        Aidp.log_debug("work_loop", "check_task_completion_start",
+          task_completion_required: @config.task_completion_required?,
+          iteration: @iteration_count)
+        unless @config.task_completion_required?
+          Aidp.log_debug("work_loop", "check_task_completion_skipped",
+            reason: "task_completion_not_required")
+          return {complete: true, message: nil, reason: "task_completion_not_required"}
+        end
         all_tasks = @persistent_tasklist.all
-        # If no tasks exist yet, allow completion - agent can work without tasks initially
-        # This supports workflows where no planning phase created tasks
+        Aidp.log_debug("work_loop", "check_task_completion_task_count",
+          total_tasks: all_tasks.size,
+          task_ids: all_tasks.map(&:id))
+        # FIX for issue #391: Require at least one task when task_completion is enabled
+        # Empty task list now blocks completion to prevent premature PR creation
+        # This ensures the agent has actually created and completed work items
         if all_tasks.empty?
-          return {complete: true, message: nil}
+          Aidp.log_debug("work_loop", "check_task_completion_empty_tasks",
+            reason: "no_tasks_filed",
+            iteration: @iteration_count)
+          # After multiple iterations, require tasks - agent should have filed some by now
+          if @iteration_count >= 3
+            return {
+              complete: false,
+              message: "No tasks have been filed yet. You must create at least one task using:\n" \
+                      "  File task: \"description\" priority: high|medium|low tags: tag1,tag2\n\n" \
+                      "Tasks help track progress and ensure complete implementation.",
+              reason: "no_tasks_after_iterations"
+            }
+          end
+          # In early iterations, allow progress but don't allow completion
+          return {
+            complete: false,
+            message: "Please file tasks to track your implementation work.",
+            reason: "no_tasks_early_iteration"
+          }
         end
         # Count tasks by status
         pending_tasks = all_tasks.select { |t| t.status == :pending }
         in_progress_tasks = all_tasks.select { |t| t.status == :in_progress }
         abandoned_tasks = all_tasks.select { |t| t.status == :abandoned }
-        all_tasks.select { |t| t.status == :done }
+        done_tasks = all_tasks.select { |t| t.status == :done }
+        Aidp.log_debug("work_loop", "check_task_completion_status_counts",
+          pending: pending_tasks.size,
+          in_progress: in_progress_tasks.size,
+          abandoned: abandoned_tasks.size,
+          done: done_tasks.size)
         # If tasks exist, all must be done or abandoned before completion
         incomplete_tasks = pending_tasks + in_progress_tasks
         if incomplete_tasks.any?
           task_list = incomplete_tasks.map { |t| "- #{t.description} (#{t.status}, session: #{t.session})" }.join("\n")
+          Aidp.log_debug("work_loop", "check_task_completion_incomplete",
+            incomplete_count: incomplete_tasks.size,
+            incomplete_ids: incomplete_tasks.map(&:id))
+          return {
+            complete: false,
+            message: "Tasks remain incomplete:\n#{task_list}\n\nComplete all tasks or abandon them with reason before marking work complete.",
+            reason: "incomplete_tasks"
+          }
+        end
+        # FIX for issue #391: Require at least one done task, not just abandoned
+        # This prevents scenarios where all tasks are abandoned without any work
+        if done_tasks.empty? && abandoned_tasks.any?
+          Aidp.log_debug("work_loop", "check_task_completion_all_abandoned",
+            abandoned_count: abandoned_tasks.size)
           return {
             complete: false,
-            message: "Tasks remain incomplete:\n#{task_list}\n\nComplete all tasks or abandon them with reason before marking work complete."
+            message: "All tasks have been abandoned with no completed work. " \
+                    "At least one task must be completed, or explain why no implementation is needed.",
+            reason: "all_tasks_abandoned"
           }
         end
         # If there are abandoned tasks, confirm with user
         if abandoned_tasks.any? && !all_abandoned_tasks_confirmed?(abandoned_tasks)
+          Aidp.log_debug("work_loop", "check_task_completion_unconfirmed_abandoned",
+            abandoned_count: abandoned_tasks.size)
           return {
             complete: false,
-            message: "Abandoned tasks require user confirmation. Please confirm abandoned tasks."
+            message: "Abandoned tasks require user confirmation. Please confirm abandoned tasks.",
+            reason: "unconfirmed_abandoned_tasks"
           }
         end
-        {complete: true, message: nil}
+        Aidp.log_debug("work_loop", "check_task_completion_success",
+          done_count: done_tasks.size,
+          abandoned_count: abandoned_tasks.size)
+        {complete: true, message: nil, reason: "all_tasks_complete"}
       end
       # Check if all abandoned tasks have been confirmed

data/lib/aidp/execute/work_loop_state.rb CHANGED

@@ -18,7 +18,10 @@ module Aidp
         error: "ERROR"
       }.freeze
-      attr_reader :current_state, :iteration, :queued_instructions, :last_error
+      attr_reader :iteration, :queued_instructions, :last_error
+      # Expose current_state for testability (use state transition methods in production)
+      attr_accessor :current_state
       def initialize
         super # Initialize MonitorMixin

data/lib/aidp/execute/workflow_selector.rb CHANGED

@@ -10,6 +10,9 @@ module Aidp
     class WorkflowSelector
       include Aidp::MessageDisplay
+      # Expose for testability
+      attr_reader :user_input
       def initialize(prompt: TTY::Prompt.new, workflow_selector: nil)
         @user_input = {}
         @prompt = prompt