claude-evolve 1.8.11 → 1.8.13

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
@@ -362,6 +362,12 @@ print(max_id + 1)
 "
 }
 
+# AIDEV-NOTE: This function had a critical race condition bug that caused wrong rows to be updated
+# The bug occurred when parallel processes modified the main CSV between temp CSV creation and append.
+# FIX: Now requires original_main_csv_lines parameter (6th arg) to track the exact line count at copy time.
+# This ensures we always append the correct new rows from temp CSV, regardless of concurrent modifications.
+# Without this fix, the system would update wrong IDs (e.g., claim to add gen81 but update gen80 instead).
+#
 # Validate that AI directly modified the CSV file
 validate_direct_csv_modification() {
   local temp_csv="$1"
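Editor's note: the fix described in the AIDEV-NOTE above is a snapshot-then-append pattern: record the file's length when the working copy is made, then append only the lines past that mark. A minimal Python sketch of the pattern (helper names here are illustrative, not part of the package; the shipped implementation is the bash function in this diff):

    import shutil

    def snapshot_csv(main_csv: str, temp_csv: str) -> int:
        """Copy the main CSV to a working file; return its line count at copy time."""
        shutil.copy(main_csv, temp_csv)
        with open(temp_csv) as f:
            return sum(1 for _ in f)  # includes the header line

    def append_new_rows(main_csv: str, temp_csv: str, original_lines: int) -> None:
        """Append only the rows added to temp_csv after the snapshot.

        Slicing by the count captured at copy time means rows that parallel
        workers appended to main_csv in the meantime are never re-counted,
        so the wrong rows cannot be appended or skipped.
        """
        with open(temp_csv) as f:
            new_rows = f.readlines()[original_lines:]
        with open(main_csv, "a") as f:
            f.writelines(new_rows)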
@@ -369,6 +375,7 @@ validate_direct_csv_modification() {
   local idea_type="$3"
   local ai_model="${4:-}" # AI model that generated the ideas
   local expected_ids="${5:-}" # Optional: comma or space separated list of expected IDs
+  local original_main_csv_lines="${6:-}" # CRITICAL: Line count of main CSV when temp CSV was created
 
   # Check if the file was actually modified
   if [[ ! -f "$temp_csv" ]]; then
@@ -376,32 +383,37 @@ validate_direct_csv_modification() {
     return 1
   fi
 
-  # Get the count before modification from the temp CSV (which was copied from original before AI ran)
-  # We need to track this before the AI runs by reading from the beginning state
-  # First, get a fresh count from the current main CSV (which reflects any previous operations in this session)
-  local current_original_count
-  current_original_count=$(grep -v '^[[:space:]]*$' "$FULL_CSV_PATH" | tail -n +2 | wc -l | tr -d '[:space:]')
-
   # Count data rows in the modified temp CSV
   local new_count
   new_count=$(grep -v '^[[:space:]]*$' "$temp_csv" | tail -n +2 | wc -l | tr -d '[:space:]')
 
+  # If original line count wasn't provided, fall back to current main CSV count (old behavior)
+  # This preserves backward compatibility but may have race conditions
+  if [[ -z "$original_main_csv_lines" ]]; then
+    echo "[WARN] No original line count provided - using current main CSV count (may cause race conditions)" >&2
+    original_main_csv_lines=$(wc -l < "$FULL_CSV_PATH" | tr -d '[:space:]')
+  fi
+
+  # Calculate how many data rows the temp CSV started with (before stubs were added)
+  # This should match the original main CSV line count (including header)
+  local original_data_rows=$((original_main_csv_lines - 1)) # Subtract header
+
+  # Calculate how many rows were actually added to temp CSV
+  local added_count=$((new_count - original_data_rows))
 
   # Check if AI overwrote the file instead of appending
-  if [[ $new_count -lt $current_original_count ]]; then
-    echo "[ERROR] AI overwrote the CSV file instead of appending ($new_count < $current_original_count)" >&2
+  if [[ $new_count -lt $original_data_rows ]]; then
+    echo "[ERROR] AI overwrote the CSV file instead of appending ($new_count < $original_data_rows)" >&2
     head -10 "$temp_csv" >&2
     return 1
   fi
 
   # Check if no changes were made
-  if [[ $new_count -eq $current_original_count ]]; then
-    echo "[ERROR] CSV file wasn't modified - same number of data rows ($new_count = $current_original_count)" >&2
+  if [[ $new_count -eq $original_data_rows ]]; then
+    echo "[ERROR] CSV file wasn't modified - same number of data rows ($new_count = $original_data_rows)" >&2
     head -10 "$temp_csv" >&2
     return 1
   fi
-
-  local added_count=$((new_count - current_original_count))
   if [[ $added_count -ne $expected_count ]]; then
     echo "[ERROR] Expected to add $expected_count ideas but only added $added_count" >&2
     echo "[ERROR] Ideation failed - rejecting partial results to prevent endless loops" >&2
@@ -434,43 +446,47 @@ validate_direct_csv_modification() {
 
   # Use proper locking to safely update the CSV
   echo "[INFO] Acquiring CSV lock to apply changes..."
-
+
   # Set the lockfile path
   CSV_LOCKFILE="$FULL_EVOLUTION_DIR/.evolution.csv.lock"
-
+
   if ! acquire_csv_lock; then
     echo "[ERROR] Failed to acquire CSV lock for update" >&2
     rm -f "$temp_csv"
     return 1
   fi
-
-  # Get just the new entries (skip header and existing entries)
-  local original_line_count=$(wc -l < "$FULL_CSV_PATH" | tr -d '[:space:]')
-
-  # Append only the new lines from temp CSV to the main CSV
-  tail -n +$((original_line_count + 1)) "$temp_csv" >> "$FULL_CSV_PATH"
-
+
+  # CRITICAL FIX: Use the original line count (when temp CSV was created) to determine which lines to append
+  # This prevents race conditions where other processes modify the main CSV between temp CSV creation and append
+  # Append only the NEW lines from temp CSV (those added after the original content)
+  echo "[DEBUG] Appending last $added_count rows from temp CSV (from line $((original_main_csv_lines + 1)) onwards)" >&2
+  tail -n +$((original_main_csv_lines + 1)) "$temp_csv" >> "$FULL_CSV_PATH"
+
+  # Get the IDs that were actually added by reading them from temp CSV (not main CSV)
+  # This avoids race conditions where other processes add rows to main CSV
+  local new_ids
+  new_ids=$(tail -n $added_count "$temp_csv" | grep -v "^id," | cut -d',' -f1 | tr -d '"')
+  echo "[DEBUG] IDs being added: $new_ids" >&2
+
   # Clean up temp file
   rm -f "$temp_csv"
-
+
   # Update idea-LLM field for newly added rows if model is known
   if [[ -n "$ai_model" ]]; then
     echo "[INFO] Recording that $ai_model generated the ideas" >&2
-    # Get the IDs of the newly added rows (skip header line and strip quotes)
-    local new_ids
-    new_ids=$(tail -n $added_count "$FULL_CSV_PATH" | grep -v "^id," | cut -d',' -f1 | tr -d '"')
-
+
     # Update each new row with the model that generated it
     for id in $new_ids; do
       if [[ -n "$id" && "$id" != "id" ]]; then
+        echo "[DEBUG] Updating field for $id" >&2
         "$PYTHON_CMD" "$SCRIPT_DIR/../lib/evolution_csv.py" "$FULL_CSV_PATH" field "$id" "idea-LLM" "$ai_model" || echo "[WARN] Failed to update $id" >&2
       fi
     done
   fi
-
+
   # Release the lock
   release_csv_lock
-
+
   echo "[INFO] Successfully added $added_count $idea_type ideas to CSV"
   return 0
 }
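Editor's note: a hedged Python sketch of the new_ids extraction, to show why the temp CSV is the safe source (hypothetical helper; the shipped code does this with tail/grep/cut as shown above):

    def ids_of_new_rows(temp_csv: str, added_count: int) -> list:
        """Return the id column of the last added_count data rows of temp_csv.

        Only this process writes the temp CSV, so its tail is stable; tailing
        the shared main CSV instead could pick up rows that a parallel worker
        appended after our own append, yielding the wrong IDs.
        """
        with open(temp_csv) as f:
            rows = [ln for ln in f if ln.strip() and not ln.startswith("id,")]
        return [ln.split(",", 1)[0].strip('"') for ln in rows[-added_count:]]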
@@ -1001,6 +1017,12 @@ generate_novel_ideas_direct() {
   local temp_csv="$FULL_EVOLUTION_DIR/temp-csv-$$.csv"
   cp "$FULL_CSV_PATH" "$temp_csv"
 
+  # CRITICAL: Capture the original line count immediately after copying
+  # This is needed to correctly append rows later, preventing race conditions
+  local original_csv_lines
+  original_csv_lines=$(wc -l < "$temp_csv" | tr -d '[:space:]')
+  echo "[DEBUG] Original CSV has $original_csv_lines lines (including header)" >&2
+
   # Pre-populate the CSV with stub rows containing the correct IDs
   # This ensures the AI can't possibly use wrong IDs - it just fills in descriptions
   echo "[INFO] Pre-populating CSV with stub rows: $required_ids_str"
@@ -1098,10 +1120,10 @@ CRITICAL: Do NOT use any git commands (git add, git commit, git reset, etc.). On
 
   # Restore working directory
   cd "$original_pwd"
-
 
   # Validate that the CSV file was actually modified with correct IDs
-  if ! validate_direct_csv_modification "$temp_csv" "$count" "novel" "$ai_response" "$required_ids_str"; then
+  # Pass original_csv_lines to prevent race conditions
+  if ! validate_direct_csv_modification "$temp_csv" "$count" "novel" "$ai_response" "$required_ids_str" "$original_csv_lines"; then
     rm -f "$temp_csv"
     return 1
   fi
@@ -1135,6 +1157,11 @@ generate_hill_climbing_direct() {
   local temp_csv="$FULL_EVOLUTION_DIR/temp-csv-$$.csv"
   cp "$FULL_CSV_PATH" "$temp_csv"
 
+  # CRITICAL: Capture the original line count immediately after copying
+  local original_csv_lines
+  original_csv_lines=$(wc -l < "$temp_csv" | tr -d '[:space:]')
+  echo "[DEBUG] Original CSV has $original_csv_lines lines (including header)" >&2
+
   # Extract just the IDs from top performers for clarity (needed before pre-populating)
   local valid_parent_ids
   valid_parent_ids=$(echo "$top_performers" | cut -d',' -f1 | paste -sd ',' -)
@@ -1230,10 +1257,10 @@ CRITICAL INSTRUCTIONS:
 
   # Restore working directory
   cd "$original_pwd"
-
 
   # Validate that the CSV file was actually modified with correct IDs
-  if ! validate_direct_csv_modification "$temp_csv" "$count" "hill-climbing" "$ai_response" "$required_ids_str"; then
+  # Pass original_csv_lines to prevent race conditions
+  if ! validate_direct_csv_modification "$temp_csv" "$count" "hill-climbing" "$ai_response" "$required_ids_str" "$original_csv_lines"; then
     rm -f "$temp_csv"
     return 1
   fi
@@ -1267,6 +1294,11 @@ generate_structural_mutation_direct() {
   local temp_csv="$FULL_EVOLUTION_DIR/temp-csv-$$.csv"
   cp "$FULL_CSV_PATH" "$temp_csv"
 
+  # CRITICAL: Capture the original line count immediately after copying
+  local original_csv_lines
+  original_csv_lines=$(wc -l < "$temp_csv" | tr -d '[:space:]')
+  echo "[DEBUG] Original CSV has $original_csv_lines lines (including header)" >&2
+
   # Extract just the IDs from top performers for clarity (needed before pre-populating)
   local valid_parent_ids
   valid_parent_ids=$(echo "$top_performers" | cut -d',' -f1 | paste -sd ',' -)
@@ -1352,10 +1384,10 @@ CRITICAL INSTRUCTIONS:
 
   # Restore working directory
   cd "$original_pwd"
-
 
   # Validate that the CSV file was actually modified with correct IDs
-  if ! validate_direct_csv_modification "$temp_csv" "$count" "structural" "$ai_response" "$required_ids_str"; then
+  # Pass original_csv_lines to prevent race conditions
+  if ! validate_direct_csv_modification "$temp_csv" "$count" "structural" "$ai_response" "$required_ids_str" "$original_csv_lines"; then
     rm -f "$temp_csv"
     return 1
   fi
@@ -1389,6 +1421,11 @@ generate_crossover_direct() {
   local temp_csv="$FULL_EVOLUTION_DIR/temp-csv-$$.csv"
   cp "$FULL_CSV_PATH" "$temp_csv"
 
+  # CRITICAL: Capture the original line count immediately after copying
+  local original_csv_lines
+  original_csv_lines=$(wc -l < "$temp_csv" | tr -d '[:space:]')
+  echo "[DEBUG] Original CSV has $original_csv_lines lines (including header)" >&2
+
   # Extract just the IDs from top performers for clarity (needed before pre-populating)
   local valid_parent_ids
   valid_parent_ids=$(echo "$top_performers" | cut -d',' -f1 | paste -sd ',' -)
@@ -1474,10 +1511,10 @@ CRITICAL INSTRUCTIONS:
 
   # Restore working directory
   cd "$original_pwd"
-
 
   # Validate that the CSV file was actually modified with correct IDs
-  if ! validate_direct_csv_modification "$temp_csv" "$count" "crossover" "$ai_response" "$required_ids_str"; then
+  # Pass original_csv_lines to prevent race conditions
+  if ! validate_direct_csv_modification "$temp_csv" "$count" "crossover" "$ai_response" "$required_ids_str" "$original_csv_lines"; then
     rm -f "$temp_csv"
     return 1
   fi
@@ -1496,7 +1533,12 @@ ideate_ai_legacy() {
   # Create temporary CSV copy in evolution directory (so AI can access it)
   local temp_csv="$FULL_EVOLUTION_DIR/temp-csv-$$.csv"
   cp "$FULL_CSV_PATH" "$temp_csv"
-
+
+  # CRITICAL: Capture the original line count immediately after copying
+  local original_csv_lines
+  original_csv_lines=$(wc -l < "$temp_csv" | tr -d '[:space:]')
+  echo "[DEBUG] Original CSV has $original_csv_lines lines (including header)" >&2
+
   echo "[INFO] Generating $TOTAL_IDEAS ideas (legacy mode)..."
 
   # Get top performers for context
@@ -1580,14 +1622,14 @@ CRITICAL: Do NOT use any git commands (git add, git commit, git reset, etc.). On
 
   # Restore working directory
   cd "$original_pwd"
-
-
+
   # Validate that the CSV file was actually modified
-  if ! validate_direct_csv_modification "$temp_csv" "$TOTAL_IDEAS" "mixed" "$ai_response"; then
+  # Pass original_csv_lines to prevent race conditions
+  if ! validate_direct_csv_modification "$temp_csv" "$TOTAL_IDEAS" "mixed" "$ai_response" "" "$original_csv_lines"; then
     rm -f "$temp_csv"
     return 1
   fi
-
+
   echo "[INFO] Legacy ideas generated"
   return 0
 }
@@ -407,19 +407,41 @@ with EvolutionCSV('$FULL_CSV_PATH') as csv:
     eval_arg=""
   fi
   local eval_cmd=("$PYTHON_CMD" "$FULL_EVALUATOR_PATH" "$eval_arg")
-
+
   # Add memory limiting if configured
+  # CRITICAL: Use multiple layers of protection (ulimit + Python wrapper + monitoring)
+  local memory_protection=""
   if [[ -n "$MEMORY_LIMIT_MB" ]] && [[ "$MEMORY_LIMIT_MB" -gt 0 ]]; then
+    # Layer 1: ulimit for hard memory limit (kernel-enforced)
+    # IMPORTANT: Use -m (RSS) not -v (virtual memory) because:
+    # - Neural networks use mmap() which bypasses RLIMIT_AS (-v)
+    # - RSS limit is more reliable for actual memory consumption
+    # Convert MB to KB for ulimit
+    local memory_limit_kb=$((MEMORY_LIMIT_MB * 1024))
+
+    # Try -m first (RSS limit), fall back to -v if not supported
+    if ulimit -m $memory_limit_kb 2>/dev/null; then
+      memory_protection="ulimit -m $memory_limit_kb 2>/dev/null; "
+      echo "[MEMORY] Layer 1: ulimit -m ${memory_limit_kb}KB (RSS limit - catches neural networks)" >&2
+    else
+      memory_protection="ulimit -v $memory_limit_kb 2>/dev/null; "
+      echo "[MEMORY] Layer 1: ulimit -v ${memory_limit_kb}KB (fallback - may not catch neural networks)" >&2
+    fi
+
+    # Layer 2: Python wrapper with PROCESS TREE monitoring (backup protection)
     eval_cmd=("$PYTHON_CMD" "$SCRIPT_DIR/../lib/memory_limit_wrapper.py" "$MEMORY_LIMIT_MB" "${eval_cmd[@]}")
+
+    echo "[MEMORY] Layer 2: Python process tree monitoring (kills entire subprocess tree)" >&2
   fi
-
+
   # Add timeout if configured
   [[ -n "$timeout_seconds" ]] && eval_cmd=(timeout "$timeout_seconds" "${eval_cmd[@]}")
-
-  # Run evaluation with tee to both display and capture output
+
+  # Run evaluation with memory protection, tee to both display and capture output
   # Use stdbuf to disable buffering for real-time output
   # IMPORTANT: Use PIPESTATUS to get the exit code of the evaluation command, not tee
-  stdbuf -o0 -e0 "${eval_cmd[@]}" 2>&1 | tee "$eval_output_file" >&2
+  # The subshell ensures ulimit is applied before the command runs
+  stdbuf -o0 -e0 bash -c "${memory_protection}$(printf '%q ' "${eval_cmd[@]}")" 2>&1 | tee "$eval_output_file" >&2
   local eval_exit_code=${PIPESTATUS[0]} # Get exit code of first command in pipe
 
   if [[ $eval_exit_code -eq 0 ]]; then
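Editor's note: the printf '%q ' idiom re-quotes every element of the eval command so the string survives the trip through bash -c intact. For readers more at home in Python, a rough equivalent under the same assumptions (hypothetical run_with_ulimit helper; shlex.join requires Python 3.8+):

    import shlex
    import subprocess

    def run_with_ulimit(cmd, limit_mb):
        """Run cmd in a bash subshell that first applies an RSS ulimit.

        shlex.join() plays the role of bash's printf '%q ': each argument is
        quoted so the inner shell parses the string back into the original argv.
        """
        limit_kb = limit_mb * 1024
        script = "ulimit -m %d 2>/dev/null; %s" % (limit_kb, shlex.join(cmd))
        return subprocess.run(["bash", "-c", script]).returncode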
@@ -4,6 +4,16 @@ Memory-limited execution wrapper for claude-evolve evaluations.
 
 This script runs a command with memory limits to prevent runaway algorithms
 from consuming all system memory and crashing the machine.
+
+CRITICAL: Multi-layer protection approach (both must work together):
+1. ulimit -m (RSS limit) set by calling shell script - kernel-enforced, catches neural networks
+2. This Python wrapper monitors ENTIRE PROCESS TREE every 0.1s and kills if limit exceeded
+
+AIDEV-NOTE: Previous bugs fixed:
+- ulimit -v (virtual memory) doesn't catch neural networks that use mmap()
+- Was only monitoring direct child, not entire process tree (missed grandchildren)
+- Monitoring interval was 0.5s - too slow for fast memory allocations
+- Resource limit failures were silently ignored instead of failing fast
 """
 import sys
 import os
@@ -11,119 +21,197 @@ import subprocess
 import signal
 import time
 import resource
-from typing import Optional
+from typing import Optional, Tuple
 
-def set_memory_limit(limit_mb: int) -> None:
-    """Set memory limit in MB using resource module."""
+def verify_memory_limit_set(limit_mb: int) -> Tuple[bool, str]:
+    """Verify that memory limits are actually enforced."""
+    try:
+        limit_bytes = limit_mb * 1024 * 1024
+
+        # Check RLIMIT_AS (virtual memory)
+        soft_as, hard_as = resource.getrlimit(resource.RLIMIT_AS)
+        if soft_as != resource.RLIM_INFINITY and soft_as <= limit_bytes * 1.1:
+            return True, f"RLIMIT_AS set to {soft_as / (1024*1024):.0f}MB"
+
+        # Check RLIMIT_DATA (data segment)
+        try:
+            soft_data, hard_data = resource.getrlimit(resource.RLIMIT_DATA)
+            if soft_data != resource.RLIM_INFINITY and soft_data <= limit_bytes * 1.1:
+                return True, f"RLIMIT_DATA set to {soft_data / (1024*1024):.0f}MB"
+        except (OSError, ValueError):
+            pass
+
+        return False, "No hard memory limits detected"
+    except Exception as e:
+        return False, f"Error checking limits: {e}"
+
+def set_memory_limit(limit_mb: int) -> bool:
+    """
+    Set memory limit in MB using resource module.
+    Returns True if successful, False otherwise.
+    """
     try:
         # Convert MB to bytes
         limit_bytes = limit_mb * 1024 * 1024
-
+
         # Set virtual memory limit (address space)
         # On macOS this is the most reliable way to limit memory
         resource.setrlimit(resource.RLIMIT_AS, (limit_bytes, limit_bytes))
-
+
         # Also try to set data segment limit if available
         try:
             resource.setrlimit(resource.RLIMIT_DATA, (limit_bytes, limit_bytes))
         except (OSError, ValueError):
             # Not available on all systems
             pass
-
-        print(f"[MEMORY] Set memory limit to {limit_mb}MB", file=sys.stderr)
-
+
+        # Verify it was actually set
+        is_set, msg = verify_memory_limit_set(limit_mb)
+        if is_set:
+            print(f"[MEMORY] ✓ Hard limit enforced: {msg}", file=sys.stderr)
+            return True
+        else:
+            print(f"[MEMORY] ✗ Hard limit NOT enforced: {msg}", file=sys.stderr)
+            return False
+
     except (OSError, ValueError) as e:
-        print(f"[MEMORY] Warning: Could not set memory limit: {e}", file=sys.stderr)
+        print(f"[MEMORY] Could not set memory limit: {e}", file=sys.stderr)
+        return False
+
+def get_process_tree_memory_native(pid: int) -> float:
+    """Get total memory usage of entire process group using native ps command."""
+    try:
+        # Get the process group ID
+        pgid = os.getpgid(pid)
+
+        # Get all processes in the process group
+        ps_result = subprocess.run(
+            ["ps", "-o", "rss=", "-g", str(pgid)],
+            capture_output=True,
+            text=True,
+            timeout=1
+        )
+
+        if ps_result.returncode != 0:
+            return 0.0
+
+        # Sum all RSS values from the process group
+        total_rss_kb = 0
+        for line in ps_result.stdout.strip().split('\n'):
+            line = line.strip()
+            if line:
+                try:
+                    total_rss_kb += int(line)
+                except ValueError:
+                    continue
+
+        # Convert KB to MB
+        return total_rss_kb / 1024.0
+    except Exception:
+        return 0.0
 
 def monitor_memory_usage_native(process: subprocess.Popen, limit_mb: int) -> Optional[str]:
-    """Monitor process memory usage using native tools and kill if it exceeds limits."""
-    # print(f"[MEMORY] Starting native monitoring for PID {process.pid} with limit {limit_mb}MB", file=sys.stderr)
-
+    """Monitor ENTIRE PROCESS TREE memory usage using native tools and kill if it exceeds limits."""
+    print(f"[MEMORY] Monitoring process tree from root PID {process.pid} (limit: {limit_mb}MB)", file=sys.stderr)
+
     while process.poll() is None:
         try:
-            # Use ps command to get memory usage
-            ps_result = subprocess.run(
-                ["ps", "-o", "rss=", "-p", str(process.pid)],
-                capture_output=True,
-                text=True,
-                timeout=1
-            )
-
-            if ps_result.returncode == 0 and ps_result.stdout.strip():
-                # ps returns RSS in KB, convert to MB
-                memory_kb = int(ps_result.stdout.strip())
-                memory_mb = memory_kb / 1024
-
-                # print(f"[MEMORY] PID {process.pid} using {memory_mb:.1f}MB (limit: {limit_mb}MB)", file=sys.stderr)
-
-                if memory_mb > limit_mb:
-                    print(f"[MEMORY] Process exceeded {limit_mb}MB limit (using {memory_mb:.1f}MB), terminating", file=sys.stderr)
-                    # Kill the entire process group - fix race condition
-                    try:
-                        pgid = os.getpgid(process.pid)
-                        os.killpg(pgid, signal.SIGTERM)
-                    except ProcessLookupError:
-                        return f"Memory limit exceeded: {memory_mb:.1f}MB > {limit_mb}MB"
-
-                    time.sleep(2) # Give it time to cleanup
-
-                    try:
-                        if process.poll() is None:
-                            pgid = os.getpgid(process.pid)
-                            os.killpg(pgid, signal.SIGKILL)
-                    except ProcessLookupError:
-                        pass
+            # Get total memory for entire process tree
+            memory_mb = get_process_tree_memory_native(process.pid)
+
+            if memory_mb > limit_mb:
+                print(f"[MEMORY] Process tree exceeded {limit_mb}MB limit (using {memory_mb:.1f}MB), terminating entire tree", file=sys.stderr)
+                # Kill the entire process group
+                try:
+                    pgid = os.getpgid(process.pid)
+                    os.killpg(pgid, signal.SIGTERM)
+                except ProcessLookupError:
                     return f"Memory limit exceeded: {memory_mb:.1f}MB > {limit_mb}MB"
-
-            time.sleep(0.5) # Check every 500ms
-
+
+                time.sleep(2) # Give it time to cleanup
+
+                try:
+                    if process.poll() is None:
+                        pgid = os.getpgid(process.pid)
+                        os.killpg(pgid, signal.SIGKILL)
+                except ProcessLookupError:
+                    pass
+                return f"Memory limit exceeded: {memory_mb:.1f}MB > {limit_mb}MB"
+
+            time.sleep(0.1) # Check every 100ms for faster response
+
         except (subprocess.TimeoutExpired, ValueError, ProcessLookupError):
             # Process might have terminated or ps command failed
-            time.sleep(0.5)
+            time.sleep(0.1)
             continue
-
-    # print(f"[MEMORY] Monitoring stopped for PID {process.pid}", file=sys.stderr)
+
     return None
 
+def get_process_tree_memory_psutil(ps_process) -> float:
+    """Get total memory usage of entire process tree using psutil."""
+    try:
+        import psutil
+        total_mb = 0.0
+
+        # Get memory of root process
+        try:
+            total_mb += ps_process.memory_info().rss / (1024 * 1024)
+        except (psutil.NoSuchProcess, psutil.AccessDenied):
+            return 0.0
+
+        # Get memory of all children (recursive)
+        try:
+            for child in ps_process.children(recursive=True):
+                try:
+                    total_mb += child.memory_info().rss / (1024 * 1024)
+                except (psutil.NoSuchProcess, psutil.AccessDenied):
+                    continue
+        except (psutil.NoSuchProcess, psutil.AccessDenied):
+            pass
+
+        return total_mb
+    except ImportError:
+        return 0.0
+
 def monitor_memory_usage(process: subprocess.Popen, limit_mb: int) -> Optional[str]:
-    """Monitor process memory usage and kill if it exceeds limits."""
+    """Monitor ENTIRE PROCESS TREE memory usage and kill if it exceeds limits."""
     try:
         import psutil
         ps_process = psutil.Process(process.pid)
-
+        print(f"[MEMORY] Monitoring process tree from root PID {process.pid} (limit: {limit_mb}MB, using psutil)", file=sys.stderr)
+
         while process.poll() is None:
             try:
-                # Get memory usage in MB
-                memory_info = ps_process.memory_info()
-                memory_mb = memory_info.rss / (1024 * 1024)
-
+                # Get total memory for entire process tree
+                memory_mb = get_process_tree_memory_psutil(ps_process)
+
                 if memory_mb > limit_mb:
-                    print(f"[MEMORY] Process exceeded {limit_mb}MB limit (using {memory_mb:.1f}MB), terminating", file=sys.stderr)
-                    # Kill the entire process group - fix race condition
+                    print(f"[MEMORY] Process tree exceeded {limit_mb}MB limit (using {memory_mb:.1f}MB), terminating entire tree", file=sys.stderr)
+                    # Kill the entire process group
                     try:
                         pgid = os.getpgid(process.pid)
                         os.killpg(pgid, signal.SIGTERM)
                     except ProcessLookupError:
                         return f"Memory limit exceeded: {memory_mb:.1f}MB > {limit_mb}MB"
-
+
                     time.sleep(2) # Give it time to cleanup
-
+
                     try:
                         if process.poll() is None:
-                            pgid = os.getpgid(process.pid)
+                            pgid = os.getpgid(process.pid)
                             os.killpg(pgid, signal.SIGKILL)
                     except ProcessLookupError:
                         pass
                     return f"Memory limit exceeded: {memory_mb:.1f}MB > {limit_mb}MB"
-
-                time.sleep(0.5) # Check every 500ms
+
+                time.sleep(0.1) # Check every 100ms for faster response
             except (psutil.NoSuchProcess, psutil.AccessDenied):
                 # Process already terminated
                 break
     except ImportError:
         # psutil not available, use native monitoring
         return monitor_memory_usage_native(process, limit_mb)
-
+
     return None
 
 def validate_memory_limit(limit_mb: int) -> bool:
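Editor's note: one assumption worth flagging is that os.killpg(os.getpgid(process.pid), ...) only confines the kill to the evaluation if the child was launched as the leader of its own process group; the Popen call itself is outside this hunk. A minimal sketch of how a wrapper typically arranges that (illustrative, not the package's exact launch code):

    import os
    import signal
    import subprocess

    def launch_in_own_group(cmd):
        # start_new_session=True calls setsid() in the child, making it the
        # leader of a fresh process group; killpg() on that group then reaches
        # the child and all of its descendants, but not the wrapper itself.
        return subprocess.Popen(cmd, start_new_session=True)

    def kill_group(process):
        try:
            os.killpg(os.getpgid(process.pid), signal.SIGTERM)
        except ProcessLookupError:
            pass  # group already gone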
package/package.json CHANGED
@@ -1,6 +1,6 @@
 {
   "name": "claude-evolve",
-  "version": "1.8.11",
+  "version": "1.8.13",
   "bin": {
     "claude-evolve": "./bin/claude-evolve",
     "claude-evolve-main": "./bin/claude-evolve-main",