npm - codeharness - Versions diffs - 0.19.5 → 0.21.0 - Mend

codeharness 0.19.5 → 0.21.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (18)

package/dist/index.js +3149 -2656
package/dist/modules/observability/index.d.ts +295 -0
package/dist/modules/observability/index.js +366 -0
package/package.json +6 -1
package/patches/AGENTS.md +19 -1
package/patches/observability/AGENTS.md +27 -0
package/patches/observability/__tests__/catch-without-logging.ts +36 -0
package/patches/observability/__tests__/error-path-no-log.ts +47 -0
package/patches/observability/__tests__/function-no-debug-log.ts +54 -0
package/patches/observability/catch-without-logging.ts +36 -0
package/patches/observability/catch-without-logging.yaml +35 -0
package/patches/observability/error-path-no-log.ts +47 -0
package/patches/observability/error-path-no-log.yaml +68 -0
package/patches/observability/function-no-debug-log.ts +54 -0
package/patches/observability/function-no-debug-log.yaml +114 -0
package/ralph/drivers/claude-code.sh +2 -28
package/ralph/ralph.sh +153 -9
package/templates/Dockerfile.verify +8 -1

package/ralph/ralph.sh CHANGED Viewed

@@ -47,7 +47,7 @@ RATE_LIMIT_SLEEP=3600  # 1 hour
 # Driver
 PLATFORM_DRIVER="${PLATFORM_DRIVER:-claude-code}"
-CLAUDE_OUTPUT_FORMAT="${CLAUDE_OUTPUT_FORMAT:-json}"
+CLAUDE_OUTPUT_FORMAT="${CLAUDE_OUTPUT_FORMAT:-stream-json}"
 CLAUDE_ALLOWED_TOOLS="${CLAUDE_ALLOWED_TOOLS:-}"
 CLAUDE_USE_CONTINUE="${CLAUDE_USE_CONTINUE:-false}"  # Fresh context per iteration by default
@@ -98,6 +98,14 @@ log_status() {
         "LOOP")    color=$PURPLE ;;
     esac
+    # DEBUG level: log file only, no terminal output
+    if [[ "$level" == "DEBUG" ]]; then
+        if [[ -n "$LOG_DIR" ]]; then
+            echo "[$timestamp] [$level] $message" >> "$LOG_DIR/ralph.log"
+        fi
+        return
+    fi
     echo -e "${color}[$timestamp] [$level] $message${NC}" >&2
     if [[ -n "$LOG_DIR" ]]; then
         echo "[$timestamp] [$level] $message" >> "$LOG_DIR/ralph.log"
@@ -444,6 +452,58 @@ detect_story_changes() {
     done <<< "$after_snapshot"
 }
+# ─── Sprint State Progress Polling ─────────────────────────────────────────
+# Snapshot of the sprint-state.json fields seen on the previous poll; compared
+# against fresh values by poll_sprint_state_progress to decide whether to log.
+PREV_STORY=''        # last seen .run.currentStory
+PREV_PHASE=''        # last seen .run.currentPhase
+PREV_AC_PROGRESS=''  # last seen .run.acProgress
+PREV_LAST_ACTION=''  # last seen .run.lastAction
+# Poll sprint-state.json for progress changes during background execution.
+# Prints structured update lines when progress fields change.
+poll_sprint_state_progress() {
+    local state_file="sprint-state.json"
+    [[ -f "$state_file" ]] || return 0
+    # Single jq call to extract all fields (avoids 4 process spawns per poll cycle)
+    local raw
+    raw=$(jq -r '[.run.currentStory // "", .run.currentPhase // "", .run.lastAction // "", .run.acProgress // ""] | join("\t")' "$state_file" 2>/dev/null) || return 0
+    [[ -n "$raw" ]] || return 0
+    local cur_story cur_phase cur_action cur_ac
+    IFS=$'\t' read -r cur_story cur_phase cur_action cur_ac <<< "$raw"
+    # Nothing to report if no story is active
+    [[ -z "$cur_story" ]] && return 0
+    # Detect changes and print structured updates
+    if [[ "$cur_story" != "$PREV_STORY" || "$cur_phase" != "$PREV_PHASE" ]]; then
+        if [[ -n "$cur_action" && "$cur_action" != "null" ]]; then
+            log_status "INFO" "Story ${cur_story}: ${cur_phase} (${cur_action})"
+        else
+            log_status "INFO" "Story ${cur_story}: ${cur_phase}"
+        fi
+    elif [[ "$cur_ac" != "$PREV_AC_PROGRESS" && -n "$cur_ac" && "$cur_ac" != "null" ]]; then
+        log_status "INFO" "Story ${cur_story}: verify (AC ${cur_ac})"
+    elif [[ "$cur_action" != "$PREV_LAST_ACTION" && -n "$cur_action" && "$cur_action" != "null" ]]; then
+        log_status "INFO" "Story ${cur_story}: ${cur_phase} (${cur_action})"
+    fi
+    PREV_STORY="$cur_story"
+    PREV_PHASE="$cur_phase"
+    PREV_AC_PROGRESS="$cur_ac"
+    PREV_LAST_ACTION="$cur_action"
+}
+# Clear the remembered poll values so the first poll of the next iteration
+# is compared against an empty baseline.
+reset_poll_state() {
+    PREV_STORY="" PREV_PHASE="" PREV_AC_PROGRESS="" PREV_LAST_ACTION=""
+}
 # ─── Progress Summary ───────────────────────────────────────────────────────
 print_progress_summary() {
@@ -463,7 +523,51 @@ print_progress_summary() {
         elapsed_fmt="${elapsed}s"
     fi
-    log_status "INFO" "Progress: ${completed}/${total} done, ${remaining} remaining (iterations: ${loop_count}, elapsed: ${elapsed_fmt})"
+    # Read cost and failed stories from sprint-state.json (single jq call)
+    local cost=""
+    local cost_fmt=""
+    local failed_stories=""
+    if [[ -f "sprint-state.json" ]]; then
+        local state_data
+        state_data=$(jq -r '(.run.cost // 0 | tostring) + "\n" + ((.run.failed // []) | join("\n"))' "sprint-state.json" 2>/dev/null) || state_data=""
+        if [[ -n "$state_data" ]]; then
+            cost=$(head -1 <<< "$state_data")
+            failed_stories=$(tail -n +2 <<< "$state_data")
+            if [[ -n "$cost" && "$cost" != "0" && "$cost" != "null" ]]; then
+                cost_fmt=", cost: \$${cost}"
+            fi
+        fi
+    fi
+    log_status "INFO" "Progress: ${completed}/${total} done, ${remaining} remaining (iterations: ${loop_count}, elapsed: ${elapsed_fmt}${cost_fmt})"
+    # Show completed stories with ✓
+    if [[ -f "$SPRINT_STATUS_FILE" ]]; then
+        while IFS=: read -r key value; do
+            key=$(echo "$key" | sed 's/^[[:space:]]*//;s/[[:space:]]*$//')
+            value=$(echo "$value" | sed 's/^[[:space:]]*//;s/[[:space:]]*$//')
+            [[ -z "$key" || "$key" == \#* ]] && continue
+            if [[ "$key" =~ ^[0-9]+-[0-9]+- && "$value" == "done" ]]; then
+                log_status "SUCCESS" "  ✓ ${key}"
+            fi
+        done < "$SPRINT_STATUS_FILE"
+    fi
+    # Show failed stories with ✗ from sprint-state.json
+    if [[ -n "$failed_stories" ]]; then
+        while IFS= read -r fkey; do
+            [[ -z "$fkey" ]] && continue
+            log_status "ERROR" "  ✗ ${fkey}"
+        done <<< "$failed_stories"
+    fi
+    # Show flagged/blocked stories with ✕
+    if [[ -f "$FLAGGED_STORIES_FILE" ]]; then
+        while IFS= read -r bkey; do
+            [[ -z "$bkey" ]] && continue
+            log_status "WARN" "  ✕ ${bkey} (blocked)"
+        done < "$FLAGGED_STORIES_FILE"
+    fi
     # Show the next story in line (first non-done, non-flagged)
     if [[ -f "$SPRINT_STATUS_FILE" ]]; then
@@ -541,7 +645,7 @@ load_platform_driver() {
         CLAUDE_ALLOWED_TOOLS=$(IFS=','; echo "${VALID_TOOL_PATTERNS[*]}")
     fi
-    log_status "INFO" "Platform driver: $(driver_display_name) ($(driver_cli_binary))"
+    log_status "DEBUG" "Platform driver: $(driver_display_name) ($(driver_cli_binary))"
 }
 # ─── Execution ───────────────────────────────────────────────────────────────
@@ -624,11 +728,13 @@ execute_iteration() {
         log_status "DEBUG" "Background PID: $claude_pid"
+        reset_poll_state
         while kill -0 $claude_pid 2>/dev/null; do
             progress_counter=$((progress_counter + 1))
             if [[ -f "$output_file" && -s "$output_file" ]]; then
                 cp "$output_file" "$LIVE_LOG_FILE" 2>/dev/null
             fi
+            poll_sprint_state_progress
             sleep 10
         done
@@ -723,7 +829,8 @@ execute_iteration() {
             log_status "ERROR" "Claude API usage limit reached"
             return 2
         # Check for transient API errors (500, 529, overloaded) — don't count against story
-        elif grep -qi "Internal server error\|api_error\|overloaded\|529\|503" "$output_file" 2>/dev/null; then
+        # Status code patterns exclude decimal prefixes (e.g., cost_usd=0.503 ≠ HTTP 503)
+        elif grep -qiE 'Internal server error|api_error|overloaded|(^|[^0-9.])529([^0-9]|$)|(^|[^0-9.])503([^0-9]|$)' "$output_file" 2>/dev/null; then
             log_status "WARN" "Transient API error (not story's fault) — will retry"
             return 4
         else
@@ -792,6 +899,41 @@ The loop:
 HELPEOF
 }
+# ─── Sprint Summary ──────────────────────────────────────────────────────────
+# Print a compact sprint summary at startup
+print_sprint_summary() {
+    local counts
+    counts=$(get_task_counts)
+    local total=${counts%% *}
+    local completed=${counts##* }
+    local remaining=$((total - completed))
+    # Find next story
+    local next_story=""
+    local next_status=""
+    if [[ -f "$SPRINT_STATUS_FILE" ]]; then
+        while IFS=: read -r key value; do
+            key=$(echo "$key" | sed 's/^[[:space:]]*//;s/[[:space:]]*$//')
+            value=$(echo "$value" | sed 's/^[[:space:]]*//;s/[[:space:]]*$//')
+            [[ -z "$key" || "$key" == \#* ]] && continue
+            if [[ "$key" =~ ^[0-9]+-[0-9]+- && "$value" != "done" ]]; then
+                if ! is_story_flagged "$key"; then
+                    next_story="$key"
+                    next_status="$value"
+                    break
+                fi
+            fi
+        done < "$SPRINT_STATUS_FILE"
+    fi
+    if [[ -n "$next_story" ]]; then
+        log_status "INFO" "Sprint: ${completed}/${total} done, ${remaining} remaining — next: ${next_story} (${next_status})"
+    else
+        log_status "INFO" "Sprint: ${completed}/${total} done, ${remaining} remaining"
+    fi
+}
 # ─── Main ────────────────────────────────────────────────────────────────────
 main() {
@@ -880,15 +1022,17 @@ main() {
     # .story_retries and .flagged_stories are file-based — they persist automatically
     log_status "SUCCESS" "Ralph loop starting"
-    log_status "INFO" "Plugin: $PLUGIN_DIR"
-    log_status "INFO" "Max iterations: $MAX_ITERATIONS | Timeout: $((LOOP_TIMEOUT_SECONDS / 3600))h"
-    log_status "INFO" "Prompt: $PROMPT_FILE"
-    log_status "INFO" "Sprint status: $SPRINT_STATUS_FILE"
-    log_status "INFO" "Max story retries: $MAX_STORY_RETRIES"
+    log_status "DEBUG" "Plugin: $PLUGIN_DIR"
+    log_status "DEBUG" "Max iterations: $MAX_ITERATIONS | Timeout: $((LOOP_TIMEOUT_SECONDS / 3600))h"
+    log_status "DEBUG" "Prompt: $PROMPT_FILE"
+    log_status "DEBUG" "Sprint status: $SPRINT_STATUS_FILE"
+    log_status "DEBUG" "Max story retries: $MAX_STORY_RETRIES"
     # Record loop start time for timeout
     loop_start_time=$(date +%s)
+    print_sprint_summary
     local consecutive_failures=0
     local max_consecutive_failures=3

package/templates/Dockerfile.verify CHANGED Viewed

@@ -5,12 +5,19 @@ FROM node:20-slim
 ARG TARBALL=package.tgz
-# System utilities
+# System utilities + Python for Semgrep
 RUN apt-get update && apt-get install -y --no-install-recommends \
     curl \
     jq \
+    python3 \
+    python3-pip \
+    pipx \
   && rm -rf /var/lib/apt/lists/*
+# Semgrep for static analysis verification
+RUN pipx install semgrep && pipx ensurepath
+ENV PATH="/root/.local/bin:${PATH}"
 # Verification tools + Claude Code CLI
 RUN npm install -g showboat @anthropic-ai/claude-code