npm - principles-disciple - Versions diffs - 1.61.0 → 1.63.0 - Mend

principles-disciple 1.61.0 → 1.63.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (28)

package/openclaw.plugin.json +4 -4
package/package.json +3 -1
package/scripts/sync-plugin.mjs +28 -36
package/src/core/event-log.ts +71 -5
package/src/core/workflow-funnel-loader.ts +170 -0
package/src/hooks/gate-block-helper.ts +1 -1
package/src/hooks/gate.ts +62 -203
package/src/service/evolution-worker.ts +10 -0
package/src/service/nocturnal-service.ts +24 -3
package/src/service/subagent-workflow/nocturnal-workflow-manager.ts +16 -0
package/src/types/event-types.ts +103 -2
package/tests/core/event-log.test.ts +56 -1
package/tests/hooks/gate-rule-host-pipeline.test.ts +161 -316
package/tests/service/evolution-worker.compilation-backfill.test.ts +5 -1
package/src/hooks/bash-risk.ts +0 -175
package/src/hooks/edit-verification.ts +0 -302
package/src/hooks/gfi-gate.ts +0 -186
package/src/hooks/progressive-trust-gate.ts +0 -183
package/src/hooks/thinking-checkpoint.ts +0 -76
package/tests/hooks/bash-risk-integration.test.ts +0 -137
package/tests/hooks/bash-risk.test.ts +0 -81
package/tests/hooks/edit-verification.test.ts +0 -678
package/tests/hooks/gate-edit-verification-p1.test.ts +0 -632
package/tests/hooks/gate-pipeline-integration.test.ts +0 -404
package/tests/hooks/gate.test.ts +0 -271
package/tests/hooks/gfi-gate-unit.test.ts +0 -422
package/tests/hooks/gfi-gate.test.ts +0 -669
package/tests/hooks/thinking-gate.test.ts +0 -313

package/tests/core/event-log.test.ts CHANGED

@@ -1,6 +1,6 @@
 import { describe, it, expect, beforeEach, afterEach, vi } from 'vitest';
 import { EventLogService, EventLog } from '../../src/core/event-log.js';
-import type { DailyStats, DeepReflectionEventData } from '../../src/types/event-types.js';
+import type { DailyStats, DeepReflectionEventData, DiagnosticianReportEventData } from '../../src/types/event-types.js';
 import * as fs from 'fs';
 import * as path from 'path';
 import * as os from 'os';
@@ -252,5 +252,60 @@ describe('EventLog', () => {
       expect(stats.pain.avgScore).toBe(60); // (50+70+60)/3 = 60
       expect(stats.pain.maxScore).toBe(70);
     });
+    // PD-FUNNEL-1.2: Legacy backward compat — old events with { success: boolean } shape
+    // Stats are loaded from daily-stats.json (not re-read from JSONL), so we
+    // populate the stats cache directly by writing to daily-stats.json and
+    // creating a new EventLog instance that loads it via loadStats().
+    it('should count legacy success:true events in diagnosticianReportsWritten', () => {
+      const today = new Date().toISOString().slice(0, 10);
+      // Build a legacy daily-stats.json entry: old format had no category on
+      // diagnostician_report, and success:true meant it counted as written.
+      // statsFile lives at {tempDir}/logs/daily-stats.json (see EventLog constructor).
+      const statsFile = path.join(tempDir, 'logs', 'daily-stats.json');
+      fs.mkdirSync(path.dirname(statsFile), { recursive: true });
+      const legacyDailyStats = JSON.stringify({
+        [today]: {
+          date: today,
+          createdAt: new Date().toISOString(),
+          updatedAt: new Date().toISOString(),
+          tools: { total: 0, success: 0, failure: 0 },
+          pain: { signalsDetected: 0, avgScore: 0, maxScore: 0, signalsBySource: {} },
+          empathy: { totalEvents: 0, dedupedCount: 0, dedupeHitRate: 0, rolledBackScore: 0, rollbackCount: 0, bySeverity: { mild: 0, moderate: 0, severe: 0 }, scoreBySeverity: { mild: 0, moderate: 0, severe: 0 }, byDetectionMode: { structured: 0, legacy_tag: 0 }, byOrigin: { assistant_self_report: 0, user_manual: 0, system_infer: 0 }, confidenceDistribution: { high: 0, medium: 0, low: 0 }, dailyTrend: [] },
+          hooks: { total: 0, success: 0, failure: 0, byType: {} },
+          evolution: {
+            diagnosisTasksWritten: 0, heartbeatsInjected: 0,
+            diagnosticianReportsWritten: 1,  // legacy success:true counted here
+            reportsMissingJson: 0, reportsIncompleteFields: 0,
+            principleCandidatesCreated: 0, rulesEnforced: 0,
+            nocturnalDreamerCompleted: 0, nocturnalArtifactPersisted: 0,
+            nocturnalCodeCandidateCreated: 0, rulehostEvaluated: 0,
+            rulehostBlocked: 0, rulehostRequireApproval: 0,
+          },
+        },
+      }, null, 2);
+      fs.writeFileSync(statsFile, legacyDailyStats, 'utf8');
+      // Create new EventLog instance so it loads the legacy stats via loadStats()
+      const reloaded = new EventLog(tempDir);
+      const stats = reloaded.getDailyStats(today);
+      expect(stats.evolution.diagnosticianReportsWritten).toBe(1);
+    });
+    it('should count incomplete_fields in both diagnosticianReportsWritten and reportsIncompleteFields', () => {
+      const today = new Date().toISOString().slice(0, 10);
+      eventLog.recordDiagnosticianReport({
+        taskId: 'task-incomplete',
+        reportPath: '/test/incomplete.json',
+        category: 'incomplete_fields',
+      });
+      eventLog.flush();
+      const stats = eventLog.getDailyStats(today);
+      expect(stats.evolution.diagnosticianReportsWritten).toBe(1);
+      expect(stats.evolution.reportsIncompleteFields).toBe(1);
+      // Other sub-counters should not be set
+      expect(stats.evolution.reportsMissingJson).toBe(0);
+    });
   });
 });

package/tests/hooks/gate-rule-host-pipeline.test.ts CHANGED

@@ -1,385 +1,230 @@
 /**
- * Gate Rule Host Pipeline Integration Tests
+ * Gate Rule Host Only - Pipeline Integration Tests
  *
- * PURPOSE: Verify that the Rule Host is correctly wired into the gate chain
- * between GFI and Progressive Gate, with correct ordering and behavior.
+ * PURPOSE: Verify gate.ts with Rule Host Only (no hardcoded gates).
  *
  * Tests:
- * 1. When GFI blocks, Rule Host is never called
- * 2. When Rule Host blocks, Progressive Gate is never called
- * 3. When Rule Host returns undefined (no active implementations), Progressive Gate runs normally
- * 4. When Rule Host throws, gate continues to Progressive Gate (D-08)
- * 5. Block result uses blockSource='rule-host'
- * 6. Existing gate flow still works when no active implementations exist
+ * 1. Rule Host blocks operation → block result with blockSource='rule-host'
+ * 2. Rule Host allow (no match) → operation passes
+ * 3. Rule Host throws → degrades conservatively, allows operation
+ * 4. Rule Host requireApproval → records event, does not block
+ * 5. Non-target tools (read) → pass through early
  */
-import { describe, it, expect, vi, beforeEach, afterEach } from 'vitest';
+import { describe, it, expect, vi, beforeEach } from 'vitest';
 import { handleBeforeToolCall } from '../../src/hooks/gate.js';
-import * as fs from 'fs';
-import * as path from 'path';
-import { WorkspaceContext } from '../../src/core/workspace-context.js';
 import * as sessionTracker from '../../src/core/session-tracker.js';
 import * as evolutionEngine from '../../src/core/evolution-engine.js';
-// Mock fs
-vi.mock('fs');
+const workspaceDir = '/mock/workspace';
+const sessionId = 'test-session-rh';
-// Mock workspace context
-vi.mock('../../src/core/workspace-context.js');
+const mockEvolution = {
+  getTier: vi.fn().mockReturnValue(3),
+  getPoints: vi.fn().mockReturnValue(200),
+};
-// Mock session tracker
 vi.mock('../../src/core/session-tracker.js', () => ({
   getSession: vi.fn(() => ({ currentGfi: 0 })),
   trackBlock: vi.fn(),
   hasRecentThinking: vi.fn(() => false),
 }));
-// Mock evolution engine
-vi.mock('../../src/core/evolution-engine.js', async () => {
-  const actual = await vi.importActual('../../src/core/evolution-engine.js');
-  return {
-    ...actual,
-    checkEvolutionGate: vi.fn(() => ({ allowed: true, currentTier: 'SEED' })),
-    getEvolutionEngine: vi.fn(),
-  };
-});
+vi.mock('../../src/core/evolution-engine.js', () => ({
+  getEvolutionEngine: vi.fn(() => mockEvolution),
+}));
-// Mock Rule Host module — controls RuleHost.evaluate behavior
-// Use a shared mutable evaluate mock that tests can override
-let _mockEvaluate: ReturnType<typeof vi.fn> = vi.fn().mockReturnValue(undefined);
+const mockEventLogInstance = {
+  recordRuleHostEvaluated: vi.fn(),
+  recordRuleEnforced: vi.fn(),
+  recordRuleHostBlocked: vi.fn(),
+  recordRuleHostRequireApproval: vi.fn(),
+};
+vi.mock('../../src/core/event-log.js', () => ({
+  EventLogService: { get: vi.fn(() => mockEventLogInstance) },
+}));
-vi.mock('../../src/core/rule-host.js', () => {
-  return {
-    RuleHost: vi.fn(function(this: any, _stateDir: string) {
-      this.evaluate = _mockEvaluate;
-    }),
-  };
-});
+let _mockEvaluate = vi.fn().mockReturnValue(undefined);
+vi.mock('../../src/core/rule-host.js', () => ({
+  RuleHost: vi.fn(function(this: any, _stateDir: string, _logger: any) {
+    this.evaluate = _mockEvaluate;
+  }),
+}));
-// Mock ledger to avoid file reads
 vi.mock('../../src/core/principle-tree-ledger.js', () => ({
   loadLedger: vi.fn(),
   listImplementationsByLifecycleState: vi.fn(() => []),
 }));
-import { RuleHost } from '../../src/core/rule-host.js';
-import * as sessionTrackerModule from '../../src/core/session-tracker.js';
-import * as evolutionEngineModule from '../../src/core/evolution-engine.js';
-const MockedRuleHost = vi.mocked(RuleHost);
-const mockEvolution = {
-  getTier: vi.fn().mockReturnValue(3),
-  getPoints: vi.fn().mockReturnValue(200),
-};
-describe('Gate Rule Host Pipeline Integration', () => {
-  const workspaceDir = '/mock/workspace';
-  const sessionId = 'test-session-rh';
-  const mockConfig = {
-    get: vi.fn().mockImplementation((key: string) => {
-      if (key === 'trust') return {
-        limits: { stage_2_max_lines: 50, stage_3_max_lines: 300 }
-      };
-      if (key === 'gfi_gate') return {
-        enabled: true,
-        thresholds: { low_risk_block: 70, high_risk_block: 40 },
-        bash_safe_patterns: ['^(ls|dir|pwd)$'],
-        bash_dangerous_patterns: ['rm\\s+-rf'],
-      };
-      return undefined;
-    })
-  };
-  const mockEventLog = {
-    recordGateBlock: vi.fn(),
-    recordPlanApproval: vi.fn(),
-    recordGateBypass: vi.fn(),
-  };
-  const mockTrajectory = {
-    recordGateBlock: vi.fn(),
-  };
-  const mockWctx = {
-    workspaceDir,
-    stateDir: '/mock/state',
-    config: mockConfig,
-    eventLog: mockEventLog,
-    trajectory: mockTrajectory,
-    evolution: mockEvolution,
-    resolve: vi.fn().mockImplementation((key: string) => {
-      if (key === 'PROFILE') return path.join(workspaceDir, '.principles', 'PROFILE.json');
-      if (key === 'PLAN') return path.join(workspaceDir, 'PLAN.md');
-      if (key === 'STATE_DIR') return path.join(workspaceDir, '.state');
-      if (typeof key === 'string' && !key.includes(':')) {
-        return path.join(workspaceDir, key);
-      }
-      return key;
-    }),
-  };
+describe('Gate Rule Host Only Pipeline', () => {
   beforeEach(() => {
     vi.clearAllMocks();
-    vi.useFakeTimers();
-    // Reset the shared evaluate mock to default (returns undefined)
     _mockEvaluate = vi.fn().mockReturnValue(undefined);
-    MockedRuleHost.mockImplementation(function(this: any, _stateDir: string) {
-      this.evaluate = _mockEvaluate;
-    });
-    vi.mocked(WorkspaceContext.fromHookContext).mockReturnValue(mockWctx as any);
-    vi.mocked(sessionTrackerModule.getSession).mockReturnValue({ currentGfi: 0 } as any);
-    vi.mocked(sessionTrackerModule.trackBlock).mockImplementation(() => {});
-    vi.mocked(evolutionEngineModule.getEvolutionEngine).mockReturnValue(mockEvolution);
   });
-  afterEach(() => {
-    vi.useRealTimers();
-  });
+  describe('Rule Host blocks', () => {
+    it('should block with blockSource=rule-host when Rule Host returns block', () => {
+      _mockEvaluate = vi.fn().mockReturnValue({
+        decision: 'block',
+        matched: true,
+        reason: 'Dangerous git force-push detected',
+        ruleId: 'R_001',
+        principleId: 'P_001',
+      });
+      const event = {
+        toolName: 'bash',
+        params: { command: 'git push --force' },
+      };
-  /**
-   * Helper: create a standard write event
-   */
-  function makeWriteEvent(overrides?: Partial<any>) {
-    return {
-      toolName: 'write',
-      params: {
-        file_path: 'src/test.ts',
-        content: 'const x = 1;',
-      },
-      ...overrides,
-    };
-  }
-  /**
-   * Helper: set up fs mocks for a profile with progressive gate enabled
-   */
-  function setupProfileMock(profileOverrides?: Record<string, unknown>) {
-    vi.mocked(fs.existsSync).mockImplementation((p: any) => {
-      if (typeof p === 'string' && p.includes('PROFILE.json')) return true;
-      return false;
-    });
-    vi.mocked(fs.readFileSync).mockImplementation((p: any) => {
-      if (typeof p === 'string' && p.includes('PROFILE.json')) {
-        return JSON.stringify({
-          risk_paths: [],
-          progressive_gate: { enabled: true },
-          edit_verification: { enabled: true },
-          ...profileOverrides,
-        });
-      }
-      return '';
-    });
-  }
-  // ═══════════════════════════════════════════════════════════════════════════
-  // TEST 1: When GFI blocks, Rule Host is never called
-  // ═══════════════════════════════════════════════════════════════════════════
-  it('should not call Rule Host when GFI gate blocks', () => {
-    // Set high GFI to trigger GFI block
-    vi.mocked(sessionTrackerModule.getSession).mockReturnValue({ currentGfi: 85 } as any);
-    setupProfileMock();
-    const result = handleBeforeToolCall(makeWriteEvent() as any, { workspaceDir, sessionId } as any);
-    // GFI should block
-    expect(result).toBeDefined();
-    expect(result?.block).toBe(true);
-    expect(result?.blockReason).toContain('GFI');
-    // RuleHost constructor should NOT have been called
-    // (GFI returns before reaching Rule Host evaluation)
-    expect(MockedRuleHost).not.toHaveBeenCalled();
-  });
+      const result = handleBeforeToolCall(event as any, { workspaceDir, sessionId } as any);
-  // ═══════════════════════════════════════════════════════════════════════════
-  // TEST 2: When Rule Host blocks, Progressive Gate is never called
-  // ═══════════════════════════════════════════════════════════════════════════
-  it('should not reach Progressive Gate when Rule Host blocks', () => {
-    setupProfileMock();
-    // Mock RuleHost.evaluate to return a block
-    _mockEvaluate = vi.fn().mockReturnValue({
-      decision: 'block',
-      matched: true,
-      reason: 'Rule Host test block',
-    });
-    MockedRuleHost.mockImplementation(function(this: any, _stateDir: string) {
-      this.evaluate = _mockEvaluate;
+      expect(result).toBeDefined();
+      expect(result?.block).toBe(true);
+      expect(result?.blockReason).toContain('Dangerous git force-push detected');
     });
-    const result = handleBeforeToolCall(makeWriteEvent() as any, { workspaceDir, sessionId } as any);
+    it('should record rulehost_blocked event when Rule Host blocks', () => {
+      _mockEvaluate = vi.fn().mockReturnValue({
+        decision: 'block',
+        matched: true,
+        reason: 'High-risk path',
+        ruleId: 'R_002',
+      });
+      const event = {
+        toolName: 'write',
+        params: { file_path: 'src/danger.ts', content: 'bad' },
+      };
-    // Rule Host should block
-    expect(result).toBeDefined();
-    expect(result?.block).toBe(true);
+      handleBeforeToolCall(event as any, { workspaceDir, sessionId } as any);
-    // The block should come from rule-host
-    expect(mockEventLog.recordGateBlock).toHaveBeenCalledWith(
-      sessionId,
-      expect.objectContaining({ blockSource: 'rule-host' })
-    );
+      expect(mockEventLogInstance.recordRuleHostBlocked).toHaveBeenCalledWith(
+        expect.objectContaining({
+          toolName: 'write',
+          ruleId: 'R_002',
+        })
+      );
+    });
   });
-  // ═══════════════════════════════════════════════════════════════════════════
-  // TEST 3: When Rule Host returns undefined, Progressive Gate runs normally
-  // ═══════════════════════════════════════════════════════════════════════════
-  it('should continue to Progressive Gate when Rule Host returns undefined', () => {
-    setupProfileMock();
+  describe('Rule Host allows', () => {
+    it('should allow when Rule Host returns undefined (no match)', () => {
+      _mockEvaluate = vi.fn().mockReturnValue(undefined);
-    // Mock RuleHost.evaluate to return undefined (no active implementations)
-    _mockEvaluate = vi.fn().mockReturnValue(undefined);
-    MockedRuleHost.mockImplementation(function(this: any, _stateDir: string) {
-      this.evaluate = _mockEvaluate;
-    });
+      const event = {
+        toolName: 'write',
+        params: { file_path: 'src/safe.ts', content: 'const x = 1' },
+      };
-    const result = handleBeforeToolCall(makeWriteEvent() as any, { workspaceDir, sessionId } as any);
+      const result = handleBeforeToolCall(event as any, { workspaceDir, sessionId } as any);
-    // Should pass through (no block from any gate)
-    expect(result).toBeUndefined();
+      expect(result).toBeUndefined();
+    });
-    // Rule Host was called
-    expect(_mockEvaluate).toHaveBeenCalled();
-  });
+    it('should record rulehost_evaluated even when no match', () => {
+      _mockEvaluate = vi.fn().mockReturnValue(undefined);
-  // ═══════════════════════════════════════════════════════════════════════════
-  // TEST 4: When Rule Host throws, gate continues to Progressive Gate (D-08)
-  // ═══════════════════════════════════════════════════════════════════════════
-  it('should continue to Progressive Gate when Rule Host throws (D-08)', () => {
-    setupProfileMock();
+      const event = {
+        toolName: 'edit',
+        params: { file_path: 'src/config.ts', oldText: 'x', newText: 'y' },
+      };
-    // Mock RuleHost.evaluate to throw
-    _mockEvaluate = vi.fn().mockImplementation(() => {
-      throw new Error('Host internal error');
-    });
-    MockedRuleHost.mockImplementation(function(this: any, _stateDir: string) {
-      this.evaluate = _mockEvaluate;
+      handleBeforeToolCall(event as any, { workspaceDir, sessionId } as any);
+      expect(mockEventLogInstance.recordRuleHostEvaluated).toHaveBeenCalledWith(
+        expect.objectContaining({
+          toolName: 'edit',
+          matched: false,
+          decision: 'allow',
+        })
+      );
     });
+  });
-    const result = handleBeforeToolCall(makeWriteEvent() as any, { workspaceDir, sessionId } as any);
+  describe('Rule Host degradation', () => {
+    it('should allow operation when Rule Host throws (conservative degradation)', () => {
+      _mockEvaluate = vi.fn().mockImplementation(() => {
+        throw new Error('Host internal error');
+      });
-    // Should pass through (host error is caught, degrades to Progressive Gate)
-    // Progressive Gate will pass for this low-risk operation
-    expect(result).toBeUndefined();
-  });
+      const event = {
+        toolName: 'bash',
+        params: { command: 'ls -la' },
+      };
-  // ═══════════════════════════════════════════════════════════════════════════
-  // TEST 5: Block result uses blockSource='rule-host'
-  // ═══════════════════════════════════════════════════════════════════════════
-  it('should use blockSource=rule-host for Rule Host blocks', () => {
-    setupProfileMock();
+      const result = handleBeforeToolCall(event as any, { workspaceDir, sessionId } as any);
-    _mockEvaluate = vi.fn().mockReturnValue({
-      decision: 'block',
-      matched: true,
-      reason: 'Dangerous file modification',
-    });
-    MockedRuleHost.mockImplementation(function(this: any, _stateDir: string) {
-      this.evaluate = _mockEvaluate;
+      expect(result).toBeUndefined();
     });
+  });
-    const result = handleBeforeToolCall(makeWriteEvent() as any, { workspaceDir, sessionId } as any);
+  describe('Rule Host requireApproval', () => {
+    it('should not block when Rule Host returns requireApproval', () => {
+      _mockEvaluate = vi.fn().mockReturnValue({
+        decision: 'requireApproval',
+        matched: true,
+        reason: 'High-risk operation needs approval',
+        ruleId: 'R_003',
+      });
+      const event = {
+        toolName: 'bash',
+        params: { command: 'rm -rf node_modules' },
+      };
-    expect(result?.block).toBe(true);
+      const result = handleBeforeToolCall(event as any, { workspaceDir, sessionId } as any);
-    // Verify recordGateBlockAndReturn was called with blockSource='rule-host'
-    expect(mockEventLog.recordGateBlock).toHaveBeenCalledWith(
-      sessionId,
-      expect.objectContaining({
-        blockSource: 'rule-host',
-        reason: 'Dangerous file modification',
-      })
-    );
+      expect(result).toBeUndefined();
+      expect(mockEventLogInstance.recordRuleEnforced).toHaveBeenCalledWith(
+        expect.objectContaining({ enforcement: 'requireApproval' })
+      );
+    });
   });
-  // ═══════════════════════════════════════════════════════════════════════════
-  // TEST 5b: requireApproval result uses blockSource='rule-host' with reason
-  // ═══════════════════════════════════════════════════════════════════════════
-  it('should use blockSource=rule-host with approval prefix for requireApproval', () => {
-    setupProfileMock();
-    _mockEvaluate = vi.fn().mockReturnValue({
-      decision: 'requireApproval',
-      matched: true,
-      reason: 'High-risk path requires approval',
-    });
-    MockedRuleHost.mockImplementation(function(this: any, _stateDir: string) {
-      this.evaluate = _mockEvaluate;
-    });
+  describe('Early return for non-target tools', () => {
+    it('should allow read tool without calling Rule Host', () => {
+      const event = {
+        toolName: 'read',
+        params: { file_path: 'src/readonly.ts' },
+      };
-    const result = handleBeforeToolCall(makeWriteEvent() as any, { workspaceDir, sessionId } as any);
+      const result = handleBeforeToolCall(event as any, { workspaceDir, sessionId } as any);
-    expect(result?.block).toBe(true);
-    expect(mockEventLog.recordGateBlock).toHaveBeenCalledWith(
-      sessionId,
-      expect.objectContaining({
-        blockSource: 'rule-host',
-        reason: expect.stringContaining('[Rule Host] Approval required'),
-      })
-    );
-  });
+      expect(result).toBeUndefined();
+      expect(_mockEvaluate).not.toHaveBeenCalled();
+    });
-  // ═══════════════════════════════════════════════════════════════════════════
-  // TEST 6: Existing gate flow still works when no active implementations exist
-  // ═══════════════════════════════════════════════════════════════════════════
-  it('should allow operation through existing gate flow with no active implementations', () => {
-    setupProfileMock();
+    it('should allow agent tool without calling Rule Host when no workspace', () => {
+      const event = {
+        toolName: 'agent',
+        params: { task: 'do something' },
+      };
-    // Default mock: RuleHost.evaluate returns undefined (already set in beforeEach)
-    const result = handleBeforeToolCall(makeWriteEvent() as any, { workspaceDir, sessionId } as any);
+      const result = handleBeforeToolCall(event as any, { sessionId } as any);
-    // Should pass all gates — no block
-    expect(result).toBeUndefined();
+      expect(result).toBeUndefined();
+      expect(_mockEvaluate).not.toHaveBeenCalled();
+    });
   });
-  it('should block with GFI even when Rule Host would allow', () => {
-    // High GFI triggers GFI block
-    vi.mocked(sessionTrackerModule.getSession).mockReturnValue({ currentGfi: 85 } as any);
-    setupProfileMock();
+  describe('Session GFI context', () => {
+    it('should pass current GFI to Rule Host', () => {
+      _mockEvaluate = vi.fn().mockReturnValue(undefined);
+      vi.mocked(sessionTracker.getSession).mockReturnValue({ currentGfi: 75 } as any);
-    // Even if RuleHost would allow, GFI blocks first
-    const result = handleBeforeToolCall(makeWriteEvent() as any, { workspaceDir, sessionId } as any);
+      const event = {
+        toolName: 'write',
+        params: { file_path: 'src/test.ts', content: 'x' },
+      };
-    expect(result?.block).toBe(true);
-    expect(result?.blockReason).toContain('GFI');
-  });
+      handleBeforeToolCall(event as any, { workspaceDir, sessionId } as any);
-  it('should allow edit when oldText matches (full pipeline with Rule Host)', () => {
-    const fileContent = 'const x = 1;\n';
-    const editEvent = {
-      toolName: 'edit',
-      params: {
-        file_path: 'src/example.ts',
-        oldText: 'const x = 1;',
-        newText: 'const x = 2;',
-      },
-    };
-    setupProfileMock();
-    vi.mocked(fs.readFileSync).mockImplementation((p: any) => {
-      if (typeof p === 'string' && p.includes('PROFILE.json')) {
-        return JSON.stringify({
-          risk_paths: [],
-          progressive_gate: { enabled: true },
-          edit_verification: { enabled: true },
-        });
-      }
-      if (typeof p === 'string' && p.includes('example.ts')) {
-        return fileContent;
-      }
-      return '';
+      expect(_mockEvaluate).toHaveBeenCalledWith(
+        expect.objectContaining({
+          session: expect.objectContaining({ currentGfi: 75 }),
+        })
+      );
     });
-    vi.mocked(fs.statSync).mockReturnValue({ size: 1000 } as any);
-    vi.mocked(fs.existsSync).mockImplementation((p: any) => {
-      if (typeof p === 'string' && p.includes('PROFILE.json')) return true;
-      if (typeof p === 'string' && p.includes('example.ts')) return true;
-      return false;
-    });
-    const result = handleBeforeToolCall(editEvent as any, { workspaceDir, sessionId } as any);
-    expect(result).toBeUndefined();
   });
 });

package/tests/service/evolution-worker.compilation-backfill.test.ts CHANGED

@@ -70,7 +70,11 @@ const noopLogger: PluginLogger = {
 afterEach(() => {
   vi.restoreAllMocks();
   for (const dir of tempDirs.splice(0)) {
-    fs.rmSync(dir, { recursive: true, force: true });
+    try {
+      fs.rmSync(dir, { recursive: true, force: true });
+    } catch {
+      // On Windows, temp dirs may be held open — ignore cleanup errors
+    }
   }
 });