npm - pikakit - Versions diffs - 1.0.7 → 1.0.9 - Mend

pikakit 1.0.7 → 1.0.9

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (24) hide show

package/README.md +10 -6
package/bin/kit.mjs +6 -2
package/bin/lib/commands/help.js +13 -8
package/bin/lib/config.js +4 -2
package/lib/agent-cli/lib/ab-testing.js +508 -0
package/lib/agent-cli/lib/causality-engine.js +623 -0
package/lib/agent-cli/lib/dashboard-data.js +365 -0
package/lib/agent-cli/lib/fix.js +1 -1
package/lib/agent-cli/lib/metrics-collector.js +523 -0
package/lib/agent-cli/lib/metrics-schema.js +410 -0
package/lib/agent-cli/lib/precision-skill-generator.js +584 -0
package/lib/agent-cli/lib/recall.js +1 -1
package/lib/agent-cli/lib/reinforcement.js +610 -0
package/lib/agent-cli/lib/ui/index.js +37 -14
package/package.json +4 -2
package/lib/agent-cli/lib/auto-learn.js +0 -319
package/lib/agent-cli/scripts/adaptive_engine.js +0 -381
package/lib/agent-cli/scripts/error_sensor.js +0 -565
package/lib/agent-cli/scripts/learn_from_failure.js +0 -225
package/lib/agent-cli/scripts/pattern_analyzer.js +0 -781
package/lib/agent-cli/scripts/skill_injector.js +0 -387
package/lib/agent-cli/scripts/success_sensor.js +0 -500
package/lib/agent-cli/scripts/user_correction_sensor.js +0 -426
package/lib/agent-cli/services/auto-learn-service.js +0 -247

package/README.md CHANGED Viewed

@@ -12,7 +12,7 @@
 ## ⚡ Installation
 ```bash
-npx pikakit add pikakit/agent-skills
+npx pikakit
 ```
 **That's it!** One command installs everything:
@@ -34,6 +34,10 @@ npx pikakit add pikakit/agent-skills
 ### 1. Add Skills from GitHub
 ```bash
+# Recommended: One command install
+npx pikakit
+# Or specify a repo:
 npx pikakit add <owner>/<repo>
 # Examples:
@@ -126,19 +130,19 @@ agent watch                 # Real-time monitor
 ### Install Official Skills
 ```bash
-npx pikakit add pikakit/agent-skills
+npx pikakit add pikakit-agent-skills
 ```
 ### Install to Global Location
 ```bash
-npx pikakit add pikakit/agent-skills --global
+npx pikakit add pikakit-agent-skills --global
 ```
 ### Force Reinstall
 ```bash
-npx pikakit add pikakit/agent-skills --force
+npx pikakit add pikakit-agent-skills --force
 ```
 ---
@@ -193,7 +197,7 @@ npm install                        # Node.js dependencies
 | Package | Purpose |
 |---------|---------|
-| [agent-skills](https://github.com/pikakit/agent-skills) | Main skills repository |
+| [pikakit-agent-skills](https://www.npmjs.com/package/pikakit-agent-skills) | Main skills repository |
 | [pikakit](https://www.npmjs.com/package/pikakit) | This CLI installer |
 ---
@@ -220,7 +224,7 @@ cd pikakit
 npm install
 # Run locally
-node bin/cli.mjs add pikakit/agent-skills
+node bin/cli.mjs add pikakit-agent-skills
 ```
 ---

package/bin/kit.mjs CHANGED Viewed

@@ -1,10 +1,10 @@
-#!/usr/bin/env node
+#!/usr/bin/env node
 /**
  * Install Agent Skill CLI
  * @description Package manager for AI Agent Skills
  */
 import { c, brandedIntro } from "./lib/ui.js";
-import { command, params, VERSION } from "./lib/config.js";
+import { command, params, VERSION, DEFAULT_REPO } from "./lib/config.js";
 // --- Command Registry ---
 const COMMANDS = {
@@ -67,6 +67,10 @@ async function main() {
         if (found) {
             const cmdModule = await import(found.config.module);
             await cmdModule.run(found.config.hasParam ? params[0] : undefined);
+        } else if (command === "" || command === undefined) {
+            // NEW: No command = default install from pikakit/agent-skills
+            const cmdModule = await import("./lib/commands/install.js");
+            await cmdModule.run(DEFAULT_REPO);
         } else if (command.includes("/")) {
             // Direct install via org/repo syntax
             const cmdModule = await import("./lib/commands/install.js");

package/bin/lib/commands/help.js CHANGED Viewed

@@ -137,19 +137,24 @@ function showQuickStart() {
   step(c.bold("Quick Start Guide"), S.diamondFilled, "cyan");
   stepLine();
-  step(c.bold("1. Install skills"));
-  step("   " + c.cyan("kit pikakit/agent-skills"));
+  step(c.bold("1. Install PikaKit (Recommended)"));
+  step("   " + c.cyan("npx pikakit"));
+  step("   " + c.dim("→ Installs all skills from pikakit/agent-skills"));
   stepLine();
-  step(c.bold("2. Choose scope"));
-  step("   " + c.dim("→ Current Project (local .agent/)"));
-  step("   " + c.dim("→ Global System (available everywhere)"));
+  step(c.bold("2. Or install from specific repo"));
+  step("   " + c.cyan("npx pikakit add <org/repo>"));
+  step("   " + c.dim("Example: npx pikakit add pikakit/agent-skills"));
   stepLine();
-  step(c.bold("3. Check installation"));
-  step("   " + c.cyan("kit doctor"));
+  step(c.bold("3. Initialize directory only"));
+  step("   " + c.cyan("npx pikakit init"));
   stepLine();
-  step(c.bold("4. Use in your AI"));
+  step(c.bold("4. Check installation"));
+  step("   " + c.cyan("npx pikakit doctor"));
+  stepLine();
+  step(c.bold("5. Use in your AI"));
   step("   " + c.dim("Skills are now available in .agent/skills/"));
 }

package/bin/lib/config.js CHANGED Viewed

@@ -30,8 +30,8 @@ export const BACKUP_DIR = path.join(CACHE_ROOT, "backups");
 const args = process.argv.slice(2);
-/** Command name (first non-flag argument) */
-export const command = args[0] || "help";
+/** Command name (first non-flag argument, empty string if none) */
+export const command = args[0] || "";
 /** All flags (starting with --) */
 export const flags = new Set(args.filter((a) => a.startsWith("--")));
@@ -79,3 +79,5 @@ export const VERSION = (() => {
     catch { return "1.2.0"; }
 })();
+/** Default skills repository for npx pikakit shorthand */
+export const DEFAULT_REPO = "pikakit/agent-skills";

package/lib/agent-cli/lib/ab-testing.js ADDED Viewed

@@ -0,0 +1,508 @@
+/**
+ * AutoLearn v6.0 - A/B Testing Engine
+ *
+ * Compares patterns to determine which is more effective.
+ * Uses statistical significance to select winners.
+ *
+ * Key concepts:
+ * - Split Traffic: 50/50 allocation between patterns
+ * - Track Outcomes: Success rate per pattern
+ * - Statistical Significance: Chi-square test
+ * - Winner Selection: Auto-select when significant
+ *
+ * @version 6.0.0
+ * @author PikaKit
+ */
+import fs from 'fs';
+import path from 'path';
+import { recordABTestEvent } from './metrics-collector.js';
+import { applyReinforcement, REINFORCEMENT_RULES } from './reinforcement.js';
+// ============================================================================
+// CONFIGURATION
+// ============================================================================
+const KNOWLEDGE_DIR = path.join(process.cwd(), '.agent', 'knowledge'); // resolved from the working directory when this module loads
+const AB_TESTS_FILE = path.join(KNOWLEDGE_DIR, 'ab-tests.json'); // single JSON file holding the array of all test records
+// Minimum samples each variant needs before significance is evaluated (default for a test's `minSamples`)
+const MIN_SAMPLES_PER_VARIANT = 10;
+// Confidence level for statistical significance (95%); exposed via the default export, while the chi-square check compares against a fixed critical value
+const SIGNIFICANCE_LEVEL = 0.95;
+// Default maximum test duration in milliseconds (7 days); default for a test's `maxDuration`
+const DEFAULT_TEST_DURATION_MS = 7 * 24 * 60 * 60 * 1000;
+// ============================================================================
+// A/B TEST DATA STRUCTURE
+// ============================================================================
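+/**
+ * @typedef {Object} ABTest
+ * @property {string} id - Test ID
+ * @property {string} createdAt - ISO timestamp of when the test was created
+ * @property {string|null} startedAt - ISO timestamp set when the test is started
+ * @property {string|null} endedAt - ISO timestamp set when the test is completed
+ * @property {string} status - 'pending' | 'running' | 'completed' | 'cancelled'
+ * @property {Object} patternA - Pattern A details
+ * @property {Object} patternB - Pattern B details (or baseline)
+ * @property {number} allocation - Probability of assigning a task to pattern A (0.5 = 50/50)
+ * @property {number} minSamples - Samples required per variant before significance is checked
+ * @property {number} maxDuration - Maximum test duration in milliseconds
+ * @property {Object} metrics - Success metrics per variant
+ * @property {Object|null} result - Test result when completed
+ */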
+// ============================================================================
+// TEST MANAGEMENT
+// ============================================================================
+/**
+ * Create a new A/B test
+ * @param {Object} patternA - First pattern
+ * @param {Object} patternB - Second pattern (or null for baseline)
+ * @param {Object} options - Test options
+ * @returns {Object} - Created test
+ */
+export function createABTest(patternA, patternB = null, options = {}) {
+    const test = {
+        id: `AB-${Date.now()}`,
+        createdAt: new Date().toISOString(),
+        startedAt: null,
+        endedAt: null,
+        status: 'pending',
+        // Patterns
+        patternA: {
+            id: patternA.id,
+            confidence: patternA.confidence,
+            name: patternA.name || patternA.id
+        },
+        patternB: patternB ? {
+            id: patternB.id,
+            confidence: patternB.confidence,
+            name: patternB.name || patternB.id
+        } : {
+            id: 'baseline',
+            confidence: null,
+            name: 'No pattern (baseline)'
+        },
+        // Configuration
+        allocation: options.allocation || 0.5,
+        minSamples: options.minSamples || MIN_SAMPLES_PER_VARIANT,
+        maxDuration: options.maxDuration || DEFAULT_TEST_DURATION_MS,
+        // Metrics
+        metrics: {
+            patternA: { applied: 0, success: 0, failure: 0, totalTime: 0 },
+            patternB: { applied: 0, success: 0, failure: 0, totalTime: 0 }
+        },
+        // Result (filled when completed)
+        result: null
+    };
+    saveABTest(test);
+    return test;
+}
+/**
+ * Start an A/B test
+ * @param {string} testId - Test ID
+ * @returns {Object} - Updated test
+ */
+export function startABTest(testId) {
+    const test = loadABTest(testId);
+    if (!test) return null;
+    test.status = 'running';
+    test.startedAt = new Date().toISOString();
+    saveABTest(test);
+    return test;
+}
+/**
+ * Get which variant to use for a task
+ * @param {string} testId - Test ID
+ * @returns {string} - 'patternA' | 'patternB'
+ */
+export function getVariantForTask(testId) {
+    const test = loadABTest(testId);
+    if (!test || test.status !== 'running') {
+        return null;
+    }
+    // Simple random allocation
+    return Math.random() < test.allocation ? 'patternA' : 'patternB';
+}
+/**
+ * Record outcome for an A/B test
+ * @param {string} testId - Test ID
+ * @param {string} variant - 'patternA' | 'patternB'
+ * @param {Object} outcome - Task outcome
+ */
+export function recordABOutcome(testId, variant, outcome) {
+    const test = loadABTest(testId);
+    if (!test || test.status !== 'running') return null;
+    const metrics = test.metrics[variant];
+    if (!metrics) return null;
+    metrics.applied++;
+    if (outcome.success) {
+        metrics.success++;
+    } else {
+        metrics.failure++;
+    }
+    if (outcome.duration) {
+        metrics.totalTime += outcome.duration;
+    }
+    // Check if test should complete
+    const shouldComplete = checkTestCompletion(test);
+    if (shouldComplete.complete) {
+        completeABTest(testId, shouldComplete.reason);
+    } else {
+        saveABTest(test);
+    }
+    return test;
+}
+// ============================================================================
+// STATISTICAL ANALYSIS
+// ============================================================================
+/**
+ * Calculate success rate for a variant
+ * @param {Object} metrics - Variant metrics
+ * @returns {number} - Success rate 0.0 to 1.0
+ */
+function calculateSuccessRate(metrics) {
+    if (metrics.applied === 0) return 0;
+    return metrics.success / metrics.applied;
+}
+/**
+ * Calculate chi-square statistic for A/B comparison
+ * @param {Object} metricsA - Pattern A metrics
+ * @param {Object} metricsB - Pattern B metrics
+ * @returns {Object} - Chi-square result
+ */
+function calculateChiSquare(metricsA, metricsB) {
+    const totalA = metricsA.success + metricsA.failure;
+    const totalB = metricsB.success + metricsB.failure;
+    const total = totalA + totalB;
+    if (total === 0) return { chiSquare: 0, significant: false };
+    const successTotal = metricsA.success + metricsB.success;
+    const failureTotal = metricsA.failure + metricsB.failure;
+    // Expected values
+    const expectedASuccess = (totalA * successTotal) / total;
+    const expectedAFailure = (totalA * failureTotal) / total;
+    const expectedBSuccess = (totalB * successTotal) / total;
+    const expectedBFailure = (totalB * failureTotal) / total;
+    // Chi-square calculation
+    let chiSquare = 0;
+    if (expectedASuccess > 0) {
+        chiSquare += Math.pow(metricsA.success - expectedASuccess, 2) / expectedASuccess;
+    }
+    if (expectedAFailure > 0) {
+        chiSquare += Math.pow(metricsA.failure - expectedAFailure, 2) / expectedAFailure;
+    }
+    if (expectedBSuccess > 0) {
+        chiSquare += Math.pow(metricsB.success - expectedBSuccess, 2) / expectedBSuccess;
+    }
+    if (expectedBFailure > 0) {
+        chiSquare += Math.pow(metricsB.failure - expectedBFailure, 2) / expectedBFailure;
+    }
+    // Critical value for 95% confidence, 1 degree of freedom
+    const criticalValue = 3.841;
+    const significant = chiSquare > criticalValue;
+    return {
+        chiSquare,
+        criticalValue,
+        significant,
+        confidence: significant ? 0.95 : chiSquare / criticalValue * 0.95
+    };
+}
+/**
+ * Analyze A/B test results
+ * @param {Object} test - A/B test object
+ * @returns {Object} - Analysis result
+ */
+export function analyzeABTest(test) {
+    const metricsA = test.metrics.patternA;
+    const metricsB = test.metrics.patternB;
+    const rateA = calculateSuccessRate(metricsA);
+    const rateB = calculateSuccessRate(metricsB);
+    const chiSquareResult = calculateChiSquare(metricsA, metricsB);
+    const avgTimeA = metricsA.applied > 0 ? metricsA.totalTime / metricsA.applied : 0;
+    const avgTimeB = metricsB.applied > 0 ? metricsB.totalTime / metricsB.applied : 0;
+    // Determine winner
+    let winner = null;
+    let winnerReason = '';
+    let margin = 0;
+    if (chiSquareResult.significant) {
+        if (rateA > rateB) {
+            winner = 'patternA';
+            margin = rateA - rateB;
+            winnerReason = `Higher success rate by ${(margin * 100).toFixed(1)}%`;
+        } else if (rateB > rateA) {
+            winner = 'patternB';
+            margin = rateB - rateA;
+            winnerReason = `Higher success rate by ${(margin * 100).toFixed(1)}%`;
+        }
+    } else {
+        winnerReason = 'No statistically significant difference';
+    }
+    return {
+        patternA: {
+            id: test.patternA.id,
+            samples: metricsA.applied,
+            successRate: rateA,
+            avgTime: avgTimeA
+        },
+        patternB: {
+            id: test.patternB.id,
+            samples: metricsB.applied,
+            successRate: rateB,
+            avgTime: avgTimeB
+        },
+        statistics: chiSquareResult,
+        winner,
+        winnerReason,
+        margin,
+        analyzedAt: new Date().toISOString()
+    };
+}
+// ============================================================================
+// TEST COMPLETION
+// ============================================================================
+/**
+ * Check if test should be completed
+ * @param {Object} test - A/B test
+ * @returns {Object} - { complete: boolean, reason: string }
+ */
+function checkTestCompletion(test) {
+    const metricsA = test.metrics.patternA;
+    const metricsB = test.metrics.patternB;
+    // Check minimum samples
+    if (metricsA.applied >= test.minSamples && metricsB.applied >= test.minSamples) {
+        const analysis = analyzeABTest(test);
+        if (analysis.statistics.significant) {
+            return {
+                complete: true,
+                reason: 'Statistical significance reached'
+            };
+        }
+    }
+    // Check max duration
+    if (test.startedAt) {
+        const duration = Date.now() - new Date(test.startedAt).getTime();
+        if (duration > test.maxDuration) {
+            return {
+                complete: true,
+                reason: 'Max duration reached'
+            };
+        }
+    }
+    // Check if one variant is clearly better (early stopping)
+    const totalSamples = metricsA.applied + metricsB.applied;
+    if (totalSamples >= 20) {
+        const rateA = calculateSuccessRate(metricsA);
+        const rateB = calculateSuccessRate(metricsB);
+        const diff = Math.abs(rateA - rateB);
+        // Early stop if difference > 30%
+        if (diff > 0.3) {
+            return {
+                complete: true,
+                reason: 'Clear winner detected (early stopping)'
+            };
+        }
+    }
+    return { complete: false };
+}
+/**
+ * Complete an A/B test and apply results
+ * @param {string} testId - Test ID
+ * @param {string} reason - Completion reason
+ * @returns {Object} - Completed test with results
+ */
+export function completeABTest(testId, reason) {
+    const test = loadABTest(testId);
+    if (!test) return null;
+    const analysis = analyzeABTest(test);
+    test.status = 'completed';
+    test.endedAt = new Date().toISOString();
+    test.result = {
+        ...analysis,
+        completionReason: reason
+    };
+    saveABTest(test);
+    // Record for metrics
+    recordABTestEvent({
+        hasWinner: !!analysis.winner
+    });
+    // Apply reinforcement to winner/loser
+    if (analysis.winner) {
+        applyABTestReinforcement(test, analysis);
+    }
+    return test;
+}
+/**
+ * Apply reinforcement based on A/B test results
+ * @param {Object} test - Completed test
+ * @param {Object} analysis - Test analysis
+ */
+function applyABTestReinforcement(test, analysis) {
+    // Winner gets reward proportional to margin
+    const winnerReward = Math.min(0.15, analysis.margin * 0.5);
+    // Loser gets penalty
+    const loserPenalty = -Math.min(0.10, analysis.margin * 0.3);
+    console.log(`A/B Test ${test.id} completed:`);
+    console.log(`  Winner: ${analysis.winner} (+${winnerReward.toFixed(2)} confidence)`);
+    console.log(`  Reason: ${analysis.winnerReason}`);
+    // Note: Actual pattern updates would be done by caller
+    // This just logs the recommended adjustments
+    return {
+        winnerId: analysis.winner === 'patternA' ? test.patternA.id : test.patternB.id,
+        loserId: analysis.winner === 'patternA' ? test.patternB.id : test.patternA.id,
+        winnerReward,
+        loserPenalty
+    };
+}
+// ============================================================================
+// STORAGE
+// ============================================================================
+/**
+ * Load A/B test from disk
+ * @param {string} testId - Test ID
+ * @returns {Object|null} - Test or null
+ */
+export function loadABTest(testId) {
+    const tests = loadAllABTests();
+    return tests.find(t => t.id === testId) || null;
+}
+/**
+ * Load all A/B tests
+ * @returns {Array} - All tests
+ */
+export function loadAllABTests() {
+    try {
+        if (!fs.existsSync(AB_TESTS_FILE)) return [];
+        return JSON.parse(fs.readFileSync(AB_TESTS_FILE, 'utf8'));
+    } catch {
+        return [];
+    }
+}
+/**
+ * Save A/B test
+ * @param {Object} test - Test to save
+ */
+export function saveABTest(test) {
+    try {
+        if (!fs.existsSync(KNOWLEDGE_DIR)) {
+            fs.mkdirSync(KNOWLEDGE_DIR, { recursive: true });
+        }
+        const tests = loadAllABTests();
+        const existingIndex = tests.findIndex(t => t.id === test.id);
+        if (existingIndex >= 0) {
+            tests[existingIndex] = test;
+        } else {
+            tests.push(test);
+        }
+        fs.writeFileSync(AB_TESTS_FILE, JSON.stringify(tests, null, 2), 'utf8');
+    } catch (error) {
+        console.error('Error saving A/B test:', error.message);
+    }
+}
+/**
+ * Get active A/B tests
+ * @returns {Array} - Running tests
+ */
+export function getActiveTests() {
+    return loadAllABTests().filter(t => t.status === 'running');
+}
+/**
+ * Get A/B test statistics
+ * @returns {Object} - Statistics
+ */
+export function getABTestStats() {
+    const tests = loadAllABTests();
+    const completed = tests.filter(t => t.status === 'completed');
+    const withWinner = completed.filter(t => t.result?.winner);
+    return {
+        total: tests.length,
+        running: tests.filter(t => t.status === 'running').length,
+        completed: completed.length,
+        withWinner: withWinner.length,
+        winRate: completed.length > 0 ? withWinner.length / completed.length : 0,
+        pending: tests.filter(t => t.status === 'pending').length
+    };
+}
+// ============================================================================
+// EXPORTS - default export bundles the exported functions with two configuration constants
+// ============================================================================
+export default {
+    createABTest,
+    startABTest,
+    getVariantForTask,
+    recordABOutcome,
+    analyzeABTest,
+    completeABTest,
+    loadABTest,
+    loadAllABTests,
+    saveABTest,
+    getActiveTests,
+    getABTestStats,
+    MIN_SAMPLES_PER_VARIANT, // default per-variant sample requirement
+    SIGNIFICANCE_LEVEL // 0.95; only reachable through this default export
+};