npm - @sparkleideas/agentdb-onnx - Versions diffs - 1.0.1 - Mend

@sparkleideas/agentdb-onnx 1.0.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/ARCHITECTURE.md +331 -0
package/IMPLEMENTATION-SUMMARY.md +456 -0
package/README.md +418 -0
package/examples/complete-workflow.ts +281 -0
package/package.json +41 -0
package/src/benchmarks/benchmark-runner.ts +301 -0
package/src/cli.ts +245 -0
package/src/index.ts +128 -0
package/src/services/ONNXEmbeddingService.ts +459 -0
package/src/tests/integration.test.ts +302 -0
package/src/tests/onnx-embedding.test.ts +317 -0
package/tsconfig.json +19 -0

package/package.json ADDED Viewed

@@ -0,0 +1,41 @@
+{
+  "name": "@sparkleideas/agentdb-onnx",
+  "version": "1.0.1",
+  "description": "AgentDB with optimized ONNX embeddings - 100% local, GPU-accelerated AI agent memory",
+  "type": "module",
+  "main": "dist/index.js",
+  "types": "dist/index.d.ts",
+  "scripts": {
+    "build": "tsc",
+    "dev": "tsx src/cli.ts",
+    "test": "vitest run",
+    "test:watch": "vitest",
+    "benchmark": "tsx src/benchmarks/benchmark-runner.ts",
+    "example": "tsx examples/complete-workflow.ts"
+  },
+  "keywords": [
+    "agentdb",
+    "onnx",
+    "embeddings",
+    "vector-database",
+    "ai-agents",
+    "local-inference",
+    "gpu-acceleration"
+  ],
+  "dependencies": {
+    "onnxruntime-node": "^1.20.1",
+    "@xenova/transformers": "^2.17.2",
+    "commander": "^12.1.0",
+    "chalk": "^5.3.0",
+    "@sparkleideas/agentdb": "*"
+  },
+  "devDependencies": {
+    "@types/node": "^22.10.2",
+    "tsx": "^4.19.2",
+    "typescript": "^5.7.2",
+    "vitest": "^2.1.8"
+  },
+  "engines": {
+    "node": ">=18.0.0"
+  }
+}

package/src/benchmarks/benchmark-runner.ts ADDED Viewed

@@ -0,0 +1,301 @@
+#!/usr/bin/env tsx
+/**
+ * Comprehensive Performance Benchmarks for AgentDB + ONNX
+ */
+import { createONNXAgentDB } from '../index.js';
+import { unlink } from 'fs/promises';
+import chalk from 'chalk';
+interface BenchmarkResult { // Summary statistics returned by one benchmark() run
+  name: string; // Label the benchmark was run under
+  operations: number; // Number of timed invocations requested
+  totalTime: number; // Elapsed time for the whole loop, in milliseconds
+  opsPerSec: number; // operations / totalTime, scaled to one second
+  avgLatency: number; // Mean of the per-invocation latencies, in milliseconds
+  p50: number; // Median latency, read from the sorted samples
+  p95: number; // 95th-percentile latency, read from the sorted samples
+  p99: number; // 99th-percentile latency, read from the sorted samples
+}
+/**
+ * Time `operations` sequential invocations of `fn` and summarise the latencies.
+ *
+ * Timing uses `performance.now()` (monotonic, sub-millisecond) instead of
+ * `Date.now()`, so very fast operations such as cache hits are not all
+ * rounded down to 0ms.
+ *
+ * @param name - Label printed while running and copied into the result.
+ * @param operations - How many times `fn` is awaited. When no invocation runs
+ *   (zero, negative or NaN) every statistic in the result is 0.
+ * @param fn - Async operation under test; awaited one call at a time.
+ * @returns Total time, throughput, mean latency and p50/p95/p99 latencies,
+ *   all expressed in milliseconds (throughput in operations per second).
+ */
+async function benchmark(
+  name: string,
+  operations: number,
+  fn: () => Promise<void>
+): Promise<BenchmarkResult> {
+  const latencies: number[] = [];
+  console.log(chalk.blue(`\n🏃 Running: ${name}`));
+  console.log(chalk.gray(`   Operations: ${operations}`));
+  // Roughly ten progress dots per run; loop-invariant, so computed once.
+  const progressStep = Math.max(1, Math.floor(operations / 10));
+  const startTime = performance.now();
+  for (let i = 0; i < operations; i++) {
+    const opStart = performance.now();
+    await fn();
+    latencies.push(performance.now() - opStart);
+    if ((i + 1) % progressStep === 0) {
+      process.stdout.write(chalk.gray(`.`));
+    }
+  }
+  const totalTime = performance.now() - startTime;
+  console.log(); // Newline after dots
+  const completed = latencies.length;
+  // Guard the divisions so an empty run reports 0 instead of NaN/Infinity.
+  const opsPerSec = totalTime > 0 ? (completed / totalTime) * 1000 : 0;
+  const avgLatency =
+    completed > 0 ? latencies.reduce((sum, ms) => sum + ms, 0) / completed : 0;
+  // Percentiles are read by index from the ascending-sorted samples.
+  latencies.sort((a, b) => a - b);
+  const percentile = (fraction: number): number =>
+    latencies[Math.floor(completed * fraction)] ?? 0;
+  return {
+    name,
+    operations,
+    totalTime,
+    opsPerSec,
+    avgLatency,
+    p50: percentile(0.5),
+    p95: percentile(0.95),
+    p99: percentile(0.99)
+  };
+}
+/**
+ * Write one benchmark's statistics to stdout: a green heading with the
+ * benchmark name followed by one white line per metric, two decimals each.
+ */
+function printResult(result: BenchmarkResult) {
+  // [label padded to a common width, value, unit suffix]
+  const rows: Array<[string, number, string]> = [
+    ['Total time:     ', result.totalTime, 'ms'],
+    ['Throughput:     ', result.opsPerSec, ' ops/sec'],
+    ['Avg latency:    ', result.avgLatency, 'ms'],
+    ['P50 latency:    ', result.p50, 'ms'],
+    ['P95 latency:    ', result.p95, 'ms'],
+    ['P99 latency:    ', result.p99, 'ms']
+  ];
+  console.log(chalk.green(`\n✅ ${result.name}`));
+  for (const [label, value, unit] of rows) {
+    console.log(chalk.white(`   ${label}${value.toFixed(2)}${unit}`));
+  }
+}
+/**
+ * Main benchmark suite.
+ *
+ * Opens a database at `./benchmark-agentdb-onnx.db`, runs the embedding,
+ * pattern and episode benchmarks one after another, then prints every result
+ * followed by the embedder statistics.
+ *
+ * On failure the error is logged and `process.exitCode` is set to 1. Calling
+ * `process.exit()` here would terminate the process before the `finally`
+ * clause runs, leaving the database open and its file on disk.
+ */
+async function main() {
+  console.log(chalk.bold.cyan('\n╔════════════════════════════════════════╗'));
+  console.log(chalk.bold.cyan('║  AgentDB + ONNX Performance Benchmark  ║'));
+  console.log(chalk.bold.cyan('╚════════════════════════════════════════╝\n'));
+  const dbPath = './benchmark-agentdb-onnx.db';
+  // Tracks a still-open handle so the finally clause can close it after a failure.
+  let openDb: Awaited<ReturnType<typeof createONNXAgentDB>> | undefined;
+  try {
+    // Initialize AgentDB
+    console.log(chalk.yellow('📦 Initializing AgentDB + ONNX...'));
+    const agentdb = await createONNXAgentDB({
+      dbPath,
+      modelName: 'Xenova/all-MiniLM-L6-v2',
+      useGPU: false,
+      batchSize: 32,
+      cacheSize: 10000
+    });
+    openDb = agentdb;
+    console.log(chalk.green('✅ Initialization complete\n'));
+    const results: BenchmarkResult[] = [];
+    // Benchmark 1: Single embedding generation
+    results.push(await benchmark(
+      'Single Embedding Generation',
+      100,
+      async () => {
+        await agentdb.embedder.embed(`Test embedding ${Math.random()}`);
+      }
+    ));
+    // Benchmark 2: Cached embedding access
+    const cachedText = 'This text will be cached';
+    await agentdb.embedder.embed(cachedText); // Warm up cache
+    results.push(await benchmark(
+      'Cached Embedding Access',
+      1000,
+      async () => {
+        await agentdb.embedder.embed(cachedText);
+      }
+    ));
+    // Benchmark 3: Batch embedding (10 items)
+    results.push(await benchmark(
+      'Batch Embedding (10 items)',
+      50,
+      async () => {
+        const texts = Array.from({ length: 10 }, (_, i) =>
+          `Batch text ${i} ${Math.random()}`
+        );
+        await agentdb.embedder.embedBatch(texts);
+      }
+    ));
+    // Benchmark 4: Batch embedding (100 items)
+    results.push(await benchmark(
+      'Batch Embedding (100 items)',
+      10,
+      async () => {
+        const texts = Array.from({ length: 100 }, (_, i) =>
+          `Large batch text ${i} ${Math.random()}`
+        );
+        await agentdb.embedder.embedBatch(texts);
+      }
+    ));
+    // Benchmark 5: Pattern storage
+    results.push(await benchmark(
+      'Pattern Storage (Single)',
+      100,
+      async () => {
+        await agentdb.reasoningBank.storePattern({
+          taskType: 'benchmark',
+          approach: `Approach ${Math.random()}`,
+          successRate: Math.random()
+        });
+      }
+    ));
+    // Benchmark 6: Pattern batch storage (using loops)
+    results.push(await benchmark(
+      'Pattern Storage (Batch of 10)',
+      20,
+      async () => {
+        const patterns = Array.from({ length: 10 }, (_, i) => ({
+          taskType: 'batch-benchmark',
+          approach: `Batch approach ${i} ${Math.random()}`,
+          successRate: Math.random()
+        }));
+        for (const pattern of patterns) {
+          await agentdb.reasoningBank.storePattern(pattern);
+        }
+      }
+    ));
+    // Benchmark 7: Pattern search - pre-populate database
+    for (let i = 0; i < 100; i++) {
+      await agentdb.reasoningBank.storePattern({
+        taskType: 'search-test',
+        approach: `Search approach ${i}`,
+        successRate: Math.random()
+      });
+    }
+    results.push(await benchmark(
+      'Pattern Search (k=10)',
+      100,
+      async () => {
+        await agentdb.reasoningBank.searchPatterns({
+          task: 'search approach',
+          k: 10
+        });
+      }
+    ));
+    // Benchmark 8: Episode storage
+    results.push(await benchmark(
+      'Episode Storage (Single)',
+      100,
+      async () => {
+        await agentdb.reflexionMemory.storeEpisode({
+          sessionId: 'benchmark',
+          task: `Task ${Math.random()}`,
+          reward: Math.random(),
+          success: Math.random() > 0.5,
+          critique: 'Benchmark critique'
+        });
+      }
+    ));
+    // Benchmark 9: Episode batch storage (using loops)
+    results.push(await benchmark(
+      'Episode Storage (Batch of 10)',
+      20,
+      async () => {
+        const episodes = Array.from({ length: 10 }, (_, i) => ({
+          sessionId: 'batch-benchmark',
+          task: `Batch task ${i} ${Math.random()}`,
+          reward: Math.random(),
+          success: Math.random() > 0.5,
+          critique: `Batch critique ${i}`
+        }));
+        for (const episode of episodes) {
+          await agentdb.reflexionMemory.storeEpisode(episode);
+        }
+      }
+    ));
+    // Benchmark 10: Episode retrieval - pre-populate database
+    for (let i = 0; i < 100; i++) {
+      await agentdb.reflexionMemory.storeEpisode({
+        sessionId: 'retrieval-test',
+        task: `Retrieval task ${i}`,
+        reward: Math.random(),
+        success: Math.random() > 0.5
+      });
+    }
+    results.push(await benchmark(
+      'Episode Retrieval (k=10)',
+      100,
+      async () => {
+        await agentdb.reflexionMemory.retrieveRelevant({
+          task: 'retrieval task',
+          k: 10
+        });
+      }
+    ));
+    // Print all results
+    console.log(chalk.bold.cyan('\n\n╔════════════════════════════════════════╗'));
+    console.log(chalk.bold.cyan('║         Benchmark Results              ║'));
+    console.log(chalk.bold.cyan('╚════════════════════════════════════════╝'));
+    results.forEach(printResult);
+    // Print summary
+    console.log(chalk.bold.cyan('\n\n╔════════════════════════════════════════╗'));
+    console.log(chalk.bold.cyan('║            Summary                     ║'));
+    console.log(chalk.bold.cyan('╚════════════════════════════════════════╝\n'));
+    const stats = agentdb.getStats();
+    console.log(chalk.white('📊 Overall Statistics:'));
+    console.log(chalk.white(`   Total embeddings:   ${stats.embedder.totalEmbeddings}`));
+    console.log(chalk.white(`   Avg embedding time: ${stats.embedder.avgLatency.toFixed(2)}ms`));
+    console.log(chalk.white(`   Cache hit rate:     ${(stats.embedder.cache.hitRate * 100).toFixed(1)}%`));
+    console.log(chalk.white(`   Cache size:         ${stats.embedder.cache.size}/${stats.embedder.cache.maxSize}`));
+    // Calculate speedup from batching
+    const singlePattern = results.find(r => r.name === 'Pattern Storage (Single)');
+    const batchPattern = results.find(r => r.name === 'Pattern Storage (Batch of 10)');
+    if (singlePattern && batchPattern && singlePattern.opsPerSec > 0) {
+      // One batch operation stores 10 patterns, so batched throughput in
+      // patterns/sec is batch ops/sec * 10; divide by single patterns/sec.
+      const speedup = (batchPattern.opsPerSec * 10) / singlePattern.opsPerSec;
+      console.log(chalk.white(`\n🚀 Batch speedup:      ${speedup.toFixed(2)}x faster`));
+    }
+    // Cleanup: clear the tracker first so a failing close() is not retried below
+    openDb = undefined;
+    await agentdb.close();
+    console.log(chalk.green('\n✅ Benchmark complete!\n'));
+  } catch (error) {
+    console.error(chalk.red('\n❌ Benchmark failed:'), error);
+    // Not process.exit(1): that would skip the finally clause below.
+    process.exitCode = 1;
+  } finally {
+    if (openDb) {
+      try {
+        await openDb.close();
+      } catch {
+        // Best effort: the run has already been reported as failed.
+      }
+    }
+    try {
+      await unlink(dbPath);
+    } catch {
+      // Best effort: the database file may never have been created.
+    }
+  }
+}
+// Entry point: start the suite; a rejection that escapes main() is printed with console.error
+main().catch((reason) => console.error(reason));

package/src/cli.ts ADDED Viewed

@@ -0,0 +1,245 @@
+#!/usr/bin/env node
+/**
+ * CLI for AgentDB + ONNX
+ */
+import { Command } from 'commander';
+import chalk from 'chalk';
+import { createONNXAgentDB } from './index.js';
+import { unlink } from 'fs/promises';
+// Root commander program; every subcommand below is registered on it.
+const program = new Command();
+program
+  .name('agentdb-onnx')
+  .description('AgentDB with optimized ONNX embeddings')
+  // Must match "version" in package.json, which declares 1.0.1 for this release.
+  .version('1.0.1');
+// Init command: open (creating if needed) a database with the chosen model and
+// embedder settings, then close it again.
+program
+  .command('init')
+  .description('Initialize a new AgentDB with ONNX embeddings')
+  .argument('<db-path>', 'Path to database file')
+  .option('-m, --model <name>', 'Model name', 'Xenova/all-MiniLM-L6-v2')
+  .option('--gpu', 'Enable GPU acceleration')
+  .option('-b, --batch-size <size>', 'Batch size', '32')
+  .option('-c, --cache-size <size>', 'Cache size', '10000')
+  .action(async (dbPath, options) => {
+    try {
+      // Option values arrive as strings; parse as base 10 and reject bad input
+      // here instead of silently handing NaN to createONNXAgentDB.
+      const batchSize = Number.parseInt(options.batchSize, 10);
+      if (!Number.isInteger(batchSize) || batchSize <= 0) {
+        throw new Error(`Invalid --batch-size "${options.batchSize}": expected a positive integer`);
+      }
+      const cacheSize = Number.parseInt(options.cacheSize, 10);
+      if (!Number.isInteger(cacheSize) || cacheSize < 0) {
+        throw new Error(`Invalid --cache-size "${options.cacheSize}": expected a non-negative integer`);
+      }
+      console.log(chalk.blue('Initializing AgentDB + ONNX...'));
+      console.log(chalk.gray(`  Database: ${dbPath}`));
+      console.log(chalk.gray(`  Model:    ${options.model}`));
+      console.log(chalk.gray(`  GPU:      ${options.gpu ? 'enabled' : 'disabled'}`));
+      const agentdb = await createONNXAgentDB({
+        dbPath,
+        modelName: options.model,
+        useGPU: options.gpu,
+        batchSize,
+        cacheSize
+      });
+      console.log(chalk.green('✅ Initialized successfully'));
+      await agentdb.close();
+    } catch (error) {
+      console.error(chalk.red('❌ Error:'), error);
+      process.exit(1);
+    }
+  });
+// Store pattern command: embed and persist one reasoning pattern, printing its ID.
+program
+  .command('store-pattern')
+  .description('Store a reasoning pattern')
+  .argument('<db-path>', 'Database path')
+  .requiredOption('-t, --task-type <type>', 'Task type')
+  .requiredOption('-a, --approach <approach>', 'Approach description')
+  .requiredOption('-s, --success-rate <rate>', 'Success rate (0-1)')
+  .option('--tags <tags>', 'Comma-separated tags')
+  .action(async (dbPath, options) => {
+    try {
+      // Enforce the documented 0-1 range; parseFloat alone lets NaN through.
+      const successRate = Number.parseFloat(options.successRate);
+      if (!Number.isFinite(successRate) || successRate < 0 || successRate > 1) {
+        throw new Error(`Invalid --success-rate "${options.successRate}": expected a number between 0 and 1`);
+      }
+      // "a, b,,c" -> ['a', 'b', 'c']; stays undefined when --tags is omitted.
+      const rawTags: string | undefined = options.tags;
+      const tags = rawTags
+        ?.split(',')
+        .map((tag: string) => tag.trim())
+        .filter((tag: string) => tag.length > 0);
+      const agentdb = await createONNXAgentDB({ dbPath, useGPU: false });
+      const id = await agentdb.reasoningBank.storePattern({
+        taskType: options.taskType,
+        approach: options.approach,
+        successRate,
+        tags
+      });
+      console.log(chalk.green(`✅ Pattern stored with ID: ${id}`));
+      await agentdb.close();
+    } catch (error) {
+      console.error(chalk.red('❌ Error:'), error);
+      process.exit(1);
+    }
+  });
+// Search patterns command: query the reasoning bank and list each match
+program
+  .command('search-patterns')
+  .description('Search for similar patterns')
+  .argument('<db-path>', 'Database path')
+  .argument('<query>', 'Search query')
+  .option('-k, --top-k <k>', 'Number of results', '10')
+  .option('--threshold <threshold>', 'Similarity threshold', '0.7')
+  .option('--task-type <type>', 'Filter by task type')
+  .action(async (dbPath, query, options) => {
+    try {
+      const agentdb = await createONNXAgentDB({ dbPath, useGPU: false });
+      // Option values are strings; convert them before building the query.
+      const limit = parseInt(options.topK);
+      const minSimilarity = parseFloat(options.threshold);
+      // The task-type filter is sent only when --task-type was given.
+      let filters;
+      if (options.taskType) {
+        filters = { taskType: options.taskType };
+      }
+      const matches = await agentdb.reasoningBank.searchPatterns({
+        task: query,
+        k: limit,
+        threshold: minSimilarity,
+        filters
+      });
+      console.log(chalk.blue(`\nFound ${matches.length} patterns:\n`));
+      matches.forEach((pattern, index) => {
+        const successPct = (pattern.successRate * 100).toFixed(1);
+        const similarityPct = (pattern.similarity * 100).toFixed(1);
+        console.log(chalk.white(`${index + 1}. ${pattern.approach}`));
+        console.log(chalk.gray(`   Type:       ${pattern.taskType}`));
+        console.log(chalk.gray(`   Success:    ${successPct}%`));
+        console.log(chalk.gray(`   Similarity: ${similarityPct}%`));
+        const hasTags = pattern.tags && pattern.tags.length > 0;
+        if (hasTags) {
+          console.log(chalk.gray(`   Tags:       ${pattern.tags.join(', ')}`));
+        }
+        console.log();
+      });
+      await agentdb.close();
+    } catch (error) {
+      console.error(chalk.red('❌ Error:'), error);
+      process.exit(1);
+    }
+  });
+// Store episode command: persist one reflexion episode, printing its ID.
+// --success is an optional flag: pass it for a successful episode, omit it for
+// a failed one. (It used to be mandatory and the stored value was hard-coded
+// to true, so failed episodes could not be recorded at all.)
+program
+  .command('store-episode')
+  .description('Store a reflexion episode')
+  .argument('<db-path>', 'Database path')
+  .requiredOption('-s, --session <id>', 'Session ID')
+  .requiredOption('-t, --task <task>', 'Task description')
+  .requiredOption('-r, --reward <reward>', 'Reward (0-1)')
+  .option('--success', 'Task succeeded (omit for a failed episode)')
+  .option('--critique <critique>', 'Self-critique')
+  .action(async (dbPath, options) => {
+    try {
+      // Enforce the documented 0-1 range; parseFloat alone lets NaN through.
+      const reward = Number.parseFloat(options.reward);
+      if (!Number.isFinite(reward) || reward < 0 || reward > 1) {
+        throw new Error(`Invalid --reward "${options.reward}": expected a number between 0 and 1`);
+      }
+      const agentdb = await createONNXAgentDB({ dbPath, useGPU: false });
+      const id = await agentdb.reflexionMemory.storeEpisode({
+        sessionId: options.session,
+        task: options.task,
+        reward,
+        // Boolean flag: true only when --success was passed.
+        success: options.success === true,
+        critique: options.critique
+      });
+      console.log(chalk.green(`✅ Episode stored with ID: ${id}`));
+      await agentdb.close();
+    } catch (error) {
+      console.error(chalk.red('❌ Error:'), error);
+      process.exit(1);
+    }
+  });
+// Search episodes command: query reflexion memory and list each match
+program
+  .command('search-episodes')
+  .description('Search for similar episodes')
+  .argument('<db-path>', 'Database path')
+  .argument('<query>', 'Search query')
+  .option('-k, --top-k <k>', 'Number of results', '10')
+  .option('--only-successes', 'Only successful episodes')
+  .option('--min-reward <reward>', 'Minimum reward threshold')
+  .action(async (dbPath, query, options) => {
+    try {
+      const agentdb = await createONNXAgentDB({ dbPath, useGPU: false });
+      const limit = parseInt(options.topK);
+      // --min-reward has no default, so it is forwarded only when supplied.
+      let minReward;
+      if (options.minReward) {
+        minReward = parseFloat(options.minReward);
+      }
+      const episodes = await agentdb.reflexionMemory.retrieveRelevant({
+        task: query,
+        k: limit,
+        onlySuccesses: options.onlySuccesses,
+        minReward
+      });
+      console.log(chalk.blue(`\nFound ${episodes.length} episodes:\n`));
+      episodes.forEach((episode, index) => {
+        const rewardPct = (episode.reward * 100).toFixed(1);
+        const similarityPct = (episode.similarity * 100).toFixed(1);
+        const outcome = episode.success ? 'Yes' : 'No';
+        console.log(chalk.white(`${index + 1}. ${episode.task}`));
+        console.log(chalk.gray(`   Session:    ${episode.sessionId}`));
+        console.log(chalk.gray(`   Reward:     ${rewardPct}%`));
+        console.log(chalk.gray(`   Success:    ${outcome}`));
+        console.log(chalk.gray(`   Similarity: ${similarityPct}%`));
+        if (episode.critique) {
+          // Show at most 80 characters, marking longer critiques with an ellipsis.
+          const ellipsis = episode.critique.length > 80 ? '...' : '';
+          const preview = episode.critique.substring(0, 80);
+          console.log(chalk.gray(`   Critique:   ${preview}${ellipsis}`));
+        }
+        console.log();
+      });
+      await agentdb.close();
+    } catch (error) {
+      console.error(chalk.red('❌ Error:'), error);
+      process.exit(1);
+    }
+  });
+// Stats command: print the embedder counters and any database statistics
+program
+  .command('stats')
+  .description('Show database statistics')
+  .argument('<db-path>', 'Database path')
+  .action(async (dbPath) => {
+    try {
+      const agentdb = await createONNXAgentDB({ dbPath, useGPU: false });
+      const stats = agentdb.getStats();
+      const embedder = stats.embedder;
+      const hitRatePct = (embedder.cache.hitRate * 100).toFixed(1);
+      console.log(chalk.blue('\n📊 AgentDB + ONNX Statistics\n'));
+      console.log(chalk.white('Embeddings:'));
+      console.log(chalk.gray(`  Model:          ${embedder.model}`));
+      console.log(chalk.gray(`  Total:          ${embedder.totalEmbeddings}`));
+      console.log(chalk.gray(`  Avg latency:    ${embedder.avgLatency.toFixed(2)}ms`));
+      console.log(chalk.gray(`  Cache hit rate: ${hitRatePct}%`));
+      console.log(chalk.gray(`  Cache size:     ${embedder.cache.size}/${embedder.cache.maxSize}`));
+      console.log(chalk.white('\nDatabase:'));
+      // The database section is printed as key/value pairs only when present.
+      if (stats.database) {
+        for (const [key, value] of Object.entries(stats.database)) {
+          console.log(chalk.gray(`  ${key}: ${value}`));
+        }
+      }
+      console.log();
+      await agentdb.close();
+    } catch (error) {
+      console.error(chalk.red('❌ Error:'), error);
+      process.exit(1);
+    }
+  });
+// Benchmark command: loads the benchmark-runner module, which starts the suite on import
+// NOTE(review): --operations is parsed here but never read or forwarded to the runner.
+program
+  .command('benchmark')
+  .description('Run performance benchmarks')
+  .option('--operations <n>', 'Number of operations per test', '100')
+  .action(async (_options) => {
+    console.log(chalk.blue('Running benchmarks...\n'));
+    try {
+      // Dynamic import keeps the benchmark code from loading for other commands
+      await import('./benchmarks/benchmark-runner.js');
+    } catch (failure) {
+      console.error(chalk.red('❌ Benchmark failed:'), failure);
+      process.exit(1);
+    }
+  });
+// Every action handler is async, so use parseAsync(): it returns a promise that
+// settles once the selected handler has finished, and lets a rejection that
+// escapes a handler be reported instead of surfacing as an unhandled rejection.
+program.parseAsync().catch((error) => {
+  console.error(chalk.red('❌ Error:'), error);
+  process.exit(1);
+});