npm - obol-ai - Versions diffs - 0.3.8 → 0.3.10 - Mend

obol-ai 0.3.8 → 0.3.10

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (10) hide show

package/CHANGELOG.md CHANGED Viewed

@@ -1,3 +1,7 @@
+## 0.3.10
+- add CLI commands for evolve and curiosity, verbose logging
+- fix pattern analysis: enforce factual observations, use incrementObservation
 ## 0.3.8
 - override haiku to sonnet when recent history has tool use

package/bin/obol.js CHANGED Viewed

@@ -94,4 +94,20 @@ program
     await reauth();
   });
+// Manual trigger for an evolution cycle. The optional [userId] argument is
+// parsed as a base-10 integer; when omitted, undefined is passed through.
+program
+  .command('evolve [userId]')
+  .description('Trigger an evolution cycle manually')
+  .action(async (userId) => {
+    // Required lazily so the module is only loaded when this command runs.
+    const { evolve } = require('../src/cli/evolve');
+    // Explicit radix: without it parseInt reads a "0x..." argument as hexadecimal.
+    await evolve({ userId: userId ? Number.parseInt(userId, 10) : undefined });
+  });
+// Manual trigger for a curiosity cycle. Same [userId] handling as the evolve command.
+program
+  .command('curiosity [userId]')
+  .description('Trigger a curiosity cycle manually')
+  .action(async (userId) => {
+    // Required lazily so the module is only loaded when this command runs.
+    const { curiosity } = require('../src/cli/curiosity');
+    // Explicit radix: without it parseInt reads a "0x..." argument as hexadecimal.
+    await curiosity({ userId: userId ? Number.parseInt(userId, 10) : undefined });
+  });
 program.parse();

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "obol-ai",
-  "version": "0.3.8",
+  "version": "0.3.10",
   "description": "Self-evolving AI assistant that learns, remembers, and acts on its own. Persistent vector memory, self-rewriting personality, proactive heartbeats.",
   "main": "src/index.js",
   "bin": {
@@ -10,6 +10,10 @@
     "start": "node src/index.js",
     "test": "vitest run",
     "test:watch": "vitest",
+    "evolve": "node bin/obol.js evolve",
+    "curiosity": "node bin/obol.js curiosity",
+    "bench": "node src/cli/prompt-bench.js",
+    "debug": "node src/cli/prompt-debug.js",
     "prepublishOnly": "node src/cli/changelog.js",
     "postinstall": "pip3 install faster-whisper 2>/dev/null || pip install faster-whisper 2>/dev/null || echo 'Note: faster-whisper not installed (Python/pip unavailable). Voice transcription will be disabled.'"
   },

package/src/analysis.js CHANGED Viewed

@@ -124,10 +124,10 @@ async function structureReport(client, report, scheduler, patterns, chatId, time
           items: {
             type: 'object',
             properties: {
-              key: { type: 'string', description: 'Stable identifier e.g. "timing.active_hours"' },
+              key: { type: 'string', description: 'Stable dot-notation identifier for this pattern, e.g. "timing.active_hours", "mood.stress_signals", "humor.style"' },
               dimension: { type: 'string', enum: ['timing', 'mood', 'humor', 'engagement', 'communication', 'topics'] },
-              summary: { type: 'string', description: 'Human-readable statement e.g. "Usually active 7-10pm"' },
-              data: { type: 'object', description: 'Structured supporting data' },
+              summary: { type: 'string', description: 'Factual observation about the user, e.g. "Most active between 7-10pm on weekdays", "Uses sarcasm and dry humor when relaxed"' },
+              data: { type: 'object', description: 'Factual evidence only. Examples: {"peak_hours":["19:00-22:00"],"peak_days":["mon","wed","fri"]} or {"preferred_topics":["crypto","music"]} or {"avg_message_length":"short","uses_caps":false}. Never put notes, commentary, or meta-analysis here.' },
               confidence: { type: 'number', description: '0-1' },
             },
             required: ['key', 'dimension', 'summary', 'confidence'],
@@ -139,9 +139,11 @@ async function structureReport(client, report, scheduler, patterns, chatId, time
   }];
   try {
+    const patternGuidance = `Extract behavioral patterns about this user from the report. Each pattern must be a factual observation about the user's behavior — not notes about your analysis process. If you see the same pattern in the existing list, reuse its exact key and update the summary/confidence. Skip patterns already at confidence >0.8 unless new evidence contradicts them.`;
     const system = formattedPatterns
-      ? `Existing behavioral patterns for this user:\n${formattedPatterns}\n\n---\n\nConvert this analytical report into structured data using the save_analysis tool. Use existing patterns to calibrate confidence scores (higher if confirming, consider skipping if already well-established at >0.8). Flag contradictions in pattern data.`
-      : 'Convert this analytical report into structured data using the save_analysis tool. Extract all follow-ups and patterns mentioned.';
+      ? `Existing behavioral patterns for this user:\n${formattedPatterns}\n\n---\n\n${patternGuidance}`
+      : `Convert this analytical report into structured data using the save_analysis tool. ${patternGuidance}`;
     const response = await client.messages.create({
       model: 'claude-sonnet-4-6',
@@ -169,8 +171,10 @@ async function structureReport(client, report, scheduler, patterns, chatId, time
     for (const p of patternList) {
       if (!p.key || !p.dimension || !p.summary) continue;
-      await patterns.upsert(p.key, p.dimension, p.summary, p.data || {}, p.confidence || 0.5).catch(e =>
-        console.error('[analysis] Failed to upsert pattern:', e.message)
+      const existing = await patterns.get(p.key).catch(() => null);
+      const save = existing ? patterns.incrementObservation : patterns.upsert;
+      await save(p.key, p.dimension, p.summary, p.data || {}, p.confidence || 0.5).catch(e =>
+        console.error('[analysis] Failed to save pattern:', e.message)
       );
     }

package/src/cli/curiosity.js ADDED Viewed

@@ -0,0 +1,62 @@
+const { loadConfig, ensureUserDir } = require('../config');
+const { createMemory } = require('../memory');
+const { createSelfMemory } = require('../memory/self');
+const { createPatterns } = require('../soul/patterns');
+const { createAnthropicClient } = require('../claude/client');
+const { runCuriosity } = require('../curiosity');
+async function runCuriosityCli({ userId: userIdArg } = {}) { // CLI entry point: runs one curiosity cycle for a user and prints the outcome
+  process.env.OBOL_VERBOSE = '1'; // turns on the env-gated [curiosity] progress logging for this run
+  const config = loadConfig({ resolve: false }); // resolve: false presumably skips secret resolution; TODO confirm against ../config
+  if (!config?.anthropic) { // the anthropic and supabase config sections are both required; exit code 1 otherwise
+    console.error('Anthropic not configured. Run: obol init');
+    process.exit(1);
+  }
+  if (!config?.supabase) {
+    console.error('Supabase not configured. Run: obol init');
+    process.exit(1);
+  }
+  const allowedUsers = config.telegram?.allowedUsers || [];
+  const userId = userIdArg || allowedUsers[0]; // any falsy argument (undefined, 0, NaN) falls back to the first allowed Telegram user
+  if (!userId) {
+    console.error('No user ID found. Pass <userId> or configure telegram.allowedUsers');
+    process.exit(1);
+  }
+  const userDir = ensureUserDir(userId);
+  console.log(`Starting curiosity cycle for user ${userId}...`);
+  const client = createAnthropicClient(config.anthropic);
+  const selfMemory = await createSelfMemory(config.supabase, 0); // not guarded and outside the try: a rejection here propagates to the caller
+  const memory = await createMemory(config.supabase, userId).catch(() => null); // best-effort: null when creation fails
+  const patterns = await createPatterns(config.supabase, userId).catch(() => null); // best-effort: null when creation fails
+  const parts = []; // text sections that are joined into peopleContext below
+  if (memory) {
+    const recent = await memory.recent({ limit: 3 }).catch(() => []); // a failed lookup is treated as no recent memories
+    if (recent.length) parts.push(recent.map(m => `- ${m.content}`).join('\n'));
+  }
+  if (patterns) {
+    const fmt = await patterns.format().catch(() => null);
+    if (fmt) parts.push(fmt);
+  }
+  const peopleContext = parts.join('\n\n') || undefined; // undefined when neither memories nor patterns produced text
+  try {
+    const result = await runCuriosity(client, selfMemory, userId, { memory, patterns, peopleContext, userDir });
+    console.log(`\nCuriosity cycle complete — stored ${result.count} things`);
+  } catch (e) {
+    console.error(`Curiosity cycle failed: ${e.message}`);
+    process.exit(1); // NOTE(review): process.exit ends the process here, so the finally block is not reached on this path
+  } finally {
+    delete process.env.OBOL_VERBOSE; // restore the environment after a successful run
+  }
+}
+module.exports = { curiosity: runCuriosityCli };

package/src/cli/evolve.js ADDED Viewed

@@ -0,0 +1,72 @@
+const { loadConfig, ensureUserDir } = require('../config');
+const { createMemory } = require('../memory');
+const { createSelfMemory } = require('../memory/self');
+const { createMessageLog } = require('../messages');
+const { createAnthropicClient } = require('../claude/client');
+async function runEvolve({ userId: userIdArg } = {}) { // CLI entry point: runs one evolution cycle for a user and prints a summary
+  process.env.OBOL_VERBOSE = '1'; // turns on the env-gated [evolve] progress logging for this run
+  const config = loadConfig({ resolve: false }); // resolve: false presumably skips secret resolution; TODO confirm against ../config
+  if (!config?.anthropic) { // the anthropic and supabase config sections are both required; exit code 1 otherwise
+    console.error('Anthropic not configured. Run: obol init');
+    process.exit(1);
+  }
+  if (!config?.supabase) {
+    console.error('Supabase not configured. Run: obol init');
+    process.exit(1);
+  }
+  const allowedUsers = config.telegram?.allowedUsers || [];
+  const userId = userIdArg || allowedUsers[0]; // any falsy argument (undefined, 0, NaN) falls back to the first allowed Telegram user
+  if (!userId) {
+    console.error('No user ID found. Pass <userId> or configure telegram.allowedUsers');
+    process.exit(1);
+  }
+  const userDir = ensureUserDir(userId);
+  console.log(`Starting evolution for user ${userId}...`);
+  const client = createAnthropicClient(config.anthropic);
+  const memory = await createMemory(config.supabase, userId); // not guarded and outside the try: a rejection here propagates to the caller
+  const selfMemory = await createSelfMemory(config.supabase, 0).catch(() => null); // best-effort: null when creation fails
+  const messageLog = createMessageLog(config.supabase, memory, config.anthropic, userId, userDir);
+  try {
+    const { evolve } = require('../evolve'); // required lazily, inside the try, so a load failure is reported by the catch below
+    const result = await evolve(client, messageLog, memory, userDir, config.supabase, selfMemory);
+    console.log(`\nEvolution #${result.evolutionNumber} complete`);
+    console.log(`  Soul: ${result.previousLength} → ${result.newLength} chars`);
+    if (result.scriptsFixed) console.log('  Scripts: fixed after test regression'); // at most one of the two script status lines is printed
+    else if (result.scriptsRolledBack) console.log('  Scripts: rolled back (tests failed)');
+    if (result.upgrades?.length > 0) {
+      console.log('  New capabilities:');
+      for (const u of result.upgrades) {
+        console.log(`    - ${u.name}: ${u.description}`);
+      }
+    }
+    if (result.deployedApps?.length > 0) {
+      console.log('  Deployed:');
+      for (const app of result.deployedApps) {
+        console.log(`    - ${app.name}${app.url ? ` → ${app.url}` : ` (failed: ${app.error})`}`); // shows the url when present, otherwise the recorded error
+      }
+    }
+    if (result.changelog) console.log(`\n  ${result.changelog}`);
+  } catch (e) {
+    console.error(`Evolution failed: ${e.message}`);
+    process.exit(1); // NOTE(review): process.exit ends the process here, so the finally block is not reached on this path
+  } finally {
+    delete process.env.OBOL_VERBOSE; // restore the environment after a successful run
+  }
+}
+module.exports = { evolve: runEvolve };

package/src/curiosity/index.js CHANGED Viewed

@@ -107,10 +107,12 @@ You can search your own memory to see what you already know before looking thing
     context ? `What you have access to:\n\n${context}` : null,
   ].filter(Boolean).join('\n\n');
+  const log = process.env.OBOL_VERBOSE ? (msg) => console.log(`[curiosity] ${msg}`) : () => {};
   const messages = [{ role: 'user', content: `What are you curious about right now?` }];
   let stored = 0;
   for (let i = 0; i < MAX_ITERATIONS; i++) {
+    log(`Iteration ${i + 1}/${MAX_ITERATIONS}...`);
     const response = await client.messages.create({
       model: RESEARCH_MODEL,
       max_tokens: 2000,
@@ -121,12 +123,24 @@ You can search your own memory to see what you already know before looking thing
     messages.push({ role: 'assistant', content: response.content });
-    if (response.stop_reason === 'end_turn') break;
+    const textBlocks = response.content.filter(b => b.type === 'text').map(b => b.text).join(' ');
+    if (textBlocks) log(`  Text: ${textBlocks.substring(0, 200)}`);
+    log(`  Stop reason: ${response.stop_reason}`);
+    if (response.stop_reason === 'end_turn') {
+      if (stored === 0 && i < 3) {
+        log('  No saves yet — nudging to continue...');
+        messages.push({ role: 'user', content: 'Keep going — search the web, explore that thread, and save what you find with the remember tool. Don\'t just reflect, actually look things up.' });
+        continue;
+      }
+      break;
+    }
     if (response.stop_reason !== 'tool_use') break;
     const toolResults = [];
     for (const block of response.content) {
       if (block.type !== 'tool_use') continue;
+      log(`  Tool: ${block.name}${block.name === 'remember' ? ` — ${block.input.content?.substring(0, 100)}` : block.name === 'web_search' ? ` — "${block.input.query}"` : block.name === 'knowledge_search' ? ` — "${block.input.query}"` : ''}`);
       if (block.name === 'remember') {
         try {

package/src/evolve/backup.js CHANGED Viewed

@@ -1,11 +1,11 @@
 async function backupSnapshot(message, userDir) { // best-effort backup of userDir via runBackup; never throws to the caller
   try {
     const { loadConfig } = require('../config');
-    const cfg = loadConfig();
-    if (cfg?.github) {
-      const { runBackup } = require('../backup');
-      await runBackup(cfg.github, message, userDir);
-    }
+    const cfg = loadConfig({ resolve: false }); // first load is used only to check that the github settings are present
+    if (!cfg?.github?.token || !cfg?.github?.username || !cfg?.github?.repo) return; // skip quietly unless token, username and repo are all set
+    const resolved = loadConfig(); // second load with default options, presumably with values resolved; TODO confirm against ../config
+    const { runBackup } = require('../backup');
+    await runBackup(resolved.github, message, userDir);
   } catch {} // any failure (config load, require, backup) is swallowed on purpose
 }

package/src/evolve/data.js CHANGED Viewed

@@ -45,7 +45,8 @@ async function fetchRecentMessages(messageLog, state) {
       `${messageLog.url}/rest/v1/obol_messages?order=created_at.asc&limit=500&select=role,content,created_at${userFilter}${sinceFilter}`,
       { headers: messageLog.headers }
     );
-    return await res.json();
+    const data = await res.json();
+    return Array.isArray(data) ? data : [];
   } catch (e) {
     console.error('[evolve] Failed to fetch recent messages:', e.message);
     return [];
@@ -73,7 +74,8 @@ async function fetchMemories(memory, messageLog, state) {
       `${url}/rest/v1/obol_memory?select=content,category,importance&order=importance.desc,accessed_at.desc&limit=20${memUserFilter}`,
       { headers }
     );
-    coreMemories = await res.json();
+    const coreData = await res.json();
+    coreMemories = Array.isArray(coreData) ? coreData : [];
   } catch (e) {
     console.error('[evolve] Failed to fetch core memories:', e.message);
   }
@@ -85,7 +87,8 @@ async function fetchMemories(memory, messageLog, state) {
       `${url}/rest/v1/obol_memory?select=content,category,importance,tags,created_at,source&order=created_at.asc&limit=100${memUserFilter}${sinceFilter}`,
       { headers }
     );
-    recentMemories = await res.json();
+    const recentData = await res.json();
+    recentMemories = Array.isArray(recentData) ? recentData : [];
   } catch (e) {
     console.error('[evolve] Failed to fetch recent memories:', e.message);
   }

package/src/evolve/evolve.js CHANGED Viewed

@@ -22,6 +22,8 @@ const MODELS = {
 const MAX_FIX_ATTEMPTS = 1;
 async function evolve(claudeClient, messageLog, memory, userDir, supabaseConfig = null, selfMemory = null) {
+  const log = process.env.OBOL_VERBOSE ? (msg) => console.log(`[evolve] ${msg}`) : () => {};
   const { PERSONALITY_DIR } = require('../soul');
   const baseDir = userDir || OBOL_DIR;
   const state = loadEvolutionState(userDir);
@@ -33,16 +35,20 @@ async function evolve(claudeClient, messageLog, memory, userDir, supabaseConfig
   const testsDir = path.join(baseDir, 'tests');
   const commandsDir = path.join(baseDir, 'commands');
+  log('Loading current personality files...');
   const currentSoul = fs.existsSync(soulPath) ? fs.readFileSync(soulPath, 'utf-8') : '';
   const currentUser = fs.existsSync(userPath) ? fs.readFileSync(userPath, 'utf-8') : '';
   const currentAgents = fs.existsSync(agentsPath) ? fs.readFileSync(agentsPath, 'utf-8') : '';
   const currentScripts = readDir(scriptsDir);
   const currentTests = readDir(testsDir);
   const currentCommands = readDir(commandsDir);
+  log(`  Soul: ${currentSoul.length} chars, Scripts: ${Object.keys(currentScripts).length}, Tests: ${Object.keys(currentTests).length}, Commands: ${Object.keys(currentCommands).length}`);
+  log('Fetching messages and memories...');
   const recentMessages = await fetchRecentMessages(messageLog, state);
   const { coreMemories, recentMemories } = await fetchMemories(memory, messageLog, state);
   const selfMemories = await fetchSelfMemories(selfMemory);
+  log(`  Messages: ${recentMessages.length}, Core memories: ${coreMemories.length}, Recent memories: ${recentMemories.length}, Self memories: ${selfMemories.length}`);
   let previousSoul = '';
   const archiveDir = path.join(PERSONALITY_DIR, 'evolution');
@@ -53,6 +59,7 @@ async function evolve(claudeClient, messageLog, memory, userDir, supabaseConfig
         .sort();
       if (archives.length > 0) {
         previousSoul = fs.readFileSync(path.join(archiveDir, archives[archives.length - 1]), 'utf-8');
+        log(`  Previous soul: ${archives[archives.length - 1]} (${previousSoul.length} chars)`);
       }
     }
   } catch {}
@@ -78,10 +85,13 @@ async function evolve(claudeClient, messageLog, memory, userDir, supabaseConfig
     .join('\n\n') || '(no commands)';
   const evolutionNumber = state.evolutionCount + 1;
+  log(`Evolution #${evolutionNumber} (last: ${state.lastEvolution || 'never'})`);
+  log('Pre-evolution backup...');
   await backupSnapshot(`pre-evolution #${evolutionNumber}`, userDir);
   if (memory && recentMessages.length >= 4) {
+    log('Deep consolidating memory...');
     await deepConsolidateMemory(claudeClient, memory, recentMessages, evolutionNumber, MODELS.personality).catch(e =>
       console.error('[evolve] Deep consolidation failed:', e.message)
     );
@@ -90,6 +100,7 @@ async function evolve(claudeClient, messageLog, memory, userDir, supabaseConfig
   const isFirstEvolution = !currentSoul;
   let growthReport = '';
   if (!isFirstEvolution && (recentMemories.length > 0 || recentMessages.length > 0 || selfMemories.length > 0)) {
+    log('Running growth analysis...');
     try {
       const growthResponse = await claudeClient.messages.create({
         model: MODELS.personality,
@@ -122,12 +133,15 @@ ${transcript.substring(0, 30000)}`,
         }],
       });
       growthReport = growthResponse.content.filter(b => b.type === 'text').map(b => b.text).join('\n');
+      log(`  Growth report: ${growthReport.length} chars`);
     } catch (e) {
       console.error('[evolve] Growth analysis failed:', e.message);
     }
   }
+  log('Running baseline tests...');
   const baselineResults = runTests(testsDir);
+  log(`  Baseline: ${baselineResults.passed} passed, ${baselineResults.failed} failed`);
   const firstEvolutionPreamble = isFirstEvolution ? `
 ## FIRST EVOLUTION — IMPORTANT
@@ -152,6 +166,7 @@ A pre-evolution analysis has been conducted comparing your previous state agains
     baselineResults,
   });
+  log('Running main evolution (this takes a while)...');
   const response = await claudeClient.messages.create({
     model: MODELS.personality,
     max_tokens: 16384,
@@ -191,6 +206,7 @@ ${transcript || '(no conversations yet)'}
 Evolve. Rewrite everything that needs rewriting. Write tests for every script. Keep what works. Fix what doesn't.${growthReport ? ' Use the growth report to guide personality continuity and trait adjustments.' : ''}`
     }],
   });
+  log('  Evolution response received');
   const responseText = response.content.filter(b => b.type === 'text').map(b => b.text).join('\n');
@@ -211,11 +227,14 @@ Evolve. Rewrite everything that needs rewriting. Write tests for every script. K
     throw new Error('Evolution produced empty or too-short SOUL.md');
   }
+  log(`  New soul: ${result.soul.length} chars`);
   let scriptsRolledBack = false;
   const hasNewTests = result.tests && typeof result.tests === 'object' && Object.keys(result.tests).length > 0;
   const hasNewScripts = result.scripts && typeof result.scripts === 'object' && Object.keys(result.scripts).length > 0;
   if (hasNewTests) {
+    log(`Writing ${Object.keys(result.tests).length} new tests...`);
     syncDir(testsDir, result.tests);
     for (const f of Object.keys(result.tests)) {
       try { fs.chmodSync(path.join(testsDir, f), 0o755); } catch {}
@@ -225,6 +244,7 @@ Evolve. Rewrite everything that needs rewriting. Write tests for every script. K
   const preRefactorResults = hasNewTests ? runTests(testsDir) : baselineResults;
   if (hasNewScripts) {
+    log(`Writing ${Object.keys(result.scripts).length} new scripts...`);
     syncDir(scriptsDir, result.scripts);
     for (const f of Object.keys(result.scripts)) {
       try { fs.chmodSync(path.join(scriptsDir, f), 0o755); } catch {}
@@ -234,11 +254,14 @@ Evolve. Rewrite everything that needs rewriting. Write tests for every script. K
   let scriptsFixed = false;
   if (hasNewTests || hasNewScripts) {
+    log('Running post-refactor tests...');
     let postRefactorResults = runTests(testsDir);
+    log(`  Post-refactor: ${postRefactorResults.passed} passed, ${postRefactorResults.failed} failed`);
     let fixAttempt = 0;
     while (postRefactorResults.failed > preRefactorResults.failed && fixAttempt < MAX_FIX_ATTEMPTS) {
       fixAttempt++;
+      log(`  Fix attempt ${fixAttempt}/${MAX_FIX_ATTEMPTS}...`);
       try {
         const fixResponse = await claudeClient.messages.create({
@@ -288,6 +311,7 @@ Fix the scripts. Tests define correct behavior.`
             if (postRefactorResults.failed <= preRefactorResults.failed) {
               scriptsFixed = true;
+              log('  Scripts fixed');
             }
           }
         }
@@ -297,6 +321,7 @@ Fix the scripts. Tests define correct behavior.`
     }
     if (postRefactorResults.failed > preRefactorResults.failed) {
+      log('  Rolling back scripts...');
       syncDir(scriptsDir, currentScripts);
       for (const f of Object.keys(currentScripts)) {
         try { fs.chmodSync(path.join(scriptsDir, f), 0o755); } catch {}
@@ -312,6 +337,7 @@ Fix the scripts. Tests define correct behavior.`
     }
   }
+  log('Archiving previous soul...');
   fs.mkdirSync(archiveDir, { recursive: true });
   if (currentSoul) {
     const timestamp = new Date().toISOString().slice(0, 10);
@@ -321,6 +347,7 @@ Fix the scripts. Tests define correct behavior.`
     );
   }
+  log('Writing new soul...');
   fs.writeFileSync(soulPath, result.soul);
   if (supabaseConfig) {
     const { backup } = require('../soul');
@@ -330,22 +357,27 @@ Fix the scripts. Tests define correct behavior.`
   }
   if (result.user && result.user.length > 50) {
+    log('Writing USER.md...');
     fs.writeFileSync(userPath, result.user);
   }
   if (result.agents && result.agents.length > 50) {
+    log('Writing AGENTS.md...');
     fs.writeFileSync(agentsPath, result.agents);
   }
   if (result.commands && typeof result.commands === 'object') {
     if (Object.keys(result.commands).length > 0 || Object.keys(currentCommands).length > 0) {
+      log(`Writing ${Object.keys(result.commands).length} commands...`);
       syncDir(commandsDir, result.commands);
     }
   }
+  log('Building and deploying apps...');
   const deployedApps = await buildAndDeployApps(result, baseDir);
   if (result.dependencies && Array.isArray(result.dependencies) && result.dependencies.length > 0) {
+    log(`Installing dependencies: ${result.dependencies.join(', ')}...`);
     try {
       const validDeps = result.dependencies.filter(isValidNpmPackage);
       if (validDeps.length === 0) throw new Error('No valid package names found');
@@ -370,6 +402,7 @@ Fix the scripts. Tests define correct behavior.`
   saveEvolutionState(state, userDir);
   if (memory) {
+    log('Saving evolution memory...');
     const changelog = result.changelog || `Evolution #${evolutionNumber} completed.`;
     const rollbackNote = scriptsRolledBack ? ' Scripts rolled back due to test regression.' : scriptsFixed ? ' Scripts fixed after test regression.' : '';
     await memory.add(
@@ -385,8 +418,10 @@ Fix the scripts. Tests define correct behavior.`
     }
   }
+  log('Post-evolution backup...');
   await backupSnapshot(`post-evolution #${evolutionNumber}`, userDir);
+  log('Done');
   return {
     evolutionNumber,
     previousLength: currentSoul.length,