npm - @geminilight/mindos - Versions diffs - 0.6.19 → 0.6.20 - Mend

@geminilight/mindos 0.6.19 → 0.6.20

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (12)

package/app/app/api/ask/route.ts +147 -315
package/app/app/api/settings/test-key/route.ts +3 -47
package/app/components/settings/AiTab.tsx +1 -10
package/app/components/settings/types.ts +0 -1
package/app/hooks/useAiOrganize.ts +1 -0
package/app/lib/agent/model.ts +2 -1
package/app/lib/agent/prompt.ts +23 -0
package/app/lib/agent/tools.ts +12 -0
package/app/lib/i18n-en.ts +0 -1
package/app/lib/i18n-zh.ts +0 -1
package/app/lib/settings.ts +0 -2
package/package.json +1 -1

package/app/app/api/ask/route.ts CHANGED

@@ -16,8 +16,8 @@ import fs from 'fs';
 import path from 'path';
 import { getFileContent, getMindRoot } from '@/lib/fs';
 import { getModelConfig } from '@/lib/agent/model';
-import { getRequestScopedTools, WRITE_TOOLS, truncate } from '@/lib/agent/tools';
-import { AGENT_SYSTEM_PROMPT } from '@/lib/agent/prompt';
+import { getRequestScopedTools, getOrganizeTools, WRITE_TOOLS, truncate } from '@/lib/agent/tools';
+import { AGENT_SYSTEM_PROMPT, ORGANIZE_SYSTEM_PROMPT } from '@/lib/agent/prompt';
 import { toAgentMessages } from '@/lib/agent/to-agent-messages';
 import { logAgentOp } from '@/lib/agent/log';
 import { readSettings } from '@/lib/settings';
@@ -27,24 +27,6 @@ import { assertNotProtected } from '@/lib/core';
 import { scanExtensionPaths } from '@/lib/pi-integration/extensions';
 import type { Message as FrontendMessage } from '@/lib/types';
-// ---------------------------------------------------------------------------
-// Streaming blacklist — caches provider+model combos that don't support SSE.
-// Auto-populated when streaming fails; entries expire after 10 minutes
-// so transient proxy issues don't permanently lock out streaming.
-// ---------------------------------------------------------------------------
-const streamingBlacklist = new Map<string, number>();
-const STREAMING_BLACKLIST_TTL = 10 * 60 * 1000;
-function isStreamingBlacklisted(key: string): boolean {
-  const ts = streamingBlacklist.get(key);
-  if (ts === undefined) return false;
-  if (Date.now() - ts > STREAMING_BLACKLIST_TTL) {
-    streamingBlacklist.delete(key);
-    return false;
-  }
-  return true;
-}
 // ---------------------------------------------------------------------------
 // MindOS SSE format — 6 event types (front-back contract)
 // ---------------------------------------------------------------------------
@@ -270,6 +252,8 @@ export async function POST(req: NextRequest) {
     attachedFiles?: string[];
     uploadedFiles?: Array<{ name: string; content: string }>;
     maxSteps?: number;
+    /** 'organize' = lean prompt for file import organize; default = full prompt */
+    mode?: 'organize' | 'default';
   };
   try {
     body = await req.json();
@@ -278,6 +262,7 @@ export async function POST(req: NextRequest) {
   }
   const { messages, currentFile, attachedFiles, uploadedFiles } = body;
+  const isOrganizeMode = body.mode === 'organize';
   // Read agent config from settings
   const serverSettings = readSettings();
@@ -289,99 +274,7 @@ export async function POST(req: NextRequest) {
   const thinkingBudget = agentConfig.thinkingBudget ?? 5000;
   const contextStrategy = agentConfig.contextStrategy ?? 'auto';
-  // Auto-load skill + bootstrap context for each request.
-  // 1. SKILL.md — complete skill with operating rules (always loaded)
-  // 2. user-skill-rules.md — user's personalized rules from KB root (if exists)
-  const isZh = serverSettings.disabledSkills?.includes('mindos') ?? false;
-  const skillDirName = isZh ? 'mindos-zh' : 'mindos';
-  const appDir = process.env.MINDOS_PROJECT_ROOT
-    ? path.join(process.env.MINDOS_PROJECT_ROOT, 'app')
-    : process.cwd();
-  const skillPath = path.join(appDir, `data/skills/${skillDirName}/SKILL.md`);
-  const skill = readAbsoluteFile(skillPath);
-  const mindRoot = getMindRoot();
-  const userSkillRules = readKnowledgeFile('user-skill-rules.md');
-  const targetDir = dirnameOf(currentFile);
-  const bootstrap = {
-    instruction: readKnowledgeFile('INSTRUCTION.md'),
-    index: readKnowledgeFile('README.md'),
-    config_json: readKnowledgeFile('CONFIG.json'),
-    config_md: readKnowledgeFile('CONFIG.md'),
-    target_readme: targetDir ? readKnowledgeFile(`${targetDir}/README.md`) : null,
-    target_instruction: targetDir ? readKnowledgeFile(`${targetDir}/INSTRUCTION.md`) : null,
-    target_config_json: targetDir ? readKnowledgeFile(`${targetDir}/CONFIG.json`) : null,
-    target_config_md: targetDir ? readKnowledgeFile(`${targetDir}/CONFIG.md`) : null,
-  };
-  // Only report failures + truncation warnings
-  const initFailures: string[] = [];
-  const truncationWarnings: string[] = [];
-  if (!skill.ok) initFailures.push(`skill.mindos: failed (${skill.error})`);
-  if (skill.ok && skill.truncated) truncationWarnings.push('skill.mindos was truncated');
-  if (userSkillRules.ok && userSkillRules.truncated) truncationWarnings.push('user-skill-rules.md was truncated');
-  if (!bootstrap.instruction.ok) initFailures.push(`bootstrap.instruction: failed (${bootstrap.instruction.error})`);
-  if (bootstrap.instruction.ok && bootstrap.instruction.truncated) truncationWarnings.push('bootstrap.instruction was truncated');
-  if (!bootstrap.index.ok) initFailures.push(`bootstrap.index: failed (${bootstrap.index.error})`);
-  if (bootstrap.index.ok && bootstrap.index.truncated) truncationWarnings.push('bootstrap.index was truncated');
-  if (!bootstrap.config_json.ok) initFailures.push(`bootstrap.config_json: failed (${bootstrap.config_json.error})`);
-  if (bootstrap.config_json.ok && bootstrap.config_json.truncated) truncationWarnings.push('bootstrap.config_json was truncated');
-  if (!bootstrap.config_md.ok) initFailures.push(`bootstrap.config_md: failed (${bootstrap.config_md.error})`);
-  if (bootstrap.config_md.ok && bootstrap.config_md.truncated) truncationWarnings.push('bootstrap.config_md was truncated');
-  if (bootstrap.target_readme && !bootstrap.target_readme.ok) initFailures.push(`bootstrap.target_readme: failed (${bootstrap.target_readme.error})`);
-  if (bootstrap.target_readme?.ok && bootstrap.target_readme.truncated) truncationWarnings.push('bootstrap.target_readme was truncated');
-  if (bootstrap.target_instruction && !bootstrap.target_instruction.ok) initFailures.push(`bootstrap.target_instruction: failed (${bootstrap.target_instruction.error})`);
-  if (bootstrap.target_instruction?.ok && bootstrap.target_instruction.truncated) truncationWarnings.push('bootstrap.target_instruction was truncated');
-  if (bootstrap.target_config_json && !bootstrap.target_config_json.ok) initFailures.push(`bootstrap.target_config_json: failed (${bootstrap.target_config_json.error})`);
-  if (bootstrap.target_config_json?.ok && bootstrap.target_config_json.truncated) truncationWarnings.push('bootstrap.target_config_json was truncated');
-  if (bootstrap.target_config_md && !bootstrap.target_config_md.ok) initFailures.push(`bootstrap.target_config_md: failed (${bootstrap.target_config_md.error})`);
-  if (bootstrap.target_config_md?.ok && bootstrap.target_config_md.truncated) truncationWarnings.push('bootstrap.target_config_md was truncated');
-  const initStatus = initFailures.length === 0
-    ? `All initialization contexts loaded successfully. mind_root=${getMindRoot()}${targetDir ? `, target_dir=${targetDir}` : ''}${truncationWarnings.length > 0 ? ` ⚠️ ${truncationWarnings.length} files truncated` : ''}`
-    : `Initialization issues:\n${initFailures.join('\n')}\nmind_root=${getMindRoot()}${targetDir ? `, target_dir=${targetDir}` : ''}${truncationWarnings.length > 0 ? `\n⚠️ Warnings:\n${truncationWarnings.join('\n')}` : ''}`;
-  const initContextBlocks: string[] = [];
-  if (skill.ok) initContextBlocks.push(`## mindos_skill_md\n\n${skill.content}`);
-  // User personalization rules (from knowledge base root)
-  if (userSkillRules.ok && !userSkillRules.truncated && userSkillRules.content.trim()) {
-    initContextBlocks.push(`## user_skill_rules\n\nUser personalization rules (user-skill-rules.md):\n\n${userSkillRules.content}`);
-  }
-  if (bootstrap.instruction.ok) initContextBlocks.push(`## bootstrap_instruction\n\n${bootstrap.instruction.content}`);
-  if (bootstrap.index.ok) initContextBlocks.push(`## bootstrap_index\n\n${bootstrap.index.content}`);
-  if (bootstrap.config_json.ok) initContextBlocks.push(`## bootstrap_config_json\n\n${bootstrap.config_json.content}`);
-  if (bootstrap.config_md.ok) initContextBlocks.push(`## bootstrap_config_md\n\n${bootstrap.config_md.content}`);
-  if (bootstrap.target_readme?.ok) initContextBlocks.push(`## bootstrap_target_readme\n\n${bootstrap.target_readme.content}`);
-  if (bootstrap.target_instruction?.ok) initContextBlocks.push(`## bootstrap_target_instruction\n\n${bootstrap.target_instruction.content}`);
-  if (bootstrap.target_config_json?.ok) initContextBlocks.push(`## bootstrap_target_config_json\n\n${bootstrap.target_config_json.content}`);
-  if (bootstrap.target_config_md?.ok) initContextBlocks.push(`## bootstrap_target_config_md\n\n${bootstrap.target_config_md.content}`);
-  // Build initial context from attached/current files
-  const contextParts: string[] = [];
-  const seen = new Set<string>();
-  const hasAttached = Array.isArray(attachedFiles) && attachedFiles.length > 0;
-  if (hasAttached) {
-    for (const filePath of attachedFiles!) {
-      if (seen.has(filePath)) continue;
-      seen.add(filePath);
-      try {
-        const content = truncate(getFileContent(filePath));
-        contextParts.push(`## Attached: ${filePath}\n\n${content}`);
-      } catch { /* ignore missing files */ }
-    }
-  }
-  if (currentFile && !seen.has(currentFile)) {
-    seen.add(currentFile);
-    try {
-      const content = truncate(getFileContent(currentFile));
-      contextParts.push(`## Current file: ${currentFile}\n\n${content}`);
-    } catch { /* ignore */ }
-  }
-  // Uploaded files
+  // Uploaded files — shared by both modes
   const uploadedParts: string[] = [];
   if (Array.isArray(uploadedFiles) && uploadedFiles.length > 0) {
     for (const f of uploadedFiles.slice(0, 8)) {
@@ -390,60 +283,158 @@ export async function POST(req: NextRequest) {
     }
   }
-  // Generate current time for the agent's context
-  const now = new Date();
-  const timeContext = `## Current Time Context
+  // ---------------------------------------------------------------------------
+  // Build system prompt — lean path for organize mode, full path otherwise
+  // ---------------------------------------------------------------------------
+  let systemPrompt: string;
+  if (isOrganizeMode) {
+    // Organize mode: minimal prompt — only KB structure + uploaded files
+    const promptParts: string[] = [ORGANIZE_SYSTEM_PROMPT];
+    promptParts.push(`---\n\nmind_root=${getMindRoot()}`);
+    // Only load root README.md for KB structure awareness (skip SKILL.md, configs, target dir, time, etc.)
+    const bootstrapIndex = readKnowledgeFile('README.md');
+    if (bootstrapIndex.ok) {
+      promptParts.push(`---\n\n## Knowledge Base Structure\n\n${bootstrapIndex.content}`);
+    }
+    if (uploadedParts.length > 0) {
+      promptParts.push(
+        `---\n\n## ⚠️ USER-UPLOADED FILES\n\n` +
+        `Their FULL CONTENT is below. Use this directly — do NOT call read tools on them.\n\n` +
+        uploadedParts.join('\n\n---\n\n'),
+      );
+    }
+    systemPrompt = promptParts.join('\n\n');
+  } else {
+    // Full mode: original prompt assembly
+    // Auto-load skill + bootstrap context for each request.
+    const isZh = serverSettings.disabledSkills?.includes('mindos') ?? false;
+    const skillDirName = isZh ? 'mindos-zh' : 'mindos';
+    const appDir = process.env.MINDOS_PROJECT_ROOT
+      ? path.join(process.env.MINDOS_PROJECT_ROOT, 'app')
+      : process.cwd();
+    const skillPath = path.join(appDir, `data/skills/${skillDirName}/SKILL.md`);
+    const skill = readAbsoluteFile(skillPath);
+    const userSkillRules = readKnowledgeFile('user-skill-rules.md');
+    const targetDir = dirnameOf(currentFile);
+    const bootstrap = {
+      instruction: readKnowledgeFile('INSTRUCTION.md'),
+      index: readKnowledgeFile('README.md'),
+      config_json: readKnowledgeFile('CONFIG.json'),
+      config_md: readKnowledgeFile('CONFIG.md'),
+      target_readme: targetDir ? readKnowledgeFile(`${targetDir}/README.md`) : null,
+      target_instruction: targetDir ? readKnowledgeFile(`${targetDir}/INSTRUCTION.md`) : null,
+      target_config_json: targetDir ? readKnowledgeFile(`${targetDir}/CONFIG.json`) : null,
+      target_config_md: targetDir ? readKnowledgeFile(`${targetDir}/CONFIG.md`) : null,
+    };
+    // Only report failures + truncation warnings
+    const initFailures: string[] = [];
+    const truncationWarnings: string[] = [];
+    if (!skill.ok) initFailures.push(`skill.mindos: failed (${skill.error})`);
+    if (skill.ok && skill.truncated) truncationWarnings.push('skill.mindos was truncated');
+    if (userSkillRules.ok && userSkillRules.truncated) truncationWarnings.push('user-skill-rules.md was truncated');
+    if (!bootstrap.instruction.ok) initFailures.push(`bootstrap.instruction: failed (${bootstrap.instruction.error})`);
+    if (bootstrap.instruction.ok && bootstrap.instruction.truncated) truncationWarnings.push('bootstrap.instruction was truncated');
+    if (!bootstrap.index.ok) initFailures.push(`bootstrap.index: failed (${bootstrap.index.error})`);
+    if (bootstrap.index.ok && bootstrap.index.truncated) truncationWarnings.push('bootstrap.index was truncated');
+    if (!bootstrap.config_json.ok) initFailures.push(`bootstrap.config_json: failed (${bootstrap.config_json.error})`);
+    if (bootstrap.config_json.ok && bootstrap.config_json.truncated) truncationWarnings.push('bootstrap.config_json was truncated');
+    if (!bootstrap.config_md.ok) initFailures.push(`bootstrap.config_md: failed (${bootstrap.config_md.error})`);
+    if (bootstrap.config_md.ok && bootstrap.config_md.truncated) truncationWarnings.push('bootstrap.config_md was truncated');
+    if (bootstrap.target_readme && !bootstrap.target_readme.ok) initFailures.push(`bootstrap.target_readme: failed (${bootstrap.target_readme.error})`);
+    if (bootstrap.target_readme?.ok && bootstrap.target_readme.truncated) truncationWarnings.push('bootstrap.target_readme was truncated');
+    if (bootstrap.target_instruction && !bootstrap.target_instruction.ok) initFailures.push(`bootstrap.target_instruction: failed (${bootstrap.target_instruction.error})`);
+    if (bootstrap.target_instruction?.ok && bootstrap.target_instruction.truncated) truncationWarnings.push('bootstrap.target_instruction was truncated');
+    if (bootstrap.target_config_json && !bootstrap.target_config_json.ok) initFailures.push(`bootstrap.target_config_json: failed (${bootstrap.target_config_json.error})`);
+    if (bootstrap.target_config_json?.ok && bootstrap.target_config_json.truncated) truncationWarnings.push('bootstrap.target_config_json was truncated');
+    if (bootstrap.target_config_md && !bootstrap.target_config_md.ok) initFailures.push(`bootstrap.target_config_md: failed (${bootstrap.target_config_md.error})`);
+    if (bootstrap.target_config_md?.ok && bootstrap.target_config_md.truncated) truncationWarnings.push('bootstrap.target_config_md was truncated');
+    const initStatus = initFailures.length === 0
+      ? `All initialization contexts loaded successfully. mind_root=${getMindRoot()}${targetDir ? `, target_dir=${targetDir}` : ''}${truncationWarnings.length > 0 ? ` ⚠️ ${truncationWarnings.length} files truncated` : ''}`
+      : `Initialization issues:\n${initFailures.join('\n')}\nmind_root=${getMindRoot()}${targetDir ? `, target_dir=${targetDir}` : ''}${truncationWarnings.length > 0 ? `\n⚠️ Warnings:\n${truncationWarnings.join('\n')}` : ''}`;
+    const initContextBlocks: string[] = [];
+    if (skill.ok) initContextBlocks.push(`## mindos_skill_md\n\n${skill.content}`);
+    if (userSkillRules.ok && !userSkillRules.truncated && userSkillRules.content.trim()) {
+      initContextBlocks.push(`## user_skill_rules\n\nUser personalization rules (user-skill-rules.md):\n\n${userSkillRules.content}`);
+    }
+    if (bootstrap.instruction.ok) initContextBlocks.push(`## bootstrap_instruction\n\n${bootstrap.instruction.content}`);
+    if (bootstrap.index.ok) initContextBlocks.push(`## bootstrap_index\n\n${bootstrap.index.content}`);
+    if (bootstrap.config_json.ok) initContextBlocks.push(`## bootstrap_config_json\n\n${bootstrap.config_json.content}`);
+    if (bootstrap.config_md.ok) initContextBlocks.push(`## bootstrap_config_md\n\n${bootstrap.config_md.content}`);
+    if (bootstrap.target_readme?.ok) initContextBlocks.push(`## bootstrap_target_readme\n\n${bootstrap.target_readme.content}`);
+    if (bootstrap.target_instruction?.ok) initContextBlocks.push(`## bootstrap_target_instruction\n\n${bootstrap.target_instruction.content}`);
+    if (bootstrap.target_config_json?.ok) initContextBlocks.push(`## bootstrap_target_config_json\n\n${bootstrap.target_config_json.content}`);
+    if (bootstrap.target_config_md?.ok) initContextBlocks.push(`## bootstrap_target_config_md\n\n${bootstrap.target_config_md.content}`);
+    // Build initial context from attached/current files
+    const contextParts: string[] = [];
+    const seen = new Set<string>();
+    const hasAttached = Array.isArray(attachedFiles) && attachedFiles.length > 0;
+    if (hasAttached) {
+      for (const filePath of attachedFiles!) {
+        if (seen.has(filePath)) continue;
+        seen.add(filePath);
+        try {
+          const content = truncate(getFileContent(filePath));
+          contextParts.push(`## Attached: ${filePath}\n\n${content}`);
+        } catch { /* ignore missing files */ }
+      }
+    }
+    if (currentFile && !seen.has(currentFile)) {
+      seen.add(currentFile);
+      try {
+        const content = truncate(getFileContent(currentFile));
+        contextParts.push(`## Current file: ${currentFile}\n\n${content}`);
+      } catch { /* ignore */ }
+    }
+    const now = new Date();
+    const timeContext = `## Current Time Context
 - Current UTC Time: ${now.toISOString()}
 - System Local Time: ${new Intl.DateTimeFormat('en-US', { dateStyle: 'full', timeStyle: 'long' }).format(now)}
 - Unix Timestamp: ${Math.floor(now.getTime() / 1000)}
 *Note: The times listed above represent "NOW". The user may have sent messages hours or days ago in this same conversation thread. Each user message in the history contains its own specific timestamp which you should refer to when understanding historical context.*`;
-  const promptParts: string[] = [AGENT_SYSTEM_PROMPT];
-  promptParts.push(`---\n\n${timeContext}`);
-  promptParts.push(`---\n\nInitialization status (auto-loaded at request start):\n\n${initStatus}`);
+    const promptParts: string[] = [AGENT_SYSTEM_PROMPT];
+    promptParts.push(`---\n\n${timeContext}`);
+    promptParts.push(`---\n\nInitialization status (auto-loaded at request start):\n\n${initStatus}`);
-  if (initContextBlocks.length > 0) {
-    promptParts.push(`---\n\nInitialization context:\n\n${initContextBlocks.join('\n\n---\n\n')}`);
-  }
-  if (contextParts.length > 0) {
-    promptParts.push(`---\n\nThe user is currently viewing these files:\n\n${contextParts.join('\n\n---\n\n')}`);
-  }
+    if (initContextBlocks.length > 0) {
+      promptParts.push(`---\n\nInitialization context:\n\n${initContextBlocks.join('\n\n---\n\n')}`);
+    }
-  if (uploadedParts.length > 0) {
-    promptParts.push(
-      `---\n\n## ⚠️ USER-UPLOADED FILES (ACTIVE ATTACHMENTS)\n\n` +
-      `The user has uploaded the following file(s) in this conversation. ` +
-      `Their FULL CONTENT is provided below. You MUST use this content directly when the user refers to these files. ` +
-      `Do NOT use read_file or search tools to find them — they exist only here, not in the knowledge base.\n\n` +
-      uploadedParts.join('\n\n---\n\n'),
-    );
-  }
+    if (contextParts.length > 0) {
+      promptParts.push(`---\n\nThe user is currently viewing these files:\n\n${contextParts.join('\n\n---\n\n')}`);
+    }
-  const systemPrompt = promptParts.join('\n\n');
+    if (uploadedParts.length > 0) {
+      promptParts.push(
+        `---\n\n## ⚠️ USER-UPLOADED FILES (ACTIVE ATTACHMENTS)\n\n` +
+        `The user has uploaded the following file(s) in this conversation. ` +
+        `Their FULL CONTENT is provided below. You MUST use this content directly when the user refers to these files. ` +
+        `Do NOT use read_file or search tools to find them — they exist only here, not in the knowledge base.\n\n` +
+        uploadedParts.join('\n\n---\n\n'),
+      );
+    }
-  const useStreaming = agentConfig.useStreaming !== false;
+    systemPrompt = promptParts.join('\n\n');
+  }
   try {
     const { model, modelName, apiKey, provider } = getModelConfig();
-    // ── Non-streaming path (auto-detected or cached) ──
-    // When test-key detected streaming incompatibility, or a previous request
-    // failed and cached the result, go directly to non-streaming.
-    const cacheKey = `${provider}:${model.id}:${model.baseUrl ?? ''}`;
-    if (!useStreaming || isStreamingBlacklisted(cacheKey)) {
-      if (isStreamingBlacklisted(cacheKey)) {
-        console.log(`[ask] Using non-streaming mode (cached failure for ${cacheKey})`);
-      }
-      return await handleNonStreaming({
-        provider, apiKey, model, systemPrompt, messages, modelName,
-      });
-    }
-    // ── Streaming path (default) ──
     // Convert frontend messages to AgentMessage[]
     const agentMessages = toAgentMessages(messages);
@@ -458,7 +449,7 @@ export async function POST(req: NextRequest) {
     // Capture API key for this request — safe since each POST creates a new Agent instance.
     const requestApiKey = apiKey;
     const projectRoot = process.env.MINDOS_PROJECT_ROOT || path.resolve(process.cwd(), '..');
-    const requestTools = await getRequestScopedTools();
+    const requestTools = isOrganizeMode ? getOrganizeTools() : await getRequestScopedTools();
     const customTools = toPiCustomToolDefinitions(requestTools);
     const authStorage = AuthStorage.create();
@@ -612,27 +603,10 @@ export async function POST(req: NextRequest) {
           }
         });
-        session.prompt(lastUserContent).then(async () => {
+        session.prompt(lastUserContent).then(() => {
           metrics.recordRequest(Date.now() - requestStartTime);
           if (!hasContent && lastModelError) {
-            // Streaming failed — auto-retry with non-streaming fallback.
-            // Cache the failure so subsequent requests skip streaming entirely.
-            console.warn(`[ask] Streaming failed for ${modelName}, retrying non-streaming: ${lastModelError}`);
-            streamingBlacklist.set(cacheKey, Date.now());
-            // No visible hint needed — the fallback is transparent to the user
-            try {
-              const fallbackResult = await directNonStreamingCall({
-                provider, apiKey, model, systemPrompt, messages, modelName,
-              });
-              if (fallbackResult) {
-                send({ type: 'text_delta', delta: fallbackResult });
-                send({ type: 'done' });
-              } else {
-                send({ type: 'error', message: lastModelError });
-              }
-            } catch (fallbackErr) {
-              send({ type: 'error', message: lastModelError });
-            }
+            send({ type: 'error', message: lastModelError });
           } else {
             send({ type: 'done' });
           }
@@ -663,145 +637,3 @@ export async function POST(req: NextRequest) {
   }
 }
-// ---------------------------------------------------------------------------
-// Non-streaming — direct /chat/completions call (no SSE, no tools)
-// ---------------------------------------------------------------------------
-interface NonStreamingOpts {
-  provider: 'anthropic' | 'openai';
-  apiKey: string;
-  model: { id: string; baseUrl?: string; maxTokens?: number };
-  systemPrompt: string;
-  messages: FrontendMessage[];
-  modelName: string;
-}
-/**
- * Core non-streaming API call. Returns the response text or throws.
- * Used by both the direct non-streaming path and the auto-fallback.
- */
-async function directNonStreamingCall(opts: NonStreamingOpts): Promise<string> {
-  const { provider, apiKey, model, systemPrompt, messages, modelName } = opts;
-  const ctrl = new AbortController();
-  const timeout = setTimeout(() => ctrl.abort(), 120_000);
-  try {
-    if (provider === 'openai') {
-      const baseUrl = (model.baseUrl || 'https://api.openai.com/v1').replace(/\/+$/, '');
-      const url = `${baseUrl}/chat/completions`;
-      const apiMessages = [
-        { role: 'system', content: systemPrompt },
-        ...messages.map(m => ({ role: m.role, content: m.content })),
-      ];
-      const res = await fetch(url, {
-        method: 'POST',
-        headers: { 'Content-Type': 'application/json', Authorization: `Bearer ${apiKey}` },
-        body: JSON.stringify({
-          model: model.id,
-          messages: apiMessages,
-          stream: false,
-          max_tokens: model.maxTokens ?? 16_384,
-        }),
-        signal: ctrl.signal,
-      });
-      if (!res.ok) {
-        const body = await res.text().catch(() => '');
-        throw new Error(`API returned ${res.status}: ${body.slice(0, 500)}`);
-      }
-      const json = await res.json();
-      return json?.choices?.[0]?.message?.content ?? '';
-    }
-    // Anthropic
-    const url = 'https://api.anthropic.com/v1/messages';
-    const apiMessages = messages.map(m => ({ role: m.role, content: m.content }));
-    const res = await fetch(url, {
-      method: 'POST',
-      headers: {
-        'Content-Type': 'application/json',
-        'x-api-key': apiKey,
-        'anthropic-version': '2023-06-01',
-      },
-      body: JSON.stringify({
-        model: model.id,
-        system: systemPrompt,
-        messages: apiMessages,
-        max_tokens: model.maxTokens ?? 8_192,
-      }),
-      signal: ctrl.signal,
-    });
-    if (!res.ok) {
-      const body = await res.text().catch(() => '');
-      throw new Error(`API returned ${res.status}: ${body.slice(0, 500)}`);
-    }
-    const json = await res.json();
-    const blocks = json?.content;
-    if (Array.isArray(blocks)) {
-      return blocks.filter((b: any) => b.type === 'text').map((b: any) => b.text).join('');
-    }
-    return '';
-  } finally {
-    clearTimeout(timeout);
-  }
-}
-/**
- * Full non-streaming response handler — wraps directNonStreamingCall
- * and returns an SSE-formatted Response for the client.
- */
-async function handleNonStreaming(opts: NonStreamingOpts): Promise<Response> {
-  const { modelName } = opts;
-  const requestStartTime = Date.now();
-  const encoder = new TextEncoder();
-  try {
-    const text = await directNonStreamingCall(opts);
-    metrics.recordRequest(Date.now() - requestStartTime);
-    if (!text) {
-      metrics.recordError();
-      return sseResponse(encoder, { type: 'error', message: `[non-streaming] ${modelName} returned empty response` });
-    }
-    console.log(`[ask] Non-streaming response from ${modelName}: ${text.length} chars`);
-    const stream = new ReadableStream({
-      start(controller) {
-        controller.enqueue(encoder.encode(`data:${JSON.stringify({ type: 'text_delta', delta: text })}\n\n`));
-        controller.enqueue(encoder.encode(`data:${JSON.stringify({ type: 'done' })}\n\n`));
-        controller.close();
-      },
-    });
-    return new Response(stream, { headers: sseHeaders() });
-  } catch (err) {
-    metrics.recordRequest(Date.now() - requestStartTime);
-    metrics.recordError();
-    const message = err instanceof Error ? err.message : String(err);
-    console.error(`[ask] Non-streaming request failed:`, message);
-    return sseResponse(encoder, { type: 'error', message });
-  }
-}
-function sseResponse(encoder: TextEncoder, event: MindOSSSEvent): Response {
-  const stream = new ReadableStream({
-    start(controller) {
-      controller.enqueue(encoder.encode(`data:${JSON.stringify(event)}\n\n`));
-      controller.close();
-    },
-  });
-  return new Response(stream, { headers: sseHeaders() });
-}
-function sseHeaders(): HeadersInit {
-  return {
-    'Content-Type': 'text/event-stream',
-    'Cache-Control': 'no-cache, no-transform',
-    'Connection': 'keep-alive',
-    'X-Accel-Buffering': 'no',
-  };
-}

package/app/app/api/settings/test-key/route.ts CHANGED

@@ -46,7 +46,7 @@ async function testAnthropic(apiKey: string, model: string): Promise<{ ok: boole
   }
 }
-async function testOpenAI(apiKey: string, model: string, baseUrl: string): Promise<{ ok: boolean; latency?: number; code?: ErrorCode; error?: string; streamingSupported?: boolean }> {
+async function testOpenAI(apiKey: string, model: string, baseUrl: string): Promise<{ ok: boolean; latency?: number; code?: ErrorCode; error?: string }> {
   const start = Date.now();
   const ctrl = new AbortController();
   const timer = setTimeout(() => ctrl.abort(), TIMEOUT);
@@ -58,7 +58,7 @@ async function testOpenAI(apiKey: string, model: string, baseUrl: string): Promi
         'Content-Type': 'application/json',
         'Authorization': `Bearer ${apiKey}`,
       },
-      body: JSON.stringify({ model, max_tokens: 1, messages: [{ role: 'user', content: 'hi' }] }),
+      body: JSON.stringify({ model, messages: [{ role: 'user', content: 'hi' }] }),
       signal: ctrl.signal,
     });
     const latency = Date.now() - start;
@@ -76,7 +76,6 @@ async function testOpenAI(apiKey: string, model: string, baseUrl: string): Promi
       },
       body: JSON.stringify({
         model,
-        max_tokens: 1,
         messages: [
           { role: 'system', content: 'You are a helpful assistant.' },
           { role: 'user', content: 'hi' },
@@ -107,50 +106,7 @@ async function testOpenAI(apiKey: string, model: string, baseUrl: string): Promi
       };
     }
-    // Streaming compatibility test — `/api/ask` uses SSE streaming by default.
-    // Many proxies pass non-streaming tests but fail at streaming.
-    // If streaming fails, we still report ok: true (basic chat works via non-streaming fallback).
-    let streamingSupported = true;
-    try {
-      const streamRes = await fetch(url, {
-        method: 'POST',
-        headers: {
-          'Content-Type': 'application/json',
-          'Authorization': `Bearer ${apiKey}`,
-        },
-        body: JSON.stringify({
-          model,
-          max_tokens: 5,
-          stream: true,
-          messages: [{ role: 'user', content: 'Say OK' }],
-        }),
-        signal: ctrl.signal,
-      });
-      if (!streamRes.ok) {
-        streamingSupported = false;
-      } else {
-        const reader = streamRes.body?.getReader();
-        if (reader) {
-          const decoder = new TextDecoder();
-          let gotData = false;
-          try {
-            while (true) {
-              const { done, value } = await reader.read();
-              if (done) break;
-              const text = decoder.decode(value, { stream: true });
-              if (text.includes('data:')) { gotData = true; break; }
-            }
-          } finally {
-            reader.releaseLock();
-          }
-          if (!gotData) streamingSupported = false;
-        }
-      }
-    } catch {
-      streamingSupported = false;
-    }
-    return { ok: true, latency, streamingSupported };
+    return { ok: true, latency };
   } catch (e: unknown) {
     if (e instanceof Error && e.name === 'AbortError') return { ok: false, code: 'network_error', error: 'Request timed out' };
     return { ok: false, code: 'network_error', error: e instanceof Error ? e.message : 'Network error' };

package/app/components/settings/AiTab.tsx CHANGED

@@ -14,7 +14,6 @@ interface TestResult {
   latency?: number;
   error?: string;
   code?: ErrorCode;
-  streamingSupported?: boolean;
 }
 function errorMessage(t: AiTabProps['t'], code?: ErrorCode): string {
@@ -73,12 +72,7 @@ export function AiTab({ data, updateAi, updateAgent, t }: AiTabProps) {
       const json = await res.json();
       if (json.ok) {
-        const streamingSupported = json.streamingSupported !== false;
-        setTestResult(prev => ({ ...prev, [providerName]: { state: 'ok', latency: json.latency, streamingSupported } }));
-        // Auto-persist streaming capability so /api/ask uses the right path
-        if (providerName === data.ai.provider) {
-          updateAgent({ useStreaming: streamingSupported });
-        }
+        setTestResult(prev => ({ ...prev, [providerName]: { state: 'ok', latency: json.latency } }));
         if (okTimerRef.current) clearTimeout(okTimerRef.current);
         okTimerRef.current = setTimeout(() => {
           setTestResult(prev => ({ ...prev, [providerName]: { state: 'idle' } }));
@@ -146,9 +140,6 @@ export function AiTab({ data, updateAi, updateAgent, t }: AiTabProps) {
         {result.state === 'ok' && result.latency != null && (
           <span className="text-xs text-success">
             {t.settings.ai.testKeyOk(result.latency)}
-            {result.streamingSupported === false && (
-              <span className="text-muted-foreground ml-1.5">{t.settings.ai.streamingFallback}</span>
-            )}
           </span>
         )}
         {result.state === 'error' && (

package/app/components/settings/types.ts CHANGED Viewed

@@ -21,7 +21,6 @@ export interface AgentSettings {
   thinkingBudget?: number;
   contextStrategy?: 'auto' | 'off';
   reconnectRetries?: number;
-  useStreaming?: boolean;
 }
 export interface SettingsData {

package/app/hooks/useAiOrganize.ts CHANGED Viewed

@@ -281,6 +281,7 @@ export function useAiOrganize() {
           messages,
           uploadedFiles: truncatedFiles,
           maxSteps: 15,
+          mode: 'organize',
         }),
         signal: controller.signal,
       });

package/app/lib/agent/model.ts CHANGED Viewed

@@ -57,6 +57,8 @@ export function getModelConfig(): {
     // For custom proxy endpoints, set conservative compat flags.
     // Most proxies (Azure, Bedrock relays, corporate gateways) only support
     // a subset of OpenAI's features. These defaults prevent silent failures.
+    // NOTE: maxTokensField is NOT overridden — pi-ai auto-detects the correct
+    // field based on URL (defaults to max_completion_tokens for modern APIs).
     if (hasCustomBase) {
       model = {
         ...model,
@@ -68,7 +70,6 @@ export function getModelConfig(): {
           supportsReasoningEffort: false,
           supportsUsageInStreaming: false,
           supportsStrictMode: false,
-          maxTokensField: 'max_tokens' as const,
         },
       };
       if (customApiVariant) {

package/app/lib/agent/prompt.ts CHANGED Viewed

@@ -35,3 +35,26 @@ Persona: Methodical, strictly objective, execution-oriented. Zero fluff. Never u
 - Reply in the user's language.
 - Use clean Markdown (tables, lists, bold).
 - End with concrete next actions if the task is incomplete.`;
+/**
+ * Lean system prompt for "organize uploaded files" mode.
+ *
+ * Design goal: ~200 tokens (vs ~600 for general). Strips everything the
+ * organize task doesn't need: anti-hallucination (no KB Q&A), cite sources,
+ * smart recovery, skills/MCP discovery, output formatting.
+ *
+ * The full SKILL.md is NOT loaded in organize mode — only the bootstrap
+ * README.md (for KB structure awareness) is injected by route.ts.
+ */
+export const ORGANIZE_SYSTEM_PROMPT = `You are MindOS Agent — an expert at organizing information into a local Markdown knowledge base.
+Your ONLY job: read the user's uploaded files, extract key information, and save well-structured Markdown notes into the knowledge base using file tools.
+Rules:
+1. Read uploaded file content from the "USER-UPLOADED FILES" section below — do NOT call read tools on them.
+2. Use \`list_files\` to understand the existing KB structure before deciding where to place notes.
+3. Create new files or update existing ones. Prefer \`create_file\` for new content, \`update_section\` / \`append_to_file\` for additions to existing files.
+4. Match the language of the source files when writing notes.
+5. Batch parallel tool calls in a single turn for efficiency.
+6. Do NOT write to the KB root directory — place files under the most fitting subdirectory.
+7. After writing, provide a brief summary of what you created/updated.`;

package/app/lib/agent/tools.ts CHANGED Viewed

@@ -173,6 +173,18 @@ export const WRITE_TOOLS = new Set([
   'update_section', 'edit_lines', 'delete_file', 'rename_file', 'move_file', 'append_csv',
 ]);
+/** Tool names sufficient for the "organize uploaded files" task. */
+const ORGANIZE_TOOL_NAMES = new Set([
+  'list_files', 'read_file', 'search',
+  'create_file', 'batch_create_files', 'write_file',
+  'append_to_file', 'insert_after_heading', 'update_section',
+]);
+/** Lean tool set for organize mode — skips MCP discovery, history, backlinks, etc. */
+export function getOrganizeTools(): AgentTool<any>[] {
+  return knowledgeBaseTools.filter(t => ORGANIZE_TOOL_NAMES.has(t.name));
+}
 export async function getRequestScopedTools(): Promise<AgentTool<any>[]> {
   try {
     const result = await listMcporterServers();

package/app/lib/i18n-en.ts CHANGED Viewed

@@ -844,7 +844,6 @@ export const en = {
       testKeyUnknown: 'Test failed',
       listModels: 'Browse',
       noModelsFound: 'No models found',
-      streamingFallback: '(will use standard mode)',
     },
     agent: {
       title: 'Agent Behavior',

package/app/lib/i18n-zh.ts CHANGED Viewed

@@ -868,7 +868,6 @@ export const zh = {
       testKeyUnknown: '测试失败',
       listModels: '选择模型',
       noModelsFound: '未找到可用模型',
-      streamingFallback: '（将使用标准模式）',
     },
     agent: {
       title: 'Agent 行为',

package/app/lib/settings.ts CHANGED Viewed

@@ -24,7 +24,6 @@ export interface AgentConfig {
   thinkingBudget?: number;    // default 5000
   contextStrategy?: 'auto' | 'off'; // default 'auto'
   reconnectRetries?: number;  // default 3, range 0-10 (0 = disabled)
-  useStreaming?: boolean;     // default true; false = non-streaming fallback for proxy compat
 }
 export interface GuideState {
@@ -131,7 +130,6 @@ function parseAgent(raw: unknown): AgentConfig | undefined {
   if (typeof obj.thinkingBudget === 'number') result.thinkingBudget = Math.min(50000, Math.max(1000, obj.thinkingBudget));
   if (obj.contextStrategy === 'auto' || obj.contextStrategy === 'off') result.contextStrategy = obj.contextStrategy;
   if (typeof obj.reconnectRetries === 'number') result.reconnectRetries = Math.min(10, Math.max(0, obj.reconnectRetries));
-  if (typeof obj.useStreaming === 'boolean') result.useStreaming = obj.useStreaming;
   return Object.keys(result).length > 0 ? result : undefined;
 }

package/package.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "@geminilight/mindos",
-  "version": "0.6.19",
+  "version": "0.6.20",
   "description": "MindOS — Human-Agent Collaborative Mind System. Local-first knowledge base that syncs your mind to all AI Agents via MCP.",
   "keywords": [
     "mindos",