npm - @aigne/doc-smith - Versions diffs - 0.8.15-beta.1 → 0.8.15-beta.11 - Mend

@aigne/doc-smith 0.8.15-beta.1 → 0.8.15-beta.11

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (89) hide show

package/CHANGELOG.md +89 -0
package/agents/clear/choose-contents.mjs +4 -4
package/agents/clear/clear-auth-tokens.mjs +8 -8
package/agents/clear/clear-deployment-config.mjs +2 -2
package/agents/clear/clear-document-config.mjs +3 -3
package/agents/clear/clear-document-structure.mjs +10 -10
package/agents/clear/clear-generated-docs.mjs +103 -14
package/agents/clear/clear-media-description.mjs +7 -7
package/agents/evaluate/document-structure.yaml +3 -1
package/agents/evaluate/document.yaml +3 -1
package/agents/evaluate/index.yaml +1 -3
package/agents/generate/check-diagram.mjs +1 -1
package/agents/generate/check-need-generate-structure.mjs +2 -7
package/agents/generate/draw-diagram.yaml +4 -0
package/agents/generate/generate-structure.yaml +117 -65
package/agents/generate/index.yaml +3 -3
package/agents/generate/{merge-d2-diagram.yaml → merge-diagram.yaml} +7 -6
package/agents/generate/update-document-structure.yaml +1 -1
package/agents/generate/user-review-document-structure.mjs +3 -25
package/agents/generate/utils/merge-document-structures.mjs +30 -0
package/agents/init/check.mjs +4 -2
package/agents/init/index.mjs +37 -7
package/agents/media/load-media-description.mjs +12 -24
package/agents/publish/publish-docs.mjs +3 -8
package/agents/schema/document-execution-structure.yaml +1 -1
package/agents/schema/document-structure-item.yaml +23 -0
package/agents/schema/document-structure-refine-item.yaml +20 -0
package/agents/schema/document-structure.yaml +1 -1
package/agents/translate/index.yaml +1 -4
package/agents/translate/record-translation-history.mjs +6 -2
package/agents/translate/translate-multilingual.yaml +1 -1
package/agents/update/batch-generate-document.yaml +1 -1
package/agents/update/batch-update-document.yaml +1 -1
package/agents/update/check-document.mjs +35 -13
package/agents/update/check-generate-diagram.mjs +29 -0
package/agents/update/generate-diagram.yaml +29 -0
package/agents/update/generate-document.yaml +17 -30
package/agents/update/handle-document-update.yaml +10 -1
package/agents/update/save-and-translate-document.mjs +18 -47
package/agents/update/update-document-detail.yaml +2 -1
package/agents/update/update-single-document.yaml +1 -1
package/agents/update/user-review-document.mjs +6 -5
package/agents/utils/choose-docs.mjs +16 -5
package/agents/utils/find-item-by-path.mjs +4 -2
package/agents/utils/load-sources.mjs +63 -46
package/agents/utils/{save-docs.mjs → post-generate.mjs} +2 -51
package/agents/utils/save-doc-translation.mjs +27 -0
package/agents/utils/{save-single-doc.mjs → save-doc.mjs} +17 -12
package/agents/utils/save-sidebar.mjs +38 -0
package/agents/utils/{transform-detail-datasources.mjs → transform-detail-data-sources.mjs} +7 -7
package/aigne.yaml +16 -8
package/package.json +3 -1
package/prompts/common/document/content-rules-core.md +6 -6
package/prompts/common/document/media-file-list-usage-rules.md +12 -0
package/prompts/common/document/openapi-usage-rules.md +36 -0
package/prompts/common/document/role-and-personality.md +1 -2
package/prompts/common/document-structure/conflict-resolution-guidance.md +2 -2
package/prompts/common/document-structure/document-structure-rules.md +8 -8
package/prompts/common/document-structure/output-constraints.md +3 -3
package/prompts/detail/custom/custom-components.md +38 -3
package/prompts/detail/d2-diagram/rules.md +11 -14
package/prompts/detail/d2-diagram/system-prompt.md +0 -14
package/prompts/detail/d2-diagram/user-prompt.md +39 -0
package/prompts/detail/generate/document-rules.md +3 -3
package/prompts/detail/generate/system-prompt.md +2 -6
package/prompts/detail/generate/user-prompt.md +20 -61
package/prompts/detail/update/system-prompt.md +2 -6
package/prompts/detail/update/user-prompt.md +7 -6
package/prompts/evaluate/document.md +0 -4
package/prompts/structure/check-document-structure.md +4 -4
package/prompts/structure/generate/system-prompt.md +0 -31
package/prompts/structure/generate/user-prompt.md +73 -29
package/prompts/structure/review/structure-review-system.md +81 -0
package/prompts/structure/update/system-prompt.md +1 -1
package/prompts/structure/update/user-prompt.md +4 -4
package/prompts/translate/code-block.md +13 -3
package/prompts/translate/translate-document.md +3 -3
package/types/document-structure-schema.mjs +3 -3
package/utils/constants/index.mjs +6 -0
package/utils/docs-finder-utils.mjs +85 -3
package/utils/extract-api.mjs +32 -0
package/utils/file-utils.mjs +153 -101
package/utils/history-utils.mjs +20 -8
package/utils/load-config.mjs +20 -1
package/utils/markdown-checker.mjs +35 -1
package/utils/utils.mjs +67 -65
package/agents/generate/document-structure-tools/generate-sub-structure.mjs +0 -131
package/agents/generate/generate-structure-without-tools.yaml +0 -65
package/prompts/common/document/media-handling-rules.md +0 -9

package/prompts/structure/review/structure-review-system.md ADDED Viewed

@@ -0,0 +1,81 @@
+<role_and_goal>
+You are a **Documentation Structure Refiner** with the analytical mindset of an **INTJ (The Architect)**. You combine expert knowledge in technical documentation architecture and information design with strategic thinking, systematic analysis, and perfectionist attention to detail. Your core strengths are understanding complex systems, creating logically sound blueprints, and anticipating future documentation challenges.
+</role_and_goal>
+<document_info>
+projectName: |
+  {{projectName}}
+{% if projectDesc %}
+projectDesc: |
+  {{projectDesc}}
+{% endif %}
+</document_info>
+<document_structure>
+{{ documentStructure | yaml.stringify }}
+</document_structure>
+<instructions>
+Your task:
+Given an existing document structure (a JSON array or tree of sections), refine and optimize its **hierarchy and order** to improve clarity, usability, and conventional organization.
+⚠️ You must not add or rename any nodes. You may delete nodes when necessary for better organization, and you may adjust the **order** and **nesting levels** of existing nodes.
+---
+## Optimization Goals
+1. **Logical Order**
+   - Introductory materials should always appear at the beginning:
+     - “Overview”, “Introduction”, “Quick Start”, “Getting Started”, “Setup” should be near the top.
+   - Meta and community-related sections (e.g., “Community”, “Contributing”, “License”, “Changelog”) should always be at the end.
+   - Technical reference and configuration sections should appear after conceptual and usage sections.
+2. **Hierarchy Correction**
+   - Ensure proper depth:
+     - “Overview” and “Quick Start” should have **1–2 levels max**.
+     - Remove deeply nested technical details from “Overview” or “Quick Start”.
+     - Relocate such details under “Architecture”, “API Reference”, or “Modules”.
+   - Keep beneficial nodes — you may delete duplicated, redundant, or harmful nodes when needed for clarity.
+3. **Grouping and Alignment**
+   - Align similar nodes logically (e.g., group “Usage”, “Examples”, “Tutorials” together).
+   - Avoid duplication or overlap by reordering or strategic deletion when necessary.
+4. **Naming and Identity**
+   - You are **not allowed to rename or reword** any section titles or descriptions.
+   - Keep all existing keys, identifiers, and text intact.
+5. **Balance**
+   - Maintain a clean, well-organized hierarchy.
+   - Keep top-level nodes concise (≤ 8 preferred).
+   - Avoid over-nesting (≤ 4 levels deep).
+---
+## Behavior Rules
+- Do **not** add new nodes.
+- You **may** delete nodes when they are redundant, duplicated, or detrimental to documentation clarity.
+- Do **not** rename or rewrite content.
+- You **may** move nodes to different parents or reorder siblings to achieve better logical flow.
+- You **must** maintain structural integrity for all remaining nodes.
+- The output must be a complete, valid document structure array matching the expected schema.
+---
+## Objective
+Output a complete `structures` array containing the optimized document structure:
+1. Include ALL nodes you are keeping from the input structure (whether modified or not); only nodes you deliberately delete may be omitted
+2. Each item must include: `id`, `title`, `description`, `path`, `parentPath` (if not top-level)
+3. Apply your optimizations through proper ordering, hierarchy changes, and selective deletion
+4. Maintain all required fields and ensure paths are valid (start with /, no spaces/special chars)
+5. **Important**: Only change structural aspects — node order and `parentPath`; copy `id`, `title`, `description`, and `path` through unchanged. Do NOT modify `sourceIds` or other data fields
+**Optimization Approach:**
+- Reorder nodes by adjusting their position in the array
+- Change hierarchy by modifying `parentPath` values (use the path of the new parent node)
+- Delete problematic nodes by simply omitting them from the output array
+- Keep beneficial nodes with their original content intact
+</instructions>

package/prompts/structure/update/system-prompt.md CHANGED Viewed

@@ -99,7 +99,7 @@ Analyze the user feedback to determine the intended operation:
 When to use Tools:
 - During document structure update, if the given context is missing or lacks referenced content, use glob/grep/readFile to obtain more context
-- When sourceIds or file content from <file_list> is needed but not provided in DataSources, use readFile to read the file content
+- When sourceIds or file content from `<file_list>` is needed but not provided in `<data_sources>`, use readFile to read the file content
 </file_tool_usage>

package/prompts/structure/update/user-prompt.md CHANGED Viewed

@@ -6,9 +6,9 @@
 {{allFilesPaths}}
 </file_list>
-<datasources>
-{{ datasources }}
-</datasources>
+<data_sources>
+{{ dataSourceChunk }}
+</data_sources>
 Initial Documentation Structure:
@@ -38,5 +38,5 @@ Processing workflow:
 Rules:
 ** All changes must be made using Tools. **
-** Carefully check if the latest version of documentStructure data meets user requirements, must avoid duplicate Tool calls. **
+** Carefully check if the latest version of `<document_structure>` data meets user requirements, must avoid duplicate Tool calls. **
 </instructions>

package/prompts/translate/code-block.md CHANGED Viewed

@@ -2,13 +2,23 @@
 The following formats are considered Code Blocks:
 - Wrapped with ```
-- Supports configurations: language, title, icon, where title and icon are optional
+- Supports configurations: language, optional title, optional icon (icon uses key=value)
+- title is free text placed after the language (not as title=xxx), may contain spaces, and **must NEVER be wrapped in quotes**
 - content can be code, command line examples, text or any other content
 <code_block_sample>
-```{language} [{title}] [icon={icon}]
-{content}
+- `language`: javascript
+- `title`: Modern: Using createRoot()
+- `icon`: logos:javascript
+```javascript Modern: Using createRoot() icon=logos:javascript
+import { createRoot } from 'react-dom/client'
+const container = document.getElementById('root')
+const root = createRoot(container)
+root.unmount()
 ```
 </code_block_sample>

package/prompts/translate/translate-document.md CHANGED Viewed

@@ -5,10 +5,10 @@ You are an **Elite Polyglot Localization and Translation Specialist** with exten
 Core Mandates:
 1. Semantic Fidelity (Accuracy): The translation must perfectly and comprehensively convey the **entire meaning, tone, and nuance** of the source text. **No omission, addition, or distortion of the original content** is permitted.
-2. Native Fluency and Style: The resulting text must adhere strictly to the target language's **grammar, syntax, and idiomatic expressions**. The translation must **sound like it was originally written by a native speaker**, completely **free of grammatical errors** or "translationese" (literal, stiff, or unnatural phrasing).
+2. Native Fluency and Style: The resulting text must adhere strictly to the target language's **grammar, syntax, and idiomatic expressions**. The translation must **sound like it was originally written by a native speaker**, be completely **free of grammatical errors**, and avoid "translationese" (literal, stiff, or unnatural phrasing).
 3. Readability and Flow: The final output must be **smooth, logical, and highly readable**. Sentences must flow naturally, ensuring a pleasant and coherent reading experience for the target audience.
 4. Localization and Clarity: Where a **literal (word-for-word) translation** of a term, phrase, or idiom would be **uncommon, confusing, or ambiguous** in the target language, you must apply **localization best practices**. This means translating the **concept** into the most **idiomatic, common, and easily understandable expression** in the target language.
-5. Versatility and Scope: You are proficient in handling **any pair of requested languages** (e.g., Chinese $\leftrightarrow$ English, English $\leftrightarrow$ Japanese) and are adept at translating diverse **document types**, including but not limited to: **Technical Manuals, Business Reports, Marketing Copy/Ads, Legal Documents, Academic Papers, and General Correspondence.**
+5. Versatility and Scope: You are proficient in handling **any pair of requested languages** (e.g., Chinese <--> English, English <--> Japanese) and are adept at translating diverse **document types**, including but not limited to: **Technical Manuals, Business Reports, Marketing Copy/Ads, Legal Documents, Academic Papers, and General Correspondence.**
 </role_and_goal>
@@ -299,5 +299,5 @@ Original text as follows:
 </content>
 <output_constraints>
-Please **accurately** translate the content within <content> tags (excluding the outermost <content> tags) into **{{ language }}**, strictly following the translation requirements.
+Please **accurately** translate the content within `<content>` tags (excluding the outermost `<content>` tags) into **{{ language }}**, strictly following the translation requirements.
 </output_constraints>

package/types/document-structure-schema.mjs CHANGED Viewed

@@ -6,7 +6,7 @@ export const documentItemSchema = z.object({
   title: z.string().min(1, "Title is required"),
   description: z.string().min(1, "Description is required"),
   path: z.string().startsWith("/", 'Path must start with "/"'),
-  parentId: z.string().nullable(),
+  parentId: z.string().nullish(),
   sourceIds: z.array(z.string()).min(1, "At least one source ID is required"),
 });
@@ -18,7 +18,7 @@ export const addDocumentInputSchema = z.object({
   title: z.string().min(1, "Title is required"),
   description: z.string().min(1, "Description is required"),
   path: z.string().startsWith("/", 'Path must start with "/"'),
-  parentId: z.string().nullable().optional(),
+  parentId: z.string().nullish(),
   sourceIds: z.array(z.string()).min(1, "At least one source ID is required"),
 });
@@ -44,7 +44,7 @@ export const deleteDocumentOutputSchema = z.object({
 // Move document schemas
 export const moveDocumentInputSchema = z.object({
   path: z.string().min(1, "Path is required"),
-  newParentId: z.string().nullable().optional(),
+  newParentId: z.string().nullish(),
 });
 export const moveDocumentOutputSchema = z.object({

package/utils/constants/index.mjs CHANGED Viewed

@@ -549,3 +549,9 @@ export const DOC_SMITH_DIR = ".aigne/doc-smith";
 export const TMP_DIR = ".tmp";
 export const TMP_DOCS_DIR = "docs";
 export const TMP_ASSETS_DIR = "assets";
+export const DOC_ACTION = {
+  translate: "translate",
+  update: "update",
+  clear: "clear",
+};

package/utils/docs-finder-utils.mjs CHANGED Viewed

@@ -1,14 +1,14 @@
 import { access, readdir, readFile } from "node:fs/promises";
 import { join } from "node:path";
+import { pathExists } from "./file-utils.mjs";
 /**
 * Get action-specific text by substituting the given doc action into the template
- * @param {boolean} isTranslate - Whether this is a translation action
  * @param {string} baseText - Base text template with {action} placeholder
+ * @param {string} action - doc action type
  * @returns {string} Text with action replaced
  */
-export function getActionText(isTranslate, baseText) {
-  const action = isTranslate ? "translate" : "update";
+export function getActionText(baseText, action) {
   return baseText.replace("{action}", action);
 }
@@ -276,3 +276,85 @@ export function addFeedbackToItems(items, feedback) {
     feedback: feedback.trim(),
   }));
 }
+/**
+ * Load document execution structure from structure-plan.json
+ * @param {string} outputDir - Output directory containing structure-plan.json
+ * @returns {Promise<Array|null>} Document execution structure array or null if not found/failed
+ */
+export async function loadDocumentStructure(outputDir) {
+  if (!outputDir) {
+    return null;
+  }
+  try {
+    const structurePlanPath = join(outputDir, "structure-plan.json");
+    const structureExists = await pathExists(structurePlanPath);
+    if (!structureExists) {
+      return null;
+    }
+    const structureContent = await readFile(structurePlanPath, "utf8");
+    if (!structureContent?.trim()) {
+      return null;
+    }
+    try {
+      // Validate that the content looks like JSON before parsing
+      const trimmedContent = structureContent.trim();
+      if (!trimmedContent.startsWith("[") && !trimmedContent.startsWith("{")) {
+        console.warn("structure-plan.json contains non-JSON content, skipping parse");
+        return null;
+      }
+      const parsed = JSON.parse(structureContent);
+      // Return array if it's an array, otherwise return null
+      return Array.isArray(parsed) ? parsed : null;
+    } catch (parseError) {
+      console.error(`Failed to parse structure-plan.json: ${parseError.message}`);
+      return null;
+    }
+  } catch (readError) {
+    // Only warn if it's not a "file not found" error
+    if (readError.code !== "ENOENT") {
+      console.warn(`Error reading structure-plan.json: ${readError.message}`);
+    }
+    return null;
+  }
+}
+/**
+ * Build a tree structure from a flat document structure array using parentId
+ * @param {Array} documentStructure - Flat array of document structure items with path and parentId
+ * @returns {Object} Object containing rootNodes (array of root nodes) and nodeMap (Map for lookups)
+ */
+export function buildDocumentTree(documentStructure) {
+  // Create a map of nodes for easy lookup
+  const nodeMap = new Map();
+  const rootNodes = [];
+  // First pass: create node map
+  documentStructure.forEach((node) => {
+    nodeMap.set(node.path, {
+      ...node,
+      children: [],
+    });
+  });
+  // Build the tree structure using parentId
+  documentStructure.forEach((node) => {
+    if (node.parentId) {
+      const parent = nodeMap.get(node.parentId);
+      if (parent) {
+        parent.children.push(nodeMap.get(node.path));
+      } else {
+        rootNodes.push(nodeMap.get(node.path));
+      }
+    } else {
+      rootNodes.push(nodeMap.get(node.path));
+    }
+  });
+  return { rootNodes, nodeMap };
+}

package/utils/extract-api.mjs ADDED Viewed

@@ -0,0 +1,32 @@
+import { readFile } from "node:fs/promises";
+import { transpileDeclaration } from "typescript";
+export async function extractApi(path) {
+  const content = await readFile(path, "utf8");
+  const lang = languages.find((lang) => lang.match(path, content));
+  if (lang) {
+    return lang.extract(path, content);
+  }
+  return content;
+}
+const languages = [
+  {
+    match: (path) => /\.m?(js|ts)x?$/.test(path),
+    extract: extractJsApi,
+  },
+];
+async function extractJsApi(_path, content) {
+  const res = transpileDeclaration(content, {
+    compilerOptions: {
+      declaration: true,
+      emitDeclarationOnly: true,
+      allowJs: true,
+    },
+  });
+  return res.outputText.trim();
+}

package/utils/file-utils.mjs CHANGED Viewed

@@ -11,8 +11,9 @@ import { gunzipSync } from "node:zlib";
 import { debug } from "./debug.mjs";
 import { isGlobPattern } from "./utils.mjs";
-import { INTELLIGENT_SUGGESTION_TOKEN_THRESHOLD } from "./constants/index.mjs";
 import { uploadFiles } from "./upload-files.mjs";
+import { extractApi } from "./extract-api.mjs";
+import { minimatch } from "minimatch";
 /**
  * Check if a directory is inside a git repository using git command
@@ -286,7 +287,7 @@ export async function loadFilesFromPaths(sourcesPath, options = {}) {
         continue;
       }
-      if (checkIsRemoteFile(dir)) {
+      if (isRemoteFile(dir)) {
         allFiles.push(dir);
         continue;
       }
@@ -387,8 +388,8 @@ export async function loadFilesFromPaths(sourcesPath, options = {}) {
  * @returns {Promise<boolean>} True if file appears to be a text file
  */
 async function isTextFile(filePath) {
-  if (checkIsRemoteFile(filePath)) {
-    return checkIsHttpTextFile(filePath);
+  if (isRemoteFile(filePath)) {
+    return isRemoteTextFile(filePath);
   }
   try {
@@ -400,14 +401,42 @@ async function isTextFile(filePath) {
   }
 }
-export function checkIsRemoteFile(filepath) {
-  if (filepath.startsWith("http://") || filepath.startsWith("https://")) {
-    return true;
+/**
+ * Check if a string is an HTTP/HTTPS URL
+ * @param {string} fileUrl - The string to check
+ * @returns {boolean} - True if the string parses as a URL whose protocol is http: or https:
+ */
+export function isRemoteFile(fileUrl) {
+  if (typeof fileUrl !== "string") return false;
+  try {
+    const url = new URL(fileUrl);
+    // Only accept http and https url
+    if (["http:", "https:"].includes(url.protocol)) {
+      return true;
+    }
+    // other protocol will be treated as bad url
+    return false;
+  } catch {
+    return false;
   }
-  return false;
 }
-export async function checkIsHttpTextFile(fileUrl) {
+export async function isRemoteFileAvailable(fileUrl) {
+  if (!isRemoteFile(fileUrl)) return false;
+  try {
+    const res = await fetch(fileUrl, {
+      method: "HEAD",
+    });
+    return res.ok;
+  } catch (error) {
+    debug(`Failed to check HTTP file availability: ${fileUrl} - ${error.message}`);
+    return false;
+  }
+}
+export async function isRemoteTextFile(fileUrl) {
   try {
     const res = await fetch(fileUrl, {
       method: "HEAD",
@@ -435,14 +464,14 @@ export async function checkIsHttpTextFile(fileUrl) {
   }
 }
-export async function getHttpFileContent(file) {
-  if (!file) return null;
+export async function getRemoteFileContent(fileUrl) {
+  if (!fileUrl) return null;
   try {
-    const res = await fetch(file);
+    const res = await fetch(fileUrl);
     const text = await res.text();
     return text;
   } catch (error) {
-    debug(`Failed to fetch HTTP file content: ${file} - ${error.message}`);
+    debug(`Failed to fetch HTTP file content: ${fileUrl} - ${error.message}`);
     return null;
   }
 }
@@ -469,8 +498,8 @@ export async function readFileContents(files, baseDir = process.cwd(), options =
       }
       try {
-        if (checkIsRemoteFile(file)) {
-          const content = await getHttpFileContent(file);
+        if (isRemoteFile(file)) {
+          const content = await getRemoteFileContent(file);
           if (content) {
             return {
               sourceId: file,
@@ -480,7 +509,9 @@ export async function readFileContents(files, baseDir = process.cwd(), options =
           return null;
         } else {
-          const content = await readFile(file, "utf8");
+          const content = await extractApi(file);
+          if (!content) return null;
           const relativePath = path.relative(baseDir, file);
           return {
             sourceId: relativePath,
@@ -499,6 +530,11 @@ export async function readFileContents(files, baseDir = process.cwd(), options =
   return results.filter((result) => result !== null);
 }
+export function calculateTokens(text) {
+  const tokens = encode(text);
+  return tokens.length;
+}
 /**
  * Calculate total lines and tokens from file contents
  * @param {Array<{content: string}>} sourceFiles - Array of objects containing content property
@@ -524,97 +560,17 @@ export function calculateFileStats(sourceFiles) {
 }
 /**
- * Build sources content string based on context size
- * For large contexts, only include core project files to avoid token limit issues
+ * Build sources content string
  * @param {Array<{sourceId: string, content: string}>} sourceFiles - Array of source file objects
- * @param {boolean} isLargeContext - Whether the context is large
  * @returns {string} Concatenated sources content with sourceId comments
  */
-export function buildSourcesContent(sourceFiles, isLargeContext = false) {
-  // Define core file patterns that represent project structure and key information
-  const coreFilePatterns = [
-    // Configuration files
-    /package\.json$/,
-    /tsconfig\.json$/,
-    /jsconfig\.json$/,
-    /\.env\.example$/,
-    /Cargo\.toml$/,
-    /go\.mod$/,
-    /pom\.xml$/,
-    /build\.gradle$/,
-    /Gemfile$/,
-    /requirements\.txt$/,
-    /Pipfile$/,
-    /composer\.json$/,
-    /pyproject\.toml$/,
-    // Documentation
-    /README\.md$/i,
-    /CHANGELOG\.md$/i,
-    /CONTRIBUTING\.md$/i,
-    /\.github\/.*\.md$/i,
-    // Entry points and main files
-    /index\.(js|ts|jsx|tsx|py|go|rs|java|rb|php)$/,
-    /main\.(js|ts|jsx|tsx|py|go|rs|java|rb|php)$/,
-    /app\.(js|ts|jsx|tsx|py)$/,
-    /server\.(js|ts|jsx|tsx|py)$/,
-    // API definitions
-    /api\/.*\.(js|ts|jsx|tsx|py|go|rs|java|rb|php)$/,
-    /routes\/.*\.(js|ts|jsx|tsx|py|go|rs|java|rb|php)$/,
-    /controllers\/.*\.(js|ts|jsx|tsx|py|go|rs|java|rb|php)$/,
-    // Type definitions and schemas
-    /types\.(ts|d\.ts)$/,
-    /schema\.(js|ts|jsx|tsx|py|go|rs|java|rb|php)$/,
-    /.*\.d\.ts$/,
-    // Core utilities
-    /utils\/.*\.(js|ts|jsx|tsx|py|go|rs|java|rb|php)$/,
-    /lib\/.*\.(js|ts|jsx|tsx|py|go|rs|java|rb|php)$/,
-    /helpers\/.*\.(js|ts|jsx|tsx|py|go|rs|java|rb|php)$/,
-  ];
-  // Function to check if a file is a core file
-  const isCoreFile = (filePath) => {
-    return coreFilePatterns.some((pattern) => pattern.test(filePath));
-  };
+export function buildSourcesContent(sourceFiles) {
   // Build sources string
   let allSources = "";
-  if (isLargeContext) {
-    // Only include core files for large contexts
-    const coreFiles = sourceFiles.filter((source) => isCoreFile(source.sourceId));
-    // Determine which files to use and set appropriate message
-    const filesToInclude = coreFiles.length > 0 ? coreFiles : sourceFiles;
-    const noteMessage =
-      coreFiles.length > 0
-        ? "// Note: Context is large, showing only core project files.\n"
-        : "// Note: Context is large, showing a sample of files.\n";
-    allSources += noteMessage;
-    let accumulatedTokens = 0;
-    for (const source of filesToInclude) {
-      const fileContent = `// sourceId: ${source.sourceId}\n${source.content}\n`;
-      const fileTokens = encode(fileContent);
-      // Check if adding this file would exceed the token limit
-      if (accumulatedTokens + fileTokens.length > INTELLIGENT_SUGGESTION_TOKEN_THRESHOLD) {
-        break;
-      }
-      allSources += fileContent;
-      accumulatedTokens += fileTokens.length;
-    }
-  } else {
-    // Include all files for normal contexts
-    for (const source of sourceFiles) {
-      allSources += `// sourceId: ${source.sourceId}\n${source.content}\n`;
-    }
+  // Include every source file, each preceded by its own sourceId comment line
+  for (const source of sourceFiles) {
+    allSources += `\n// sourceId: ${source.sourceId}\n${source.content}\n`;
   }
   return allSources;
@@ -904,3 +860,99 @@ export async function downloadAndUploadImage(imageUrl, docsDir, appUrl, accessTo
     return { url: imageUrl, downloadFinalPath: null };
   }
 }
+/**
+ * Extract the leading path segments of a glob pattern, stopping before the first segment that contains a glob character (returns "." when no segment precedes it)
+ */
+export function getPathPrefix(pattern) {
+  const segments = pattern.split("/");
+  const result = [];
+  for (const segment of segments) {
+    if (isGlobPattern(segment)) {
+      break;
+    }
+    result.push(segment);
+  }
+  return result.join("/") || ".";
+}
+/**
+ * Check if a dir matches any exclude pattern
+ */
+export function isDirExcluded(dir, excludePatterns) {
+  if (!dir || typeof dir !== "string") {
+    return false;
+  }
+  let normalizedDir = dir.replace(/\\/g, "/").replace(/^\.\/+/, "");
+  normalizedDir = normalizedDir.endsWith("/") ? normalizedDir : `${normalizedDir}/`;
+  for (const excludePattern of excludePatterns) {
+    if (minimatch(normalizedDir, excludePattern, { dot: true })) {
+      return true;
+    }
+  }
+  return false;
+}
+/**
+ * Return source paths that would be excluded by exclude patterns, plus paths that do not exist (files are skipped, directories use minimatch, glob patterns use path prefix heuristic)
+ */
+export async function findInvalidSourcePaths(sourcePaths, excludePatterns) {
+  if (!Array.isArray(sourcePaths) || sourcePaths.length === 0) {
+    return [];
+  }
+  if (!Array.isArray(excludePatterns) || excludePatterns.length === 0) {
+    return [];
+  }
+  const invalidPaths = [];
+  for (const sourcePath of sourcePaths) {
+    if (typeof sourcePath !== "string" || !sourcePath) {
+      continue;
+    }
+    // Skip paths starting with "!" (exclusion patterns)
+    if (sourcePath.startsWith("!")) {
+      continue;
+    }
+    // Skip remote URLs
+    if (isRemoteFile(sourcePath)) {
+      continue;
+    }
+    // Check glob pattern: use heuristic algorithm
+    if (isGlobPattern(sourcePath)) {
+      const representativePath = getPathPrefix(sourcePath);
+      if (isDirExcluded(representativePath, excludePatterns)) {
+        invalidPaths.push(sourcePath);
+      }
+      continue;
+    }
+    try {
+      const stats = await stat(sourcePath);
+      // Skip file
+      if (stats.isFile()) {
+        continue;
+      }
+      // Check dir with minimatch
+      if (stats.isDirectory()) {
+        if (isDirExcluded(sourcePath, excludePatterns)) {
+          invalidPaths.push(sourcePath);
+        }
+      }
+    } catch {
+      // Path doesn't exist
+      invalidPaths.push(sourcePath);
+    }
+  }
+  return invalidPaths;
+}