npm - agentmap - Versions diffs - 0.8.0 → 0.9.0 - Mend

agentmap 0.8.0 → 0.9.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (83) hide show

package/CHANGELOG.md +96 -0
package/README.md +24 -0
package/dist/cli.js +37 -12
package/dist/cli.js.map +1 -1
package/dist/extract/definitions.js +12 -12
package/dist/extract/definitions.js.map +1 -1
package/dist/extract/definitions.test.js +30 -259
package/dist/extract/definitions.test.js.map +1 -1
package/dist/extract/git-status.d.ts +7 -2
package/dist/extract/git-status.d.ts.map +1 -1
package/dist/extract/git-status.js +12 -18
package/dist/extract/git-status.js.map +1 -1
package/dist/extract/markdown.js +1 -1
package/dist/extract/markdown.test.js +3 -3
package/dist/extract/markdown.test.js.map +1 -1
package/dist/extract/marker.js +1 -1
package/dist/extract/marker.test.js +4 -4
package/dist/extract/marker.test.js.map +1 -1
package/dist/index.d.ts +4 -1
package/dist/index.d.ts.map +1 -1
package/dist/index.js +5 -4
package/dist/index.js.map +1 -1
package/dist/logger.d.ts +10 -0
package/dist/logger.d.ts.map +1 -0
package/dist/logger.js +41 -0
package/dist/logger.js.map +1 -0
package/dist/map/builder.d.ts.map +1 -1
package/dist/map/builder.js +23 -12
package/dist/map/builder.js.map +1 -1
package/dist/map/builder.test.d.ts +2 -0
package/dist/map/builder.test.d.ts.map +1 -0
package/dist/map/builder.test.js +66 -0
package/dist/map/builder.test.js.map +1 -0
package/dist/map/truncate.d.ts +7 -3
package/dist/map/truncate.d.ts.map +1 -1
package/dist/map/truncate.js +80 -11
package/dist/map/truncate.js.map +1 -1
package/dist/scanner.d.ts.map +1 -1
package/dist/scanner.js +164 -65
package/dist/scanner.js.map +1 -1
package/dist/scanner.test.d.ts +2 -0
package/dist/scanner.test.d.ts.map +1 -0
package/dist/scanner.test.js +84 -0
package/dist/scanner.test.js.map +1 -0
package/dist/test-helpers/git-test-helpers.d.ts +13 -0
package/dist/test-helpers/git-test-helpers.d.ts.map +1 -0
package/dist/test-helpers/git-test-helpers.js +48 -0
package/dist/test-helpers/git-test-helpers.js.map +1 -0
package/dist/types.d.ts +15 -1
package/dist/types.d.ts.map +1 -1
package/package.json +15 -3
package/src/cli.ts +164 -0
package/src/extract/definitions.test.ts +2040 -0
package/src/extract/definitions.ts +379 -0
package/src/extract/git-status.test.ts +507 -0
package/src/extract/git-status.ts +359 -0
package/src/extract/markdown.test.ts +159 -0
package/src/extract/markdown.ts +202 -0
package/src/extract/marker.test.ts +566 -0
package/src/extract/marker.ts +398 -0
package/src/extract/submodules.test.ts +95 -0
package/src/extract/submodules.ts +269 -0
package/src/extract/utils.ts +27 -0
package/src/index.ts +106 -0
package/src/languages/cpp.ts +129 -0
package/src/languages/go.ts +72 -0
package/src/languages/index.ts +231 -0
package/src/languages/javascript.ts +33 -0
package/src/languages/python.ts +41 -0
package/src/languages/rust.ts +72 -0
package/src/languages/typescript.ts +74 -0
package/src/languages/zig.ts +106 -0
package/src/logger.ts +55 -0
package/src/map/builder.test.ts +72 -0
package/src/map/builder.ts +175 -0
package/src/map/truncate.ts +188 -0
package/src/map/yaml.ts +66 -0
package/src/parser/index.ts +53 -0
package/src/parser/languages.ts +64 -0
package/src/scanner.test.ts +95 -0
package/src/scanner.ts +364 -0
package/src/test-helpers/git-test-helpers.ts +62 -0
package/src/types.ts +191 -0

package/src/extract/marker.ts ADDED Viewed

@@ -0,0 +1,398 @@
+// Extract file header comment/docstring using tree-sitter.
+// Detects standard comment styles from existing projects.
+// Automatically skips license headers (Copyright, SPDX, etc.).
+import { parseCode, detectLanguage } from '../parser/index.js'
+import { readFirstLines } from './utils.js'
+import type { MarkerResult, Language, SyntaxNode } from '../types.js'
+export { extractMarkdownDescription } from './markdown.js'
+// Upper bound on how many leading lines of a file are read and parsed when searching for a header.
+const MAX_LINES = 50
+// Upper bound on description lines kept by truncateDescription before it appends a "... and N more lines" marker.
+const MAX_DESC_LINES = 20
+/**
+ * Patterns that strongly indicate a license/copyright comment.
+ * These are checked against comment text; a single match is enough for
+ * isLicenseComment to classify the comment as license boilerplate.
+ *
+ * All patterns are case-insensitive and carry no `g`/`y` flag, so calling
+ * `.test()` on them repeatedly is stateless.
+ */
+const LICENSE_PATTERNS = [
+  /\bcopyright\s*(?:\(c\)|©|\d{4})/i,   // "Copyright (c)", "Copyright ©", "Copyright 2024"
+  /\bspdx-license-identifier\s*:/i,     // "SPDX-License-Identifier: MIT"
+  /\ball rights reserved\b/i,           // Common in copyright notices
+  /\blicensed under\b/i,                // "Licensed under the MIT License", "Licensed under Apache 2.0"
+  /\bpermission is hereby granted\b/i,  // MIT license text
+  /\bredistribution and use\b/i,        // BSD license text
+  /\bthis source code is licensed\b/i,  // Meta/Facebook style
+  /\bwithout warranty\b/i,              // Common in license text
+  // MIT license text. No trailing \b: the phrase ends in a quote character, and a
+  // word boundary never occurs between `"` and following punctuation/whitespace/EOF,
+  // so a trailing \b would prevent the pattern from matching `"AS IS", WITHOUT ...`.
+  /\bthe software is provided "as is"/i,
+]
+/**
+ * Decide whether a comment body reads like license or copyright boilerplate.
+ * Returns true as soon as any entry of LICENSE_PATTERNS matches the text.
+ */
+function isLicenseComment(text: string): boolean {
+  for (const pattern of LICENSE_PATTERNS) {
+    if (pattern.test(text)) {
+      return true
+    }
+  }
+  return false
+}
+/**
+ * Join the given lines, trim the result, and cap it at MAX_DESC_LINES lines.
+ * When lines are dropped, a trailing "... and N more lines" line reports how many.
+ */
+function truncateDescription(lines: string[]): string {
+  const joined = lines.join('\n').trim()
+  const allLines = joined.split('\n')
+  const overflow = allLines.length - MAX_DESC_LINES
+  if (overflow <= 0) {
+    return joined
+  }
+  return [...allLines.slice(0, MAX_DESC_LINES), `... and ${overflow} more lines`].join('\n')
+}
+/**
+ * Read the top of a file and extract its header comment/docstring.
+ * The language is detected from the file path; the first MAX_LINES lines are
+ * then handed to extractMarkerFromCode for AST-based extraction.
+ *
+ * Comment styles handled downstream:
+ * - // line comments (JS/TS/Go/Rust)
+ * - /* block comments (JS/TS/Go/Rust)
+ * - # line comments (Python)
+ * - """ docstrings (Python)
+ * - //! inner doc comments (Rust)
+ *
+ * Resolves to `{ found: false }` when the language is not recognised or
+ * readFirstLines yields null (treated as an unreadable file and skipped silently).
+ */
+export async function extractMarker(filepath: string): Promise<MarkerResult> {
+  const language = detectLanguage(filepath)
+  if (language) {
+    const head = await readFirstLines(filepath, MAX_LINES)
+    if (head !== null) {
+      return extractMarkerFromCode(head, language)
+    }
+  }
+  return { found: false }
+}
+/**
+ * Extract the header comment/docstring from source text that is already in memory.
+ * Prefer this over extractMarker when the content has been read, to avoid a second read.
+ *
+ * Only the first MAX_LINES lines are parsed. The result has `found: false` when
+ * no header was located; otherwise `found: true`, with `description` left
+ * undefined if the extracted text is empty.
+ */
+export async function extractMarkerFromCode(code: string, language: Language): Promise<MarkerResult> {
+  // Parsing just the head keeps the cost independent of file size
+  const head = code.split('\n').slice(0, MAX_LINES).join('\n')
+  const { rootNode } = await parseCode(head, language)
+  const description = extractHeaderFromAST(rootNode, language)
+  return description === null
+    ? { found: false }
+    : { found: true, description: description || undefined }
+}
+/**
+ * Tell whether a node is a JS/TS directive prologue entry:
+ * an expression statement whose first child is exactly the string
+ * "use strict", "use client" or "use server" (either quote style).
+ */
+function isDirective(node: SyntaxNode): boolean {
+  if (node.type === 'expression_statement') {
+    const literal = node.child(0)
+    if (literal?.type === 'string') {
+      // The node text still includes its surrounding quotes
+      return /^["']use (strict|client|server)["']$/.test(literal.text)
+    }
+  }
+  return false
+}
+/**
+ * Derive the header description from the top-level children of the AST root.
+ *
+ * Order of operations:
+ * 1. A leading shebang (`hash_bang_line`, or a `comment` starting with `#!`) is captured.
+ * 2. Any directives ("use strict" etc.) that follow are skipped.
+ * 3. For Python, a leading string expression is treated as the module docstring;
+ *    if it looks like a license, the comments right after it are used instead.
+ * 4. Otherwise, if the next node is a comment, consecutive comments are collected
+ *    with leading license comments skipped.
+ *
+ * The shebang, when present, is prepended to the description on its own line.
+ * Returns null when the root has no children or nothing usable was found.
+ */
+function extractHeaderFromAST(root: SyntaxNode, language: Language): string | null {
+  const nodes = getChildren(root)
+  if (nodes.length === 0) {
+    return null
+  }
+  let cursor = 0
+  let shebang: string | null = null
+  // Shebang shows up as hash_bang_line in JS/TS and as a plain comment in Python/shell
+  const lead = nodes[0]
+  if (lead?.type === 'hash_bang_line' ||
+      (lead?.type === 'comment' && lead.text.startsWith('#!'))) {
+    shebang = lead.text.trim()
+    cursor = 1
+  }
+  // Step over directive statements such as "use strict" / "use client"
+  for (; cursor < nodes.length; cursor++) {
+    if (!isDirective(nodes[cursor])) {
+      break
+    }
+  }
+  if (cursor >= nodes.length) {
+    // Nothing left after the shebang/directives
+    return shebang
+  }
+  const head = nodes[cursor]
+  // Combine the captured shebang (if any) with a description (if any)
+  const prefixed = (desc: string | null): string | null => {
+    if (desc && shebang) {
+      return `${shebang}\n${desc}`
+    }
+    return desc ? desc : shebang
+  }
+  // Python module docstring: an expression_statement wrapping a string
+  if (language === 'python' && head.type === 'expression_statement') {
+    const literal = head.childForFieldName('expression') ?? head.child(0)
+    if (literal?.type === 'string') {
+      const docstring = extractPythonDocstring(literal)
+      const looksLikeLicense = Boolean(docstring) && isLicenseComment(docstring)
+      // A license docstring is ignored in favour of the comments directly after it
+      return looksLikeLicense
+        ? prefixed(extractConsecutiveComments(nodes, cursor + 1, language))
+        : prefixed(docstring)
+    }
+  }
+  // Leading comments, with license comments filtered out
+  if (isCommentNode(head)) {
+    return prefixed(extractConsecutiveCommentsSkipLicense(nodes, cursor, language))
+  }
+  return shebang
+}
+/**
+ * Starting at startIdx, find the first comment that has text and is not a
+ * license comment, then return the run of consecutive comments beginning there.
+ *
+ * Non-comment nodes, comments whose text extracts to null, and license
+ * comments are all stepped over. Returns null if no suitable comment exists.
+ */
+function extractConsecutiveCommentsSkipLicense(
+  children: SyntaxNode[],
+  startIdx: number,
+  language: Language
+): string | null {
+  for (let i = startIdx; i < children.length; i++) {
+    const candidate = children[i]
+    if (!isCommentNode(candidate)) {
+      continue
+    }
+    const text = extractCommentText(candidate, language)
+    if (text === null || isLicenseComment(text)) {
+      continue
+    }
+    // First real description comment: gather it and its direct successors
+    return extractConsecutiveComments(children, i, language)
+  }
+  return null
+}
+/**
+ * True when the node's type is one of the comment node types handled here
+ * (`comment`, `line_comment`, `block_comment`).
+ */
+function isCommentNode(node: SyntaxNode): boolean {
+  switch (node.type) {
+    case 'comment':
+    case 'line_comment':
+    case 'block_comment':
+      return true
+    default:
+      return false
+  }
+}
+/**
+ * Gather the text of the unbroken run of comment nodes starting at startIdx.
+ * Collection stops at the first non-comment node; comments whose text extracts
+ * to null contribute nothing. The combined lines go through truncateDescription.
+ */
+function extractConsecutiveComments(
+  children: SyntaxNode[],
+  startIdx: number,
+  language: Language
+): string {
+  const collected: string[] = []
+  let i = startIdx
+  while (i < children.length && isCommentNode(children[i])) {
+    const text = extractCommentText(children[i], language)
+    if (text !== null) {
+      collected.push(...text.split('\n'))
+    }
+    i++
+  }
+  return truncateDescription(collected)
+}
+/**
+ * Detect a TypeScript triple-slash reference directive (`/// <reference ...`).
+ * Such lines are compiler directives rather than descriptive comments.
+ * The text must begin with `///`, optional whitespace, then `<reference` and whitespace.
+ */
+function isReferenceDirective(text: string): boolean {
+  const referencePattern = /^\/\/\/\s*<reference\s/
+  return text.match(referencePattern) !== null
+}
+/**
+ * Turn a comment node into its plain text, without comment delimiters.
+ *
+ * Returns null for TypeScript triple-slash reference directives. Rust line
+ * comments use the `doc_comment` child when one exists; block comments go
+ * through extractBlockCommentText; `//` and `#` line comments go through
+ * stripLinePrefix; anything else is returned trimmed.
+ */
+function extractCommentText(node: SyntaxNode, language: Language): string | null {
+  const raw = node.text
+  // Reference directives are not descriptions
+  if (isReferenceDirective(raw)) {
+    return null
+  }
+  // Rust: doc comments expose their content as a doc_comment child
+  if (language === 'rust' && node.type === 'line_comment') {
+    const doc = findChild(node, 'doc_comment')
+    return doc ? doc.text.trim() : stripLinePrefix(raw, '//')
+  }
+  // /* ... */ and /** ... */, including Rust block_comment nodes
+  if (raw.startsWith('/*') || node.type === 'block_comment') {
+    return extractBlockCommentText(raw)
+  }
+  // Line comments: try // first, then #
+  for (const prefix of ['//', '#']) {
+    if (raw.startsWith(prefix)) {
+      return stripLinePrefix(raw, prefix)
+    }
+  }
+  return raw.trim()
+}
+/**
+ * Remove a line-comment prefix from the start of `text`.
+ *
+ * After dropping `prefix.length` characters, one extra marker character is
+ * removed for `//!` and `///` (prefix `//`) or `##` (prefix `#`), then a single
+ * leading space if present. Trailing whitespace is trimmed; any further
+ * leading whitespace is kept.
+ */
+function stripLinePrefix(text: string, prefix: string): string {
+  let rest = text.slice(prefix.length)
+  const marker = rest.charAt(0)
+  const isDocSlash = prefix === '//' && (marker === '!' || marker === '/')
+  const isDoubleHash = prefix === '#' && marker === '#'
+  if (isDocSlash || isDoubleHash) {
+    rest = rest.slice(1)
+  }
+  // Only one space is considered part of the prefix
+  if (rest.charAt(0) === ' ') {
+    rest = rest.slice(1)
+  }
+  return rest.trimEnd()
+}
+/**
+ * Reduce a block comment to its text content.
+ *
+ * The first two characters (the opening delimiter) are dropped, as is a
+ * closing delimiter if present and the extra `*` of a JSDoc opener. Each line
+ * is then trimmed and relieved of a leading `*` gutter, and the result is
+ * trimmed as a whole.
+ */
+function extractBlockCommentText(text: string): string {
+  let inner = text.slice(2)
+  if (inner.endsWith('*/')) {
+    inner = inner.slice(0, -2)
+  }
+  // JSDoc opener leaves one more asterisk behind
+  if (inner.startsWith('*')) {
+    inner = inner.slice(1)
+  }
+  const cleaned: string[] = []
+  for (const rawLine of inner.split('\n')) {
+    const line = rawLine.trim()
+    if (line === '*') {
+      // Bare gutter marks an empty line
+      cleaned.push('')
+    } else if (line.startsWith('* ')) {
+      cleaned.push(line.slice(2))
+    } else if (line.startsWith('*')) {
+      cleaned.push(line.slice(1).trim())
+    } else {
+      cleaned.push(line)
+    }
+  }
+  return cleaned.join('\n').trim()
+}
+/**
+ * Pull the text out of a Python string node used as a docstring.
+ *
+ * Uses the `string_content` child when the node has one. Otherwise falls back
+ * to the node's full text with leading/trailing triple quotes removed.
+ * Either way the text is trimmed and passed through truncateDescription.
+ */
+function extractPythonDocstring(node: SyntaxNode): string {
+  const body = findChild(node, 'string_content')
+  if (body) {
+    return truncateDescription(body.text.trim().split('\n'))
+  }
+  // Fallback: peel the triple quotes off the raw node text
+  const raw = node.text
+  const hasOpener = raw.startsWith('"""') || raw.startsWith("'''")
+  const afterOpener = hasOpener ? raw.slice(3) : raw
+  const hasCloser = afterOpener.endsWith('"""') || afterOpener.endsWith("'''")
+  const unquoted = hasCloser ? afterOpener.slice(0, -3) : afterOpener
+  return truncateDescription(unquoted.trim().split('\n'))
+}
+/**
+ * Collect a node's children, in order, into a plain array.
+ * Positions where `child(i)` yields a falsy value are left out.
+ */
+function getChildren(node: SyntaxNode): SyntaxNode[] {
+  return Array.from({ length: node.childCount }, (_, i) => node.child(i))
+    .filter((child): child is SyntaxNode => Boolean(child))
+}
+/**
+ * Return the first direct child whose type equals `type`, or null if none does.
+ */
+function findChild(node: SyntaxNode, type: string): SyntaxNode | null {
+  let index = 0
+  while (index < node.childCount) {
+    const candidate = node.child(index)
+    if (candidate?.type === type) {
+      return candidate
+    }
+    index += 1
+  }
+  return null
+}

package/src/extract/submodules.test.ts ADDED Viewed

@@ -0,0 +1,95 @@
+// Tests for submodule detection and parsing logic.
+import { describe, expect, test } from 'bun:test'
+import { getSubmodules, getSubmodulePaths } from './submodules.js'
+import { getAllDiffData, parseNumstat, parseDiff } from './git-status.js'
+// ============================================================================
+// Integration: submodule detection in current repo (no submodules expected)
+// ============================================================================
+// Runs getSubmodules against the current working directory.
+// NOTE(review): the expected `[]` holds only while the repo the tests run in has no submodules.
+describe('getSubmodules', () => {
+  test('returns empty array when repo has no submodules', () => {
+    const result = getSubmodules(process.cwd())
+    expect(result).toMatchInlineSnapshot(`[]`)
+  })
+})
+// Runs getSubmodulePaths against the current working directory and checks the returned collection's size.
+// NOTE(review): like the suite above, this depends on the working directory's repo having no submodules.
+describe('getSubmodulePaths', () => {
+  test('returns empty set when repo has no submodules', () => {
+    const result = getSubmodulePaths(process.cwd())
+    expect(result.size).toBe(0)
+  })
+})
+// ============================================================================
+// Diff filtering: submodule paths should be removed from diff output
+// ============================================================================
+// Covers how submodule entries flow through the diff helpers:
+// parseNumstat and parseDiff are fed literal git output, while getAllDiffData
+// is called on the current working directory with a set of paths to exclude.
+describe('diff submodule filtering', () => {
+  test('parseNumstat includes submodule pointer changes as 1/1', () => {
+    // Simulates what git diff --numstat outputs for a submodule pointer change
+    const output = `1\t1\tvendor/some-lib
+10\t5\tsrc/main.ts`
+    const result = parseNumstat(output)
+    // Without filtering, the submodule shows as 1 added / 1 deleted
+    expect(result.size).toBe(2)
+    expect(result.get('vendor/some-lib')).toMatchInlineSnapshot(`
+{
+  "added": 1,
+  "deleted": 1,
+}
+`)
+  })
+  test('getAllDiffData filters out submodule paths', () => {
+    const submodulePaths = new Set(['vendor/some-lib', 'external/utils'])
+    // This tests the filtering logic with real git commands on the current repo.
+    // Since this repo has no submodules, the filter set won't match anything,
+    // but we verify the function accepts the parameter without error.
+    const result = getAllDiffData(process.cwd(), submodulePaths)
+    expect(result.fileStats).toBeDefined()
+    expect(result.fileDiffs).toBeDefined()
+    // Verify submodule paths are not in the results
+    // NOTE(review): only 'vendor/some-lib' is checked; 'external/utils' is in the set but never asserted.
+    expect(result.fileStats.has('vendor/some-lib')).toBe(false)
+    expect(result.fileDiffs.has('vendor/some-lib')).toBe(false)
+  })
+  test('parseDiff handles submodule pseudo-diff gracefully', () => {
+    // Git produces this pseudo-diff for submodule pointer changes
+    const diffOutput = `diff --git a/vendor/lib b/vendor/lib
+index abc1234..def5678 160000
+--- a/vendor/lib
++++ b/vendor/lib
+@@ -1 +1 @@
+-Subproject commit abc1234567890abcdef1234567890abcdef123456
++Subproject commit def5678901234567890abcdef1234567890abcdef`
+    const result = parseDiff(diffOutput)
+    // Parser will extract a hunk but it's meaningless for submodules.
+    // The important thing is it doesn't crash.
+    // Only the presence of the 'vendor/lib' key is asserted, not the hunk contents.
+    expect(result.has('vendor/lib')).toBe(true)
+    // In practice, getAllDiffData filters this out via submodulePaths
+  })
+})
+// ============================================================================
+// Builder: submodule entry formatting (tested via types)
+// ============================================================================
+// Pins the three label shapes: "<branch> @ <sha>", "detached @ <sha>", "uninitialized @ <sha>".
+// NOTE(review): each test compares a string literal with an identical inline snapshot and
+// calls no production code, so these cannot fail if the builder's formatting changes.
+describe('SubmoduleEntry format', () => {
+  test('formats initialized submodule with branch', () => {
+    // This tests the format that builder.ts produces
+    const label = 'main @ a1b2c3d'
+    expect(label).toMatchInlineSnapshot(`"main @ a1b2c3d"`)
+  })
+  test('formats detached HEAD submodule', () => {
+    const label = 'detached @ f4e5d6c'
+    expect(label).toMatchInlineSnapshot(`"detached @ f4e5d6c"`)
+  })
+  test('formats uninitialized submodule', () => {
+    const label = 'uninitialized @ abc1234'
+    expect(label).toMatchInlineSnapshot(`"uninitialized @ abc1234"`)
+  })
+})