npm - @probelabs/probe - Version diff - 0.6.0-rc295 → 0.6.0-rc297 - Mend

@probelabs/probe 0.6.0-rc295 → 0.6.0-rc297

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (31)

package/README.md +7 -0
package/bin/binaries/{probe-v0.6.0-rc295-aarch64-apple-darwin.tar.gz → probe-v0.6.0-rc297-aarch64-apple-darwin.tar.gz} +0 -0
package/bin/binaries/{probe-v0.6.0-rc295-aarch64-unknown-linux-musl.tar.gz → probe-v0.6.0-rc297-aarch64-unknown-linux-musl.tar.gz} +0 -0
package/bin/binaries/{probe-v0.6.0-rc295-x86_64-apple-darwin.tar.gz → probe-v0.6.0-rc297-x86_64-apple-darwin.tar.gz} +0 -0
package/bin/binaries/{probe-v0.6.0-rc295-x86_64-pc-windows-msvc.zip → probe-v0.6.0-rc297-x86_64-pc-windows-msvc.zip} +0 -0
package/bin/binaries/{probe-v0.6.0-rc295-x86_64-unknown-linux-musl.tar.gz → probe-v0.6.0-rc297-x86_64-unknown-linux-musl.tar.gz} +0 -0
package/build/agent/ProbeAgent.d.ts +40 -2
package/build/agent/ProbeAgent.js +703 -11
package/build/agent/mcp/client.js +115 -4
package/build/agent/mcp/xmlBridge.js +13 -1
package/build/agent/otelLogBridge.js +184 -0
package/build/agent/simpleTelemetry.js +8 -0
package/build/delegate.js +75 -6
package/build/index.js +6 -2
package/build/tools/common.js +84 -11
package/build/tools/vercel.js +78 -18
package/cjs/agent/ProbeAgent.cjs +1095 -185
package/cjs/agent/simpleTelemetry.cjs +112 -0
package/cjs/index.cjs +1207 -185
package/index.d.ts +26 -0
package/package.json +2 -2
package/src/agent/ProbeAgent.d.ts +40 -2
package/src/agent/ProbeAgent.js +703 -11
package/src/agent/mcp/client.js +115 -4
package/src/agent/mcp/xmlBridge.js +13 -1
package/src/agent/otelLogBridge.js +184 -0
package/src/agent/simpleTelemetry.js +8 -0
package/src/delegate.js +75 -6
package/src/index.js +6 -2
package/src/tools/common.js +84 -11
package/src/tools/vercel.js +78 -18

package/build/tools/common.js CHANGED

@@ -10,7 +10,7 @@ import { resolve, isAbsolute } from 'path';
 export const searchSchema = z.object({
 	query: z.string().describe('Search query — natural language questions or Elasticsearch-style keywords both work. For keywords: use quotes for exact phrases, AND/OR for boolean logic, - for negation. Probe handles stemming and camelCase/snake_case splitting automatically, so do NOT try case or style variations of the same keyword.'),
 	path: z.string().optional().default('.').describe('Path to search in. For dependencies use "go:github.com/owner/repo", "js:package_name", or "rust:cargo_name" etc.'),
-	exact: z.boolean().optional().default(false).describe('Default (false) enables stemming and keyword splitting for exploratory search - "getUserData" matches "get", "user", "data", etc. Set true for precise symbol lookup where "getUserData" matches only "getUserData". Use true when you know the exact symbol name.'),
+	exact: z.boolean().optional().default(false).describe('Default (false) enables stemming and keyword splitting for exploratory search - "getUserData" matches "get", "user", "data", etc. Set true for precise symbol lookup OR when searching for strings with punctuation/quotes/empty values (e.g. \'description: ""\' — BM25 strips punctuation so exact=true is required for literal matching). Use true when you know the exact symbol name or need literal string matching.'),
 	maxTokens: z.number().nullable().optional().describe('Maximum tokens to return. Default is 20000. Set to null for unlimited results.'),
 	session: z.string().optional().describe('Session ID for result caching and pagination. Pass the session ID from a previous search to get additional results (next page). Results already shown in a session are automatically excluded. Omit for a fresh search.'),
 	nextPage: z.boolean().optional().default(false).describe('Set to true when requesting the next page of results. Requires passing the same session ID from the previous search output.')
@@ -188,9 +188,74 @@ export function areBothStuckResponses(response1, response2) {
 }
+/**
+ * Parse a shell-like string into tokens, respecting quoted substrings.
+ * Supports double quotes, single quotes, and escaped characters within quotes.
+ * Splits on commas and/or whitespace outside of quotes.
+ *
+ * @param {string} input - The string to tokenize
+ * @returns {string[]} Array of tokens with quotes stripped
+ *
+ * @example
+ * splitQuotedString('"path with spaces/file.md" other.rs')
+ * // Returns: ["path with spaces/file.md", "other.rs"]
+ */
+export function splitQuotedString(input) {
+	const tokens = [];
+	let current = '';
+	let inQuote = null; // null, '"', or "'"
+	let i = 0;
+	while (i < input.length) {
+		const ch = input[i];
+		if (inQuote) {
+			if (ch === '\\' && i + 1 < input.length) {
+				// Escaped character inside quotes — keep the literal character
+				current += input[i + 1];
+				i += 2;
+				continue;
+			}
+			if (ch === inQuote) {
+				// Closing quote
+				inQuote = null;
+				i++;
+				continue;
+			}
+			current += ch;
+			i++;
+		} else {
+			if (ch === '"' || ch === "'") {
+				inQuote = ch;
+				i++;
+				continue;
+			}
+			if (/[\s,]/.test(ch)) {
+				// Delimiter outside quotes
+				if (current.length > 0) {
+					tokens.push(current);
+					current = '';
+				}
+				i++;
+				continue;
+			}
+			current += ch;
+			i++;
+		}
+	}
+	if (current.length > 0) {
+		tokens.push(current);
+	}
+	return tokens;
+}
 /**
  * Parse targets string into array of file specifications
- * Handles both space-separated and comma-separated targets for extract tool
+ * Handles both space-separated and comma-separated targets for extract tool.
+ * Quoted strings (single or double) are preserved as single targets,
+ * allowing file paths with spaces.
  *
  * @param {string} targets - Space or comma-separated file targets (e.g., "file1.rs:10-20, file2.rs#symbol")
  * @returns {string[]} Array of individual file specifications
@@ -204,16 +269,15 @@ export function areBothStuckResponses(response1, response2) {
  * // Returns: ["file1.rs:10-20", "file2.rs:30-40"]
  *
  * @example
- * parseTargets("session.rs#AuthService.login auth.rs:2-100 config.rs#DatabaseConfig")
- * // Returns: ["session.rs#AuthService.login", "auth.rs:2-100", "config.rs#DatabaseConfig"]
+ * parseTargets('"Customers/First American/Meeting Notes.md" other.rs')
+ * // Returns: ["Customers/First American/Meeting Notes.md", "other.rs"]
  */
 export function parseTargets(targets) {
 	if (!targets || typeof targets !== 'string') {
 		return [];
 	}
-	// Split on any whitespace or comma (with optional surrounding whitespace) and filter out empty strings
-	return targets.split(/[\s,]+/).filter(f => f.length > 0);
+	return splitQuotedString(targets);
 }
 /**
@@ -227,7 +291,19 @@ export function parseTargets(targets) {
 export function parseAndResolvePaths(pathStr, cwd) {
 	if (!pathStr) return [];
-	// Split on comma and trim whitespace
+	// If the input contains quotes, use the quote-aware tokenizer which
+	// preserves quoted strings with spaces as single tokens.
+	if (/["']/.test(pathStr)) {
+		const paths = splitQuotedString(pathStr);
+		return paths.map(p => {
+			if (isAbsolute(p)) return p;
+			return cwd ? resolve(cwd, p) : p;
+		});
+	}
+	// No quotes: use comma-split + space-split heuristic (original behavior).
+	// Split on comma first, then auto-fix space-separated paths if each part
+	// looks like a file path.
 	let paths = pathStr.split(',').map(p => p.trim()).filter(p => p.length > 0);
 	// Auto-fix: model sometimes passes space-separated file paths as one string
@@ -242,10 +318,7 @@ export function parseAndResolvePaths(pathStr, cwd) {
 	// Resolve relative paths against cwd
 	return paths.map(p => {
-		if (isAbsolute(p)) {
-			return p;
-		}
-		// Resolve relative path against cwd
+		if (isAbsolute(p)) return p;
 		return cwd ? resolve(cwd, p) : p;
 	});
 }

package/build/tools/vercel.js CHANGED

@@ -254,6 +254,10 @@ function buildSearchDelegateTask({ searchQuery, searchPath, exact, language, all
 		'- Use exact=true when searching for a KNOWN symbol name (function, type, variable, struct).',
 		'- exact=true matches the literal string only — no stemming, no splitting.',
 		'- This is ideal for precise lookups: exact=true "ForwardMessage", exact=true "SessionLimiter", exact=true "ThrottleRetryLimit".',
+		'- IMPORTANT: Use exact=true when searching for strings containing punctuation, quotes, or empty values.',
+		'  Default BM25 search strips punctuation and treats quoted empty strings as noise.',
+		'  Example: searching for \'description: ""\' with exact=false will NOT find empty description fields — it just matches "description".',
+		'  Use exact=true for literal patterns like \'description: ""\', \'value: \\\'\\\'\', or any YAML/config field with specific punctuation.',
 		'- Do NOT use exact=true for exploratory/conceptual queries — use the default for those.',
 		'',
 		'Combining searches with OR:',
@@ -313,7 +317,13 @@ function buildSearchDelegateTask({ searchQuery, searchPath, exact, language, all
 		'WHEN TO STOP:',
 		'- After you have explored the main concept AND related subsystems.',
 		'- Once you have 5-15 targets covering different aspects of the query.',
-		'- If you get a "DUPLICATE SEARCH BLOCKED" message, move on.',
+		'- If you get a "DUPLICATE SEARCH BLOCKED" message, do NOT rephrase the same query — try a FUNDAMENTALLY different approach:',
+		'  * Switch between exact=true and exact=false',
+		'  * Search for a broader term and filter results manually',
+		'  * Use listFiles to browse the directory structure directly',
+		'  * Look for related/surrounding patterns instead of the exact string',
+		'- If 2-3 genuinely different search approaches fail, STOP and report what you tried and why it failed.',
+		'  Do NOT keep trying variations of the same failing concept.',
 		'',
 		'Strategy:',
 		'1. Analyze the query — identify key concepts, then brainstorm SYNONYMS and alternative terms for each.',
@@ -371,10 +381,10 @@ export const searchTool = (options = {}) => {
 		return result;
 	};
-	// Track previous non-paginated searches to detect and block duplicates
-	const previousSearches = new Set();
-	// Track how many times a duplicate search has been blocked (for escalating messages)
-	let consecutiveDupBlocks = 0;
+	// Track previous non-paginated searches: key → { hadResults: boolean }
+	const previousSearches = new Map();
+	// Track per-key consecutive block counts (not global, to avoid cross-query pollution)
+	const dupBlockCounts = new Map();
 	// Track pagination counts per query to cap runaway pagination
 	const paginationCounts = new Map();
 	const MAX_PAGES_PER_QUERY = 3;
@@ -444,22 +454,28 @@ export const searchTool = (options = {}) => {
 			if (!searchDelegate) {
 				// Block duplicate non-paginated searches (models sometimes repeat the exact same call)
 				// Allow pagination: only nextPage=true is a legitimate repeat of the same query
-				// Use query+exact as the key (ignore path) to prevent path-hopping evasion
-				// where model searches same term on different subpaths hoping for different results
-				const searchKey = `${searchQuery}::${exact || false}`;
+				// Include path in dedup key so same query across different repos is allowed (#520)
+				const searchKey = `${searchPath}::${searchQuery}::${exact || false}`;
 				if (!nextPage) {
 					if (previousSearches.has(searchKey)) {
-						consecutiveDupBlocks++;
+						const blockCount = (dupBlockCounts.get(searchKey) || 0) + 1;
+						dupBlockCounts.set(searchKey, blockCount);
 						if (debug) {
-							console.error(`[DEDUP] Blocked duplicate search (${consecutiveDupBlocks}x): "${searchQuery}" (path: "${searchPath}")`);
+							console.error(`[DEDUP] Blocked duplicate search (${blockCount}x): "${searchQuery}" (path: "${searchPath}")`);
 						}
-						if (consecutiveDupBlocks >= 3) {
-							return 'STOP. You have been blocked ' + consecutiveDupBlocks + ' times for repeating searches. You MUST output your final JSON answer NOW with whatever targets you have found. Do NOT call any more tools.';
+						if (blockCount >= 3) {
+							return 'STOP. You have been blocked ' + blockCount + ' times for repeating the same search. You MUST provide your final answer NOW with whatever information you have. Do NOT call any more tools.';
 						}
-						return 'DUPLICATE SEARCH BLOCKED (' + consecutiveDupBlocks + 'x). You already searched for this. Do NOT repeat — probe searches recursively across all paths. Either: (1) use extract on results you already found, (2) try a COMPLETELY different keyword, or (3) output your final answer NOW.';
+						const prev = previousSearches.get(searchKey);
+						if (prev.hadResults) {
+							return `DUPLICATE SEARCH BLOCKED (${blockCount}x). You already searched for "${searchQuery}" in this path and found results. Do NOT repeat. Use extract to examine the files you already found, try a COMPLETELY different keyword, or provide your final answer.`;
+						}
+						const exactHint = exact
+							? 'You used exact=true. Try a broader search with exact=false, or use listFiles to browse the directory structure.'
+							: 'Try exact=true if you need literal/punctuation matching (e.g. \'description: ""\'), or use listFiles to explore directories, or search for a broader/related term and filter manually.';
+						return `DUPLICATE SEARCH BLOCKED (${blockCount}x). You already searched for "${searchQuery}" in this path and got NO results. This term does not appear in the codebase. Do NOT repeat or rephrase — try a FUNDAMENTALLY different approach: ${exactHint} If multiple approaches have failed, provide your final answer with what you know.`;
 					}
-					previousSearches.add(searchKey);
-					consecutiveDupBlocks = 0; // Reset on successful new search
+					previousSearches.set(searchKey, { hadResults: false });
 					paginationCounts.set(searchKey, 0);
 				} else {
 					// Cap pagination to prevent runaway page-through of broad queries
@@ -474,6 +490,16 @@ export const searchTool = (options = {}) => {
 				}
 				try {
 					const result = maybeAnnotate(await runRawSearch());
+					// Track whether this search had results for better dedup messages
+					if (typeof result === 'string' && result.includes('No results found')) {
+						// Append contextual hint for ticket/issue ID queries
+						if (/^[A-Z]+-\d+$/.test(searchQuery.trim()) || /^[A-Z]+-\d+$/.test(searchQuery.replace(/"/g, '').trim())) {
+							return result + '\n\n⚠️ Your query looks like a ticket/issue ID (e.g., JIRA-1234). Ticket IDs are rarely present in source code. Search for the technical concepts described in the ticket instead (e.g., function names, error messages, variable names).';
+						}
+					} else if (typeof result === 'string') {
+						const entry = previousSearches.get(searchKey);
+						if (entry) entry.hadResults = true;
+					}
 					// Track files found in search results for staleness detection
 					if (options.fileTracker && typeof result === 'string') {
 						options.fileTracker.trackFilesFromOutput(result, effectiveSearchCwd).catch(() => {});
@@ -862,7 +888,11 @@ export const extractTool = (options = {}) => {
  * @returns {Object} Configured delegate tool
  */
 export const delegateTool = (options = {}) => {
-	const { debug = false, timeout = 300, cwd, allowedFolders, workspaceRoot, enableBash = false, bashConfig, architectureFileName, enableMcp = false, mcpConfig = null, mcpConfigPath = null, delegationManager = null } = options;
+	const { debug = false, timeout = 300, cwd, allowedFolders, workspaceRoot, enableBash = false, bashConfig, architectureFileName, enableMcp = false, mcpConfig = null, mcpConfigPath = null, delegationManager = null,
+		// Timeout settings inherited from parent agent
+		timeoutBehavior, maxOperationTimeout, requestTimeout, gracefulTimeoutBonusSteps,
+		negotiatedTimeoutBudget, negotiatedTimeoutMaxRequests, negotiatedTimeoutMaxPerRequest,
+		parentOperationStartTime, onSubagentCreated, onSubagentCompleted } = options;
 	return tool({
 		name: 'delegate',
@@ -941,9 +971,32 @@ export const delegateTool = (options = {}) => {
 			}
 			// Execute delegation - let errors propagate naturally
+			// Cap delegate timeout to remaining parent budget (with 10% headroom)
+			let effectiveTimeout = timeout;
+			if (parentOperationStartTime && maxOperationTimeout) {
+				const elapsed = Date.now() - parentOperationStartTime;
+				const remaining = maxOperationTimeout - elapsed;
+				const budgetCap = Math.max(30, Math.floor(remaining * 0.9 / 1000)); // seconds, min 30s
+				if (budgetCap < effectiveTimeout) {
+					effectiveTimeout = budgetCap;
+					if (debug) {
+						console.error(`[DELEGATE] Capping timeout from ${timeout}s to ${effectiveTimeout}s (remaining parent budget: ${Math.floor(remaining/1000)}s)`);
+					}
+					if (tracer) {
+						tracer.addEvent('delegation.budget_capped', {
+							'delegation.original_timeout_s': timeout,
+							'delegation.effective_timeout_s': effectiveTimeout,
+							'delegation.parent_elapsed_ms': elapsed,
+							'delegation.parent_remaining_ms': remaining,
+							'delegation.parent_session_id': parentSessionId,
+						});
+					}
+				}
+			}
 			const result = await delegate({
 				task,
-				timeout,
+				timeout: effectiveTimeout,
 				debug,
 				currentIteration: currentIteration || 0,
 				maxIterations: maxIterations || 30,
@@ -961,7 +1014,14 @@ export const delegateTool = (options = {}) => {
 				mcpConfig,
 				mcpConfigPath,
 				delegationManager,  // Per-instance delegation limits
-				parentAbortSignal
+				parentAbortSignal,
+				// Inherit timeout settings for subagent
+				timeoutBehavior,
+				requestTimeout,
+				gracefulTimeoutBonusSteps,
+				// Subagent lifecycle callbacks for graceful stop coordination
+				onSubagentCreated,
+				onSubagentCompleted,
 			});
 			return result;