@probelabs/probe 0.6.0-rc229 → 0.6.0-rc230

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
package/package.json CHANGED
@@ -1,6 +1,6 @@
1
1
  {
2
2
  "name": "@probelabs/probe",
3
- "version": "0.6.0-rc229",
3
+ "version": "0.6.0-rc230",
4
4
  "description": "Node.js wrapper for the probe code search tool",
5
5
  "main": "src/index.js",
6
6
  "module": "src/index.js",
@@ -58,6 +58,8 @@ import {
58
58
  implementToolDefinition,
59
59
  editToolDefinition,
60
60
  createToolDefinition,
61
+ googleSearchToolDefinition,
62
+ urlContextToolDefinition,
61
63
  attemptCompletionSchema,
62
64
  parseXmlToolCallWithThinking
63
65
  } from './tools.js';
@@ -404,6 +406,10 @@ export class ProbeAgent {
404
406
  // Initialize the AI model
405
407
  this.initializeModel();
406
408
 
409
+ // Gemini built-in tools (provider-defined, server-side)
410
+ // These are enabled automatically when the provider is Google
411
+ this._geminiToolsEnabled = this._initializeGeminiBuiltinTools();
412
+
407
413
  // Note: MCP initialization is now done in initialize() method
408
414
  // Constructor must remain synchronous for backward compatibility
409
415
  }
@@ -1320,6 +1326,15 @@ export class ProbeAgent {
1320
1326
  abortSignal: controller.signal
1321
1327
  };
1322
1328
 
1329
+ // Strip Gemini provider-defined tools when falling back to non-Google provider
1330
+ // These tools have no execute function and would cause errors on other providers
1331
+ if (config.provider !== 'google' && fallbackOptions.tools) {
1332
+ delete fallbackOptions.tools;
1333
+ if (this.debug) {
1334
+ console.error(`[DEBUG] Stripped Gemini built-in tools for fallback to ${config.provider} provider`);
1335
+ }
1336
+ }
1337
+
1323
1338
  const providerRetryManager = new RetryManager({
1324
1339
  maxRetries: config.maxRetries ?? this.retryConfig.maxRetries ?? 3,
1325
1340
  initialDelay: this.retryConfig.initialDelay ?? 1000,
@@ -1442,6 +1457,83 @@ export class ProbeAgent {
1442
1457
  }
1443
1458
  }
1444
1459
 
1460
+ /**
1461
+ * Initialize Gemini built-in tools (gemini_google_search, gemini_url_context).
1462
+ * These are provider-defined tools that execute server-side on Google's infrastructure.
1463
+ * They are only available when the provider is Google Gemini.
1464
+ * @returns {{ googleSearch: boolean, urlContext: boolean }} Which tools were enabled
1465
+ * @private
1466
+ */
1467
+ _initializeGeminiBuiltinTools() {
1468
+ const isToolAllowed = (toolName) => this.allowedTools.isEnabled(toolName);
1469
+ const result = { googleSearch: false, urlContext: false };
1470
+
1471
+ if (this.apiType !== 'google') {
1472
+ // Log info about unavailability for non-Google providers
1473
+ if (isToolAllowed('gemini_google_search') || isToolAllowed('gemini_url_context')) {
1474
+ if (this.debug) {
1475
+ console.error(`[DEBUG] Gemini built-in tools (gemini_google_search, gemini_url_context) are not available: provider is '${this.apiType}', not 'google'. These tools require the Google Gemini provider.`);
1476
+ }
1477
+ }
1478
+ return result;
1479
+ }
1480
+
1481
+ // Check SDK support
1482
+ if (!this.provider || !this.provider.tools) {
1483
+ console.error('[ProbeAgent] Gemini built-in tools unavailable: @ai-sdk/google does not expose provider.tools. Upgrade to @ai-sdk/google v2.0.14+.');
1484
+ return result;
1485
+ }
1486
+
1487
+ if (isToolAllowed('gemini_google_search')) {
1488
+ result.googleSearch = true;
1489
+ if (this.debug) {
1490
+ console.error('[DEBUG] Gemini built-in tool enabled: gemini_google_search');
1491
+ }
1492
+ }
1493
+
1494
+ if (isToolAllowed('gemini_url_context')) {
1495
+ result.urlContext = true;
1496
+ if (this.debug) {
1497
+ console.error('[DEBUG] Gemini built-in tool enabled: gemini_url_context');
1498
+ }
1499
+ }
1500
+
1501
+ return result;
1502
+ }
1503
+
1504
+ /**
1505
+ * Build Gemini provider-defined tools object for streamText().
1506
+ * Returns undefined if no Gemini tools are enabled.
1507
+ * @returns {Object|undefined}
1508
+ * @private
1509
+ */
1510
+ _buildGeminiProviderTools() {
1511
+ if (this.apiType !== 'google' || !this._geminiToolsEnabled) {
1512
+ return undefined;
1513
+ }
1514
+
1515
+ const { googleSearch, urlContext } = this._geminiToolsEnabled;
1516
+ if (!googleSearch && !urlContext) {
1517
+ return undefined;
1518
+ }
1519
+
1520
+ if (!this.provider || !this.provider.tools) {
1521
+ return undefined;
1522
+ }
1523
+
1524
+ const tools = {};
1525
+ const providerTools = this.provider.tools;
1526
+
1527
+ if (googleSearch && providerTools.googleSearch) {
1528
+ tools.google_search = providerTools.googleSearch({});
1529
+ }
1530
+ if (urlContext && providerTools.urlContext) {
1531
+ tools.url_context = providerTools.urlContext({});
1532
+ }
1533
+
1534
+ return Object.keys(tools).length > 0 ? tools : undefined;
1535
+ }
1536
+
1445
1537
  /**
1446
1538
  * Initialize AWS Bedrock model
1447
1539
  */
@@ -2420,6 +2512,14 @@ ${extractGuidance}
2420
2512
  toolDefinitions += `${analyzeAllToolDefinition}\n`;
2421
2513
  }
2422
2514
 
2515
+ // Gemini built-in tools (only when using Google provider)
2516
+ if (this._geminiToolsEnabled?.googleSearch && isToolAllowed('gemini_google_search')) {
2517
+ toolDefinitions += `${googleSearchToolDefinition}\n`;
2518
+ }
2519
+ if (this._geminiToolsEnabled?.urlContext && isToolAllowed('gemini_url_context')) {
2520
+ toolDefinitions += `${urlContextToolDefinition}\n`;
2521
+ }
2522
+
2423
2523
  // Build XML tool guidelines with dynamic examples based on allowed tools
2424
2524
  // Build examples only for allowed tools
2425
2525
  let toolExamples = '';
@@ -2497,6 +2597,12 @@ The configuration is loaded from src/config.js lines 15-25 which contains the da
2497
2597
  availableToolsList += '- attempt_completion: Finalize the task and provide the result to the user.\n';
2498
2598
  availableToolsList += '- attempt_complete: Quick completion using previous response (shorthand).\n';
2499
2599
  }
2600
+ if (this._geminiToolsEnabled?.googleSearch && isToolAllowed('gemini_google_search')) {
2601
+ availableToolsList += '- gemini_google_search: (auto) Web search via Google — invoked automatically by the model when it needs current information.\n';
2602
+ }
2603
+ if (this._geminiToolsEnabled?.urlContext && isToolAllowed('gemini_url_context')) {
2604
+ availableToolsList += '- gemini_url_context: (auto) URL content reader via Google — automatically fetches and reads URLs mentioned in the conversation.\n';
2605
+ }
2500
2606
 
2501
2607
  let xmlToolGuidelines = `
2502
2608
  # Tool Use Formatting
@@ -3049,12 +3155,21 @@ Follow these instructions carefully:
3049
3155
  // Prepare messages with potential image content
3050
3156
  const messagesForAI = this.prepareMessagesWithImages(currentMessages);
3051
3157
 
3052
- const result = await this.streamTextWithRetryAndFallback({
3158
+ // Build streamText options, including Gemini provider-defined tools if applicable
3159
+ const streamOptions = {
3053
3160
  model: this.provider ? this.provider(this.model) : this.model,
3054
3161
  messages: messagesForAI,
3055
3162
  maxTokens: maxResponseTokens,
3056
3163
  temperature: 0.3,
3057
- });
3164
+ };
3165
+
3166
+ // Inject Gemini built-in tools (gemini_google_search, gemini_url_context) when using Google provider
3167
+ const geminiProviderTools = this._buildGeminiProviderTools();
3168
+ if (geminiProviderTools) {
3169
+ streamOptions.tools = geminiProviderTools;
3170
+ }
3171
+
3172
+ const result = await this.streamTextWithRetryAndFallback(streamOptions);
3058
3173
 
3059
3174
  // Get the promise reference BEFORE consuming stream (doesn't lock it)
3060
3175
  const usagePromise = result.usage;
@@ -3585,6 +3700,12 @@ Follow these instructions carefully:
3585
3700
 
3586
3701
  let toolResultContent = typeof toolResult === 'string' ? toolResult : JSON.stringify(toolResult, null, 2);
3587
3702
 
3703
+ // Convert absolute workspace paths to relative in tool results
3704
+ if (this.workspaceRoot && toolResultContent) {
3705
+ const wsPrefix = this.workspaceRoot.endsWith(sep) ? this.workspaceRoot : this.workspaceRoot + sep;
3706
+ toolResultContent = toolResultContent.split(wsPrefix).join('');
3707
+ }
3708
+
3588
3709
  // Truncate if output exceeds token limit
3589
3710
  try {
3590
3711
  const truncateResult = await truncateIfNeeded(toolResultContent, this.tokenCounter, this.sessionId, this.maxOutputTokens);
@@ -15,7 +15,13 @@ const __dirname = dirname(__filename);
15
15
  * Timeout configuration constants
16
16
  */
17
17
  export const DEFAULT_TIMEOUT = 30000; // 30 seconds
18
- export const MAX_TIMEOUT = 600000; // 10 minutes max to prevent resource exhaustion
18
+ export const MAX_TIMEOUT = (() => {
19
+ if (process.env.MCP_MAX_TIMEOUT) {
20
+ const parsed = parseInt(process.env.MCP_MAX_TIMEOUT, 10);
21
+ if (!isNaN(parsed) && parsed >= 30000 && parsed <= 7200000) return parsed;
22
+ }
23
+ return 1800000; // 30 minutes default - workflow tools (code checkouts, AI exploration) need time
24
+ })();
19
25
 
20
26
  /**
21
27
  * Validate and normalize a timeout value
@@ -27,6 +27,8 @@ import {
27
27
  bashToolDefinition,
28
28
  editToolDefinition,
29
29
  createToolDefinition,
30
+ googleSearchToolDefinition,
31
+ urlContextToolDefinition,
30
32
  parseXmlToolCall
31
33
  } from '../index.js';
32
34
  import { randomUUID } from 'crypto';
@@ -108,6 +110,8 @@ export {
108
110
  editToolDefinition,
109
111
  createToolDefinition,
110
112
  attemptCompletionToolDefinition,
113
+ googleSearchToolDefinition,
114
+ urlContextToolDefinition,
111
115
  parseXmlToolCall
112
116
  };
113
117
 
package/src/index.js CHANGED
@@ -35,6 +35,8 @@ import {
35
35
  analyzeAllToolDefinition,
36
36
  attemptCompletionToolDefinition,
37
37
  bashToolDefinition,
38
+ googleSearchToolDefinition,
39
+ urlContextToolDefinition,
38
40
  parseXmlToolCall
39
41
  } from './tools/common.js';
40
42
  import {
@@ -114,6 +116,8 @@ export {
114
116
  bashToolDefinition,
115
117
  editToolDefinition,
116
118
  createToolDefinition,
119
+ googleSearchToolDefinition,
120
+ urlContextToolDefinition,
117
121
  // Export parser function
118
122
  parseXmlToolCall,
119
123
  // Export task management
@@ -386,6 +386,30 @@ User: Check system info
386
386
  </examples>
387
387
  `;
388
388
 
389
+ export const googleSearchToolDefinition = `
390
+ ## gemini_google_search (Gemini Built-in)
391
+ Description: Web search powered by Google. This is a built-in Gemini capability that automatically searches the web when the model needs current information. The model decides when to search and integrates results directly into its response with source citations.
392
+
393
+ This tool is invoked automatically by the model — you do NOT need to use XML tool calls for it. Simply ask questions that require up-to-date or real-world information and the model will search the web as needed.
394
+
395
+ Capabilities:
396
+ - Real-time web search with grounded citations
397
+ - Automatic query generation and result synthesis
398
+ - Source attribution with URLs
399
+ `;
400
+
401
+ export const urlContextToolDefinition = `
402
+ ## gemini_url_context (Gemini Built-in)
403
+ Description: URL content reader powered by Google. This is a built-in Gemini capability that automatically fetches and analyzes the content of URLs mentioned in the conversation. When you include URLs in your message, the model can read and understand their content.
404
+
405
+ This tool is invoked automatically by the model — you do NOT need to use XML tool calls for it. Simply include URLs in your message and the model will fetch and analyze their content.
406
+
407
+ Capabilities:
408
+ - Fetch and read web page content from URLs in the prompt
409
+ - Supports up to 20 URLs per request
410
+ - Processes HTML content (does not execute JavaScript)
411
+ `;
412
+
389
413
  export const searchDescription = 'Search code in the repository. Free-form questions are accepted, but Elasticsearch-style keyword queries work best. Use this tool first for any code-related questions.';
390
414
  export const queryDescription = 'Search code using ast-grep structural pattern matching. Use this tool to find specific code structures like functions, classes, or methods.';
391
415
  export const extractDescription = 'Extract code blocks from files based on file paths and optional line numbers. Use this tool to see complete context after finding relevant files.';
@@ -55,9 +55,9 @@ export function safeRealpath(inputPath) {
55
55
  * - Does NOT restrict access to specific directories (that's the responsibility
56
56
  * of higher-level components like ProbeAgent with allowedFolders)
57
57
  *
58
- * @param {string} inputPath - The path to validate
58
+ * @param {string} inputPath - The path to validate (can be a file or directory; file paths are resolved to their parent directory)
59
59
  * @param {string} [defaultPath] - Default path to use if inputPath is not provided
60
- * @returns {Promise<string>} Normalized absolute path
60
+ * @returns {Promise<string>} Normalized absolute directory path. If inputPath is a file, returns its parent directory.
61
61
  * @throws {PathError} If the path is invalid or doesn't exist
62
62
  */
63
63
  export async function validateCwdPath(inputPath, defaultPath = process.cwd()) {
@@ -72,6 +72,32 @@ export async function validateCwdPath(inputPath, defaultPath = process.cwd()) {
72
72
  try {
73
73
  const stats = await fs.stat(normalizedPath);
74
74
  if (!stats.isDirectory()) {
75
+ // If the path is a file, resolve to its parent directory
76
+ // This handles cases where a file path is passed as cwd
77
+ // Use safeRealpath to resolve symlinks before extracting parent directory
78
+ const resolvedPath = safeRealpath(normalizedPath);
79
+ const dirPath = path.dirname(resolvedPath);
80
+ try {
81
+ const dirStats = await fs.stat(dirPath);
82
+ if (dirStats.isDirectory()) {
83
+ return safeRealpath(dirPath);
84
+ }
85
+ } catch (dirError) {
86
+ if (dirError.code === 'ENOENT') {
87
+ throw new PathError(`Parent directory does not exist for file: ${normalizedPath}`, {
88
+ suggestion: 'The specified path is a file whose parent directory does not exist.',
89
+ details: { path: normalizedPath, parentPath: dirPath, type: 'file' }
90
+ });
91
+ }
92
+ if (dirError.code === 'EACCES') {
93
+ throw new PathError(`Permission denied accessing parent directory: ${dirPath}`, {
94
+ recoverable: false,
95
+ suggestion: 'Permission denied accessing the parent directory of the specified file.',
96
+ details: { path: normalizedPath, parentPath: dirPath, type: 'file' }
97
+ });
98
+ }
99
+ throw dirError;
100
+ }
75
101
  throw new PathError(`Path is not a directory: ${normalizedPath}`, {
76
102
  suggestion: 'The specified path is a file, not a directory. Please provide a directory path for searching.',
77
103
  details: { path: normalizedPath, type: 'file' }