npm - @telnyx/voice-agent-tester - Versions diffs - 0.2.0 - Mend

@telnyx/voice-agent-tester 0.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (33) hide show

package/.github/CODEOWNERS +4 -0
package/.github/workflows/ci.yml +29 -0
package/.github/workflows/draft-release.yml +72 -0
package/.github/workflows/publish-release.yml +39 -0
package/.release-it.json +31 -0
package/CHANGELOG.md +30 -0
package/CLAUDE.md +72 -0
package/LICENSE +21 -0
package/README.md +92 -0
package/assets/appointment_data.mp3 +0 -0
package/assets/confirmation.mp3 +0 -0
package/assets/greet_me_angry.mp3 +0 -0
package/assets/hello_make_an_appointment.mp3 +0 -0
package/assets/name_lebron_james.mp3 +0 -0
package/assets/recording-processor.js +86 -0
package/assets/tell_me_joke_laugh.mp3 +0 -0
package/assets/tell_me_something_funny.mp3 +0 -0
package/assets/tell_me_something_sad.mp3 +0 -0
package/benchmarks/applications/elevenlabs.yaml +10 -0
package/benchmarks/applications/telnyx.yaml +10 -0
package/benchmarks/applications/vapi.yaml +10 -0
package/benchmarks/scenarios/appointment.yaml +16 -0
package/javascript/audio_input_hooks.js +291 -0
package/javascript/audio_output_hooks.js +876 -0
package/package.json +61 -0
package/src/index.js +560 -0
package/src/provider-import.js +315 -0
package/src/report.js +228 -0
package/src/server.js +31 -0
package/src/transcription.js +138 -0
package/src/voice-agent-tester.js +1033 -0
package/tests/integration.test.js +138 -0
package/tests/voice-agent-tester.test.js +190 -0

package/package.json ADDED Viewed

@@ -0,0 +1,61 @@
+{
+  "name": "@telnyx/voice-agent-tester",
+  "version": "0.2.0",
+  "description": "A command-line tool to test voice agents using Puppeteer",
+  "main": "src/index.js",
+  "type": "module",
+  "scripts": {
+    "start": "node src/index.js",
+    "server": "node src/server.js",
+    "test": "node --experimental-vm-modules node_modules/jest/bin/jest.js",
+    "test:watch": "jest --watch",
+    "release": "release-it"
+  },
+  "bin": {
+    "voice-agent-tester": "./src/index.js"
+  },
+  "repository": {
+    "type": "git",
+    "url": "git://github.com/team-telnyx/voice-agent-tester.git"
+  },
+  "publishConfig": {
+    "access": "public",
+    "@telnyx:registry": "https://registry.npmjs.org"
+  },
+  "dependencies": {
+    "@puppeteer/browsers": "^2.4.0",
+    "express": "^5.1.0",
+    "glob": "^11.1.0",
+    "openai": "^4.104.0",
+    "puppeteer": "^24.3.0",
+    "puppeteer-stream": "^3.0.8",
+    "yaml": "^2.3.0",
+    "yargs": "^17.7.0"
+  },
+  "devDependencies": {
+    "@jest/globals": "^29.0.0",
+    "@release-it/conventional-changelog": "^10.0.4",
+    "jest": "^29.0.0",
+    "release-it": "^19.2.3"
+  },
+  "jest": {
+    "testEnvironment": "node",
+    "moduleNameMapper": {
+      "^(\\.{1,2}/.*)\\.js$": "$1"
+    },
+    "transform": {},
+    "testMatch": [
+      "**/tests/**/*.test.js"
+    ]
+  },
+  "keywords": [
+    "voice",
+    "agent",
+    "testing",
+    "puppeteer",
+    "automation"
+  ],
+  "author": "Voice Agent Tester",
+  "license": "MIT",
+  "packageManager": "yarn@4.11.0+sha512.4e54aeace9141df2f0177c266b05ec50dc044638157dae128c471ba65994ac802122d7ab35bcd9e81641228b7dcf24867d28e750e0bcae8a05277d600008ad54"
+}

package/src/index.js ADDED Viewed

@@ -0,0 +1,560 @@
+#!/usr/bin/env node
+import fs from 'fs';
+import path from 'path';
+import { fileURLToPath } from 'url';
+import readline from 'readline';
+import yargs from 'yargs';
+import { hideBin } from 'yargs/helpers';
+import YAML from 'yaml';
+import { VoiceAgentTester } from './voice-agent-tester.js';
+import { ReportGenerator } from './report.js';
+import { createServer } from './server.js';
+import { importAssistantsFromProvider, getAssistant, enableWebCalls, SUPPORTED_PROVIDERS } from './provider-import.js';
+// This file is an ES module, so __filename/__dirname are rebuilt here from import.meta.url.
+const __filename = fileURLToPath(import.meta.url);
+const __dirname = path.dirname(__filename);
+/**
+ * Resolve a comma-separated list of files and/or folders into config file paths.
+ *
+ * Each entry is resolved against the current working directory. A folder
+ * contributes every `.yaml` / `.yml` file directly inside it (not recursive);
+ * a regular file is taken as-is regardless of extension.
+ *
+ * @param {string} input - Comma-separated file or folder paths.
+ * @returns {string[]} Absolute paths, in the order the entries were given.
+ * @throws {Error} `Path not found: …` when an entry does not exist.
+ */
+function resolveConfigPaths(input) {
+  const paths = [];
+  // Drop empty segments ("a.yaml," or ""): path.resolve('') is the current
+  // working directory, which would otherwise be scanned by accident.
+  const items = input
+    .split(',')
+    .map((s) => s.trim())
+    .filter((s) => s !== '');
+  for (const item of items) {
+    const resolvedPath = path.resolve(item);
+    if (!fs.existsSync(resolvedPath)) {
+      throw new Error(`Path not found: ${resolvedPath}`);
+    }
+    const stat = fs.statSync(resolvedPath);
+    if (stat.isDirectory()) {
+      // Directory listing order is not guaranteed, so sort for a stable run order.
+      const files = fs.readdirSync(resolvedPath)
+        .filter((f) => f.endsWith('.yaml') || f.endsWith('.yml'))
+        .sort()
+        .map((f) => path.join(resolvedPath, f));
+      paths.push(...files);
+    } else if (stat.isFile()) {
+      paths.push(resolvedPath);
+    }
+  }
+  return paths;
+}
+/**
+ * Parse `key=value` pairs into a plain object.
+ *
+ * Pairs are separated by commas; only the first `=` in a pair splits key from
+ * value, so values may themselves contain `=`. Keys and values are trimmed.
+ * Pairs without `=` or with an empty key are ignored.
+ *
+ * @param {string|string[]|null|undefined} paramsString - Comma-separated pairs.
+ *   An array is also accepted, since repeating the `--params` flag makes yargs
+ *   supply one string per occurrence.
+ * @returns {Object<string, string>} Parsed parameters (empty object for no input).
+ */
+function parseParams(paramsString) {
+  if (!paramsString) {
+    return {};
+  }
+  const chunks = Array.isArray(paramsString) ? paramsString : [paramsString];
+  const params = {};
+  for (const pair of chunks.flatMap((chunk) => String(chunk).split(','))) {
+    const separatorIndex = pair.indexOf('=');
+    if (separatorIndex === -1) {
+      continue;
+    }
+    const key = pair.slice(0, separatorIndex).trim();
+    // A blank key can never match a {{placeholder}}, so it is dropped.
+    if (key === '') {
+      continue;
+    }
+    params[key] = pair.slice(separatorIndex + 1).trim();
+  }
+  return params;
+}
+/**
+ * Replace every `{{key}}` placeholder in a URL with the matching param value.
+ *
+ * Keys and values are treated as literal text: regex metacharacters in a key
+ * and `$`-sequences in a value have no special meaning. Placeholders without
+ * a matching key are left untouched.
+ *
+ * @param {string|undefined} url - URL template; falsy input is returned as-is.
+ * @param {Object<string, string>} params - Placeholder names mapped to values.
+ * @returns {string|undefined} The URL with placeholders substituted.
+ */
+function substituteUrlParams(url, params) {
+  if (!url) return url;
+  let result = url;
+  for (const [key, value] of Object.entries(params)) {
+    // A string pattern avoids building a RegExp from the key, and a replacer
+    // function keeps "$&", "$1", … in the value from being expanded.
+    result = result.replaceAll(`{{${key}}}`, () => String(value));
+  }
+  return result;
+}
+/**
+ * Load an application config from a YAML file and validate it.
+ *
+ * @param {string} configPath - Path to the application YAML file.
+ * @param {Object<string, string>} [params={}] - Values substituted into
+ *   `{{key}}` placeholders of the config's `url`.
+ * @returns {{name: string, path: string, url: (string|undefined), html: *, steps: Array, tags: Array}}
+ *   Normalized config; `name` is the file name without its extension, and
+ *   `steps` / `tags` default to empty arrays.
+ * @throws {Error} When the file has neither a `url` nor an `html` field
+ *   (including an empty file), or when it cannot be read or parsed.
+ */
+function loadApplicationConfig(configPath, params = {}) {
+  const configFile = fs.readFileSync(configPath, 'utf8');
+  const config = YAML.parse(configFile);
+  // An empty document parses to null; check for that first so the user gets
+  // the descriptive error below instead of a TypeError on property access.
+  const isMapping = config !== null && typeof config === 'object';
+  if (!isMapping || (!config.url && !config.html)) {
+    throw new Error(`Application config must contain "url" or "html" field: ${configPath}`);
+  }
+  // Substitute URL template params
+  const url = substituteUrlParams(config.url, params);
+  return {
+    name: path.basename(configPath, path.extname(configPath)),
+    path: configPath,
+    url: url,
+    html: config.html,
+    steps: config.steps || [],
+    tags: config.tags || []
+  };
+}
+/**
+ * Load a scenario config from a YAML file.
+ *
+ * No field is mandatory: missing `steps` / `tags` become empty arrays and a
+ * missing `background` becomes `null`. An empty file is treated the same way.
+ *
+ * @param {string} configPath - Path to the scenario YAML file.
+ * @returns {{name: string, path: string, steps: Array, background: *, tags: Array}}
+ *   Normalized scenario; `name` is the file name without its extension.
+ * @throws {Error} When the file cannot be read or parsed.
+ */
+function loadScenarioConfig(configPath) {
+  const configFile = fs.readFileSync(configPath, 'utf8');
+  // An empty document parses to null; fall back to an empty mapping so the
+  // defaults below apply instead of a TypeError on property access.
+  const config = YAML.parse(configFile) ?? {};
+  return {
+    name: path.basename(configPath, path.extname(configPath)),
+    path: configPath,
+    steps: config.steps || [],
+    background: config.background || null,
+    tags: config.tags || []
+  };
+}
+/**
+ * Ask a yes/no question on the terminal.
+ *
+ * @param {string} question - Prompt text written to stdout.
+ * @returns {Promise<boolean>} `true` when the answer is "y" or "yes"
+ *   (case-insensitive, surrounding whitespace ignored); `false` for any other
+ *   answer, or when stdin closes before an answer is given.
+ */
+function promptUser(question) {
+  return new Promise((resolve) => {
+    const rl = readline.createInterface({
+      input: process.stdin,
+      output: process.stdout
+    });
+    // If the input stream ends without an answer (piped or closed stdin) the
+    // question callback never fires; settle as "no" so the caller cannot hang.
+    // After a real answer this is a no-op, because the promise is already resolved.
+    rl.once('close', () => resolve(false));
+    rl.question(question, (answer) => {
+      const normalized = answer.toLowerCase().trim();
+      resolve(normalized === 'y' || normalized === 'yes');
+      rl.close();
+    });
+  });
+}
+// Parse command-line arguments.
+// Runs at module load. --applications and --scenarios are mandatory (demandOption);
+// every other option has a default or is validated later in main().
+// main() reads dashed option names in camelCase form (e.g. argv.assetsServer, argv.apiKey).
+const argv = yargs(hideBin(process.argv))
+  .option('applications', {
+    alias: 'a',
+    type: 'string',
+    description: 'Comma-separated application paths or folder path',
+    demandOption: true
+  })
+  .option('scenarios', {
+    alias: 's',
+    type: 'string',
+    description: 'Comma-separated scenario paths or folder path',
+    demandOption: true
+  })
+  .option('verbose', {
+    alias: 'v',
+    type: 'boolean',
+    description: 'Show browser console logs',
+    default: false
+  })
+  .option('assets-server', {
+    type: 'string',
+    description: 'Assets server URL',
+    // Port precedence: HTTP_PORT, then PORT, then 3333.
+    default: `http://localhost:${process.env.HTTP_PORT || process.env.PORT || 3333}`
+  })
+  .option('report', {
+    alias: 'r',
+    type: 'string',
+    description: 'Generate CSV report with step elapsed times to specified file',
+    default: null
+  })
+  .option('repeat', {
+    type: 'number',
+    description: 'Number of repetitions to run each app+scenario combination (closes and recreates browser for each)',
+    default: 1
+  })
+  .option('headless', {
+    type: 'boolean',
+    description: 'Run browser in headless mode',
+    default: true
+  })
+  .option('application-tags', {
+    type: 'string',
+    description: 'Comma-separated list of application tags to filter by',
+    default: null
+  })
+  .option('scenario-tags', {
+    type: 'string',
+    description: 'Comma-separated list of scenario tags to filter by',
+    default: null
+  })
+  .option('concurrency', {
+    alias: 'c',
+    type: 'number',
+    description: 'Number of tests to run in parallel',
+    default: 1
+  })
+  .option('record', {
+    type: 'boolean',
+    description: 'Record video and audio of the test in webm format',
+    default: false
+  })
+  .option('params', {
+    alias: 'p',
+    type: 'string',
+    description: 'Comma-separated key=value pairs for URL template substitution (e.g., --params key=value)',
+    default: null
+  })
+  // Provider import options: main() requires --api-key, --provider-api-key and
+  // --provider-import-id whenever --provider is given.
+  .option('provider', {
+    type: 'string',
+    description: `Import from external provider (${SUPPORTED_PROVIDERS.join(', ')}) - requires --api-key, --provider-api-key, --provider-import-id`,
+    choices: SUPPORTED_PROVIDERS
+  })
+  .option('api-key', {
+    type: 'string',
+    description: 'Telnyx API key for authentication and import operations'
+  })
+  .option('provider-api-key', {
+    type: 'string',
+    description: 'External provider API key (required with --provider for import)'
+  })
+  .option('provider-import-id', {
+    type: 'string',
+    description: 'Provider assistant/agent ID to import (required with --provider)'
+  })
+  // main() requires --assistant-id whenever --provider is not given.
+  .option('assistant-id', {
+    type: 'string',
+    description: 'Assistant/agent ID for direct benchmarking (works with all providers)'
+  })
+  .option('debug', {
+    alias: 'd',
+    type: 'boolean',
+    description: 'Enable detailed timeout diagnostics for audio events',
+    default: false
+  })
+  .help()
+  .argv;
+/**
+ * CLI entry point: run every application × scenario combination and report the outcome.
+ *
+ * Flow: start the assets server, resolve and load the YAML configs, optionally
+ * import an assistant from an external provider (or check the given Telnyx
+ * assistant), build the run list (combination × repetitions), execute it through
+ * a fixed-size worker pool, print the metrics and final summary, then clean up
+ * temporary HTML files and close the server.
+ *
+ * Never rejects: all errors are caught and logged, and the process is terminated
+ * from the `finally` block with exit code 0 (all runs passed) or 1 (a run
+ * failed or setup threw).
+ *
+ * @returns {Promise<void>}
+ */
+async function main() {
+  let server;
+  let exitCode = 0;
+  // Temp HTML files written by executeRun(); removed in the finally block.
+  const tempHtmlPaths = [];
+  try {
+    // Start the assets server
+    server = createServer();
+    // Resolve application and scenario paths
+    const applicationPaths = resolveConfigPaths(argv.applications);
+    const scenarioPaths = resolveConfigPaths(argv.scenarios);
+    if (applicationPaths.length === 0) {
+      throw new Error('No application config files found');
+    }
+    if (scenarioPaths.length === 0) {
+      throw new Error('No scenario config files found');
+    }
+    // Parse URL parameters for template substitution
+    const params = parseParams(argv.params);
+    // Handle provider import if requested
+    if (argv.provider) {
+      // Validate required options for provider import
+      if (!argv.apiKey) {
+        throw new Error('--api-key (Telnyx) is required when using --provider');
+      }
+      if (!argv.providerApiKey) {
+        throw new Error('--provider-api-key is required when using --provider');
+      }
+      if (!argv.providerImportId) {
+        throw new Error('--provider-import-id is required when using --provider');
+      }
+      const importResult = await importAssistantsFromProvider({
+        provider: argv.provider,
+        providerApiKey: argv.providerApiKey,
+        telnyxApiKey: argv.apiKey,
+        assistantId: argv.providerImportId
+      });
+      // Use the imported assistant's Telnyx ID
+      const selectedAssistant = importResult.assistants[0];
+      // Inject the imported assistant ID into params (overrides CLI assistant-id with Telnyx ID)
+      if (selectedAssistant) {
+        params.assistantId = selectedAssistant.id;
+        console.log(`📝 Injected Telnyx assistantId from ${argv.provider} import: ${selectedAssistant.id}`);
+      }
+    } else if (!argv.assistantId) {
+      throw new Error('--assistant-id is required');
+    } else {
+      // Inject assistant-id into params for URL template substitution
+      params.assistantId = argv.assistantId;
+      // Direct Telnyx use case - optionally check web calls support if api-key provided
+      if (argv.apiKey) {
+        console.log(`\n🔍 Checking assistant configuration...`);
+        // Best-effort check: any failure here is logged and the benchmark still runs.
+        try {
+          const assistant = await getAssistant({
+            assistantId: argv.assistantId,
+            telnyxApiKey: argv.apiKey
+          });
+          const supportsWebCalls = assistant.telephony_settings?.supports_unauthenticated_web_calls;
+          if (!supportsWebCalls) {
+            console.log(`❌ Unauthenticated web calls: disabled`);
+            console.warn(`\n⚠️  Warning: Assistant "${assistant.name}" does not support unauthenticated web calls.`);
+            console.warn(`   The benchmark may not work correctly without this setting enabled.\n`);
+            const shouldEnable = await promptUser('Would you like to enable unauthenticated web calls? (y/n): ');
+            if (shouldEnable) {
+              await enableWebCalls({
+                assistantId: argv.assistantId,
+                telnyxApiKey: argv.apiKey,
+                assistant
+              });
+            } else {
+              console.log('   Proceeding without enabling web calls...\n');
+            }
+          } else {
+            console.log(`✅ Unauthenticated web calls: enabled`);
+          }
+        } catch (error) {
+          console.log(`⚠️  Could not check assistant: ${error.message}`);
+        }
+      }
+    }
+    if (Object.keys(params).length > 0) {
+      console.log(`📝 URL parameters: ${JSON.stringify(params)}`);
+    }
+    // Load all application and scenario configs
+    let applications = applicationPaths.map(p => loadApplicationConfig(p, params));
+    let scenarios = scenarioPaths.map(loadScenarioConfig);
+    // Filter applications by tags if specified (an app matches when it has ANY of the tags)
+    if (argv.applicationTags) {
+      const filterTags = argv.applicationTags.split(',').map(t => t.trim());
+      applications = applications.filter(app =>
+        app.tags.some(tag => filterTags.includes(tag))
+      );
+      if (applications.length === 0) {
+        throw new Error(`No applications found with tags: ${filterTags.join(', ')}`);
+      }
+    }
+    // Filter scenarios by tags if specified (a scenario matches when it has ANY of the tags)
+    if (argv.scenarioTags) {
+      const filterTags = argv.scenarioTags.split(',').map(t => t.trim());
+      scenarios = scenarios.filter(scenario =>
+        scenario.tags.some(tag => filterTags.includes(tag))
+      );
+      if (scenarios.length === 0) {
+        throw new Error(`No scenarios found with tags: ${filterTags.join(', ')}`);
+      }
+    }
+    console.log(`\n📋 Loaded ${applications.length} application(s) and ${scenarios.length} scenario(s)`);
+    console.log(`Applications: ${applications.map(a => a.name).join(', ')}`);
+    console.log(`Scenarios: ${scenarios.map(s => s.name).join(', ')}`);
+    // Create matrix of all combinations
+    const combinations = [];
+    for (const app of applications) {
+      for (const scenario of scenarios) {
+        combinations.push({ app, scenario });
+      }
+    }
+    const totalRuns = combinations.length * argv.repeat;
+    console.log(`\n🎯 Running ${combinations.length} combination(s) × ${argv.repeat} repetition(s) = ${totalRuns} total run(s)\n`);
+    // Create a single report generator for metrics tracking
+    // (shared by every run; falls back to 'temp_metrics.csv' when --report is not given)
+    const reportGenerator = new ReportGenerator(argv.report || 'temp_metrics.csv');
+    // Helper function to execute a single test run.
+    // Never throws for a failed scenario: resolves to { success: true } or
+    // { success: false, error: { app, scenario, repetition, error } }.
+    async function executeRun({ app, scenario, repetition, runNumber }) {
+      console.log(`\n${'='.repeat(80)}`);
+      console.log(`📱 Application: ${app.name}`);
+      console.log(`📝 Scenario: ${scenario.name}`);
+      if (argv.repeat > 1) {
+        console.log(`🔁 Repetition: ${repetition}`);
+      }
+      console.log(`🏃 Run: ${runNumber}/${totalRuns}`);
+      console.log(`${'='.repeat(80)}`);
+      // Handle HTML content vs URL
+      let targetUrl;
+      let tempHtmlPath = null;
+      if (app.html) {
+        // Create temporary HTML file and serve it
+        const assetsDir = path.join(__dirname, '..', 'assets');
+        if (!fs.existsSync(assetsDir)) {
+          fs.mkdirSync(assetsDir, { recursive: true });
+        }
+        // NOTE(review): the name is unique only per app name + millisecond, so
+        // concurrent runs of the same app can resolve to the same file.
+        tempHtmlPath = path.join(assetsDir, `temp_${app.name}_${Date.now()}.html`);
+        fs.writeFileSync(tempHtmlPath, app.html, 'utf8');
+        tempHtmlPaths.push(tempHtmlPath);
+        targetUrl = `${argv.assetsServer}/assets/${path.basename(tempHtmlPath)}`;
+        console.log(`HTML content served at: ${targetUrl}`);
+      } else {
+        targetUrl = app.url;
+        console.log(`URL: ${targetUrl}`);
+      }
+      // Application and scenario steps are executed separately
+      console.log(`Total steps: ${app.steps.length + scenario.steps.length} (${app.steps.length} from app + ${scenario.steps.length} from suite)\n`);
+      const tester = new VoiceAgentTester({
+        verbose: argv.verbose,
+        headless: argv.headless,
+        assetsServerUrl: argv.assetsServer,
+        reportGenerator: reportGenerator,
+        record: argv.record,
+        debug: argv.debug
+      });
+      try {
+        await tester.runScenario(targetUrl, app.steps, scenario.steps, app.name, scenario.name, repetition, scenario.background);
+        console.log(`✅ Completed successfully (Run ${runNumber}/${totalRuns})`);
+        return { success: true };
+      } catch (error) {
+        // Store only the first line for summary, but print full message here (with diagnostics)
+        const shortMessage = error.message.split('\n')[0];
+        const errorInfo = {
+          app: app.name,
+          scenario: scenario.name,
+          repetition,
+          error: shortMessage
+        };
+        // Print full diagnostics here (only place they appear)
+        console.error(`❌ Error (Run ${runNumber}/${totalRuns}):\n${error.message}`);
+        return { success: false, error: errorInfo };
+      }
+    }
+    // Build all test runs (combination x repetitions)
+    const allRuns = [];
+    let runNumber = 0;
+    for (const { app, scenario } of combinations) {
+      // NOTE(review): totalRuns above multiplies by argv.repeat directly, while this
+      // falls back to 1 when argv.repeat is 0 or NaN, so the two counts can disagree.
+      const repetitions = argv.repeat || 1;
+      for (let i = 0; i < repetitions; i++) {
+        runNumber++;
+        allRuns.push({
+          app,
+          scenario,
+          repetition: i,
+          runNumber
+        });
+      }
+    }
+    // Execute runs with concurrency limit using a worker pool
+    const concurrency = Math.min(argv.concurrency || 1, allRuns.length);
+    console.log(`⚡ Concurrency level: ${concurrency}`);
+    // Worker pool implementation - start new tests as soon as one finishes
+    const allResults = [];
+    // Shared cursor into allRuns; each worker claims the next index.
+    let nextRunIndex = 0;
+    // Create a pool of worker promises
+    // (runWorker is a function declaration below, so it is hoisted and callable here)
+    const workers = [];
+    for (let i = 0; i < concurrency; i++) {
+      workers.push(runWorker(i + 1));
+    }
+    // Worker function that processes runs from the queue
+    async function runWorker(workerId) {
+      const workerResults = [];
+      while (nextRunIndex < allRuns.length) {
+        // No await between the bounds check and the increment, so every index
+        // is claimed by exactly one worker.
+        const runIndex = nextRunIndex++;
+        const run = allRuns[runIndex];
+        if (concurrency > 1) {
+          console.log(`\n👷 Worker ${workerId}: Starting run ${run.runNumber}/${totalRuns}`);
+        }
+        const result = await executeRun(run);
+        workerResults.push(result);
+      }
+      return workerResults;
+    }
+    // Wait for all workers to complete
+    const workerResultArrays = await Promise.all(workers);
+    // Flatten all worker results into a single array
+    // (grouped by worker, so not necessarily in run-number order)
+    workerResultArrays.forEach(workerResults => {
+      allResults.push(...workerResults);
+    });
+    // Aggregate results
+    const results = {
+      successful: allResults.filter(r => r.success).length,
+      failed: allResults.filter(r => !r.success).length,
+      errors: allResults.filter(r => !r.success).map(r => r.error)
+    };
+    // Generate the final report if requested, and always show metrics summary
+    if (argv.report) {
+      reportGenerator.generateCSV();
+    }
+    reportGenerator.generateMetricsSummary();
+    // Print final summary
+    console.log(`\n${'='.repeat(80)}`);
+    console.log(`📊 FINAL SUMMARY`);
+    console.log(`${'='.repeat(80)}`);
+    console.log(`✅ Successful runs: ${results.successful}/${totalRuns}`);
+    if (results.failed > 0) {
+      console.log(`\n🔍 Failure Details:`);
+      results.errors.forEach(({ app, scenario, repetition, error }) => {
+        console.log(`  ${app} + ${scenario} (rep ${repetition}): ${error}`);
+      });
+    }
+    if (results.failed === 0) {
+      console.log(`\n🎉 All runs completed successfully!`);
+    } else {
+      console.log(`\n⚠️  Completed with ${results.failed} failure(s).`);
+      // Show helpful hint for direct Telnyx usage (when not using --provider)
+      if (!argv.provider && argv.assistantId) {
+        const editUrl = `https://portal.telnyx.com/#/login/sign-in?redirectTo=/ai/assistants/edit/${argv.assistantId}`;
+        console.log(`\n💡 Tip: Make sure that the "Supports Unauthenticated Web Calls" option is enabled in your Telnyx assistant settings.`);
+        console.log(`   Edit assistant: ${editUrl}`);
+        console.log(`   Or provide --api-key to enable this setting automatically via CLI.`);
+      }
+    }
+    // Set exit code based on results
+    if (results.failed > 0) {
+      exitCode = 1;
+    }
+  } catch (error) {
+    // Setup/validation failures land here; only the message is printed.
+    console.error('Error running scenarios:', error.message);
+    exitCode = 1;
+  } finally {
+    // Clean up temporary HTML files if created
+    for (const tempHtmlPath of tempHtmlPaths) {
+      if (fs.existsSync(tempHtmlPath)) {
+        fs.unlinkSync(tempHtmlPath);
+      }
+    }
+    if (tempHtmlPaths.length > 0) {
+      console.log('Temporary HTML files cleaned up');
+    }
+    // Close the server to allow process to exit
+    // (the exit happens inside the close callback, i.e. only once the server has closed)
+    if (server) {
+      server.close(() => {
+        console.log('Server closed');
+        process.exit(exitCode);
+      });
+    } else {
+      process.exit(exitCode);
+    }
+  }
+}
+// Run main() only when this file is the script Node was started with.
+// Both sides are compared as real filesystem paths: process.argv[1] may be a
+// symlink (e.g. the npm-installed `voice-agent-tester` bin), and a raw
+// `file://` string comparison also breaks on paths that need URL encoding
+// and on Windows drive paths.
+if (
+  process.argv[1] &&
+  fs.existsSync(process.argv[1]) &&
+  fs.realpathSync(process.argv[1]) === fs.realpathSync(fileURLToPath(import.meta.url))
+) {
+  main();
+}