npm - @artemiskit/cli - Versions diffs - 0.1.7 → 0.2.0 - Mend

@artemiskit/cli 0.1.7 → 0.2.0

This diff compares the contents of two publicly available package versions as released to one of the supported registries. It is provided for informational purposes only and reflects the changes between those versions as they appear in their respective public registries.

Files changed (36)

package/CHANGELOG.md +106 -0
package/bin/artemis.ts +0 -0
package/dist/index.js +70954 -35881
package/dist/src/cli.d.ts.map +1 -1
package/dist/src/commands/compare.d.ts.map +1 -1
package/dist/src/commands/init.d.ts.map +1 -1
package/dist/src/commands/redteam.d.ts.map +1 -1
package/dist/src/commands/run.d.ts.map +1 -1
package/dist/src/commands/stress.d.ts.map +1 -1
package/dist/src/config/loader.d.ts +3 -1
package/dist/src/config/loader.d.ts.map +1 -1
package/dist/src/config/schema.d.ts +8 -0
package/dist/src/config/schema.d.ts.map +1 -1
package/dist/src/ui/index.d.ts +3 -1
package/dist/src/ui/index.d.ts.map +1 -1
package/dist/src/ui/panels.d.ts +21 -0
package/dist/src/ui/panels.d.ts.map +1 -1
package/dist/src/ui/prompts.d.ts +92 -0
package/dist/src/ui/prompts.d.ts.map +1 -0
package/dist/src/utils/adapter.d.ts.map +1 -1
package/dist/src/utils/update-checker.d.ts +31 -0
package/dist/src/utils/update-checker.d.ts.map +1 -0
package/package.json +6 -6
package/src/cli.ts +22 -1
package/src/commands/compare.ts +25 -0
package/src/commands/init.ts +221 -77
package/src/commands/redteam.ts +63 -10
package/src/commands/run.ts +542 -137
package/src/commands/stress.ts +76 -3
package/src/config/loader.ts +5 -2
package/src/config/schema.ts +1 -0
package/src/ui/index.ts +19 -0
package/src/ui/panels.ts +153 -5
package/src/ui/prompts.ts +749 -0
package/src/utils/adapter.ts +8 -0
package/src/utils/update-checker.ts +121 -0

package/src/commands/init.ts CHANGED

@@ -7,7 +7,14 @@ import { appendFile, mkdir, readFile, writeFile } from 'node:fs/promises';
 import { join } from 'node:path';
 import chalk from 'chalk';
 import { Command } from 'commander';
-import { createSpinner, icons } from '../ui/index.js';
+import {
+  type InitWizardResult,
+  createSpinner,
+  icons,
+  isInteractive,
+  runInitWizard,
+} from '../ui/index.js';
+import { checkForUpdateAndNotify, getCurrentVersion } from '../utils/update-checker.js';
 const DEFAULT_CONFIG = `# ArtemisKit Configuration
 project: my-project
@@ -85,19 +92,116 @@ const ENV_KEYS = [
   'ANTHROPIC_API_KEY=',
 ];
+/**
+ * Generate config content from wizard results
+ */
+function generateConfigFromWizard(wizard: InitWizardResult): string {
+  const providerConfigs: Record<string, string> = {
+    openai: `  openai:
+    apiKey: \${OPENAI_API_KEY}
+    defaultModel: ${wizard.model}`,
+    'azure-openai': `  azure-openai:
+    apiKey: \${AZURE_OPENAI_API_KEY}
+    resourceName: \${AZURE_OPENAI_RESOURCE}
+    deploymentName: \${AZURE_OPENAI_DEPLOYMENT}
+    apiVersion: "2024-02-15-preview"`,
+    anthropic: `  anthropic:
+    apiKey: \${ANTHROPIC_API_KEY}
+    defaultModel: ${wizard.model}`,
+    google: `  google:
+    apiKey: \${GOOGLE_AI_API_KEY}
+    defaultModel: ${wizard.model}`,
+    mistral: `  mistral:
+    apiKey: \${MISTRAL_API_KEY}
+    defaultModel: ${wizard.model}`,
+    ollama: `  ollama:
+    baseUrl: http://localhost:11434
+    defaultModel: ${wizard.model}`,
+  };
+  const storageConfig =
+    wizard.storageType === 'supabase'
+      ? `storage:
+  type: supabase
+  supabaseUrl: \${SUPABASE_URL}
+  supabaseKey: \${SUPABASE_ANON_KEY}`
+      : `storage:
+  type: local
+  basePath: ./artemis-runs`;
+  return `# ArtemisKit Configuration
+project: ${wizard.projectName}
+# Default provider settings
+provider: ${wizard.provider}
+model: ${wizard.model}
+# Provider configurations
+providers:
+${providerConfigs[wizard.provider] || providerConfigs.openai}
+# Storage configuration
+${storageConfig}
+# Scenarios directory
+scenariosDir: ./scenarios
+# Output settings
+output:
+  format: json
+  dir: ./artemis-output
+`;
+}
 function renderWelcomeBanner(): string {
+  // Brand color for "KIT" portion: #fb923c (orange)
+  const brandColor = chalk.hex('#fb923c');
+  const version = getCurrentVersion();
+  // Randomly color each border character white or brand color
+  const colorBorderChar = (char: string): string => {
+    return Math.random() > 0.5 ? chalk.white(char) : brandColor(char);
+  };
+  const colorBorder = (str: string): string => {
+    return str.split('').map(colorBorderChar).join('');
+  };
+  // All lines are exactly 52 chars inside the borders for perfect alignment
+  const topBorder = `╭${'─'.repeat(52)}╮`;
+  const bottomBorder = `╰${'─'.repeat(52)}╯`;
+  const sideBorderLeft = '│';
+  const sideBorderRight = '│';
+  const emptyContent = ' '.repeat(52);
+  // Version line: "v0.1.7" centered in brand color
+  const versionText = `v${version}`;
+  const versionPadding = Math.floor((52 - versionText.length) / 2);
+  const versionLine =
+    ' '.repeat(versionPadding) +
+    brandColor(versionText) +
+    ' '.repeat(52 - versionPadding - versionText.length);
+  // Tagline centered
+  const tagline = 'Open-source testing toolkit for LLM applications';
+  const taglinePadding = Math.floor((52 - tagline.length) / 2);
+  const taglineLine =
+    ' '.repeat(taglinePadding) +
+    chalk.gray(tagline) +
+    ' '.repeat(52 - taglinePadding - tagline.length);
   const lines = [
     '',
-    chalk.cyan('  ╔═══════════════════════════════════════════════════════╗'),
-    chalk.cyan('  ║                                                       ║'),
-    chalk.cyan('  ║') +
-      chalk.bold.white('     🎯 Welcome to ArtemisKit                         ') +
-      chalk.cyan('║'),
-    chalk.cyan('  ║') +
-      chalk.gray('     LLM Testing & Evaluation Toolkit                 ') +
-      chalk.cyan('║'),
-    chalk.cyan('  ║                                                       ║'),
-    chalk.cyan('  ╚═══════════════════════════════════════════════════════╝'),
+    `  ${colorBorder(topBorder)}`,
+    `  ${colorBorderChar(sideBorderLeft)}${emptyContent}${colorBorderChar(sideBorderRight)}`,
+    `  ${colorBorderChar(sideBorderLeft)}        ${chalk.bold.white('▄▀█ █▀█ ▀█▀ █▀▀ █▀▄▀█ █ █▀ ')}${brandColor.bold('█▄▀ █ ▀█▀')}        ${colorBorderChar(sideBorderRight)}`,
+    `  ${colorBorderChar(sideBorderLeft)}        ${chalk.bold.white('█▀█ █▀▄  █  ██▄ █ ▀ █ █ ▄█ ')}${brandColor.bold('█ █ █  █ ')}        ${colorBorderChar(sideBorderRight)}`,
+    `  ${colorBorderChar(sideBorderLeft)}${emptyContent}${colorBorderChar(sideBorderRight)}`,
+    `  ${colorBorderChar(sideBorderLeft)}${versionLine}${colorBorderChar(sideBorderRight)}`,
+    `  ${colorBorderChar(sideBorderLeft)}${emptyContent}${colorBorderChar(sideBorderRight)}`,
+    `  ${colorBorderChar(sideBorderLeft)}${taglineLine}${colorBorderChar(sideBorderRight)}`,
+    `  ${colorBorderChar(sideBorderLeft)}${emptyContent}${colorBorderChar(sideBorderRight)}`,
+    `  ${colorBorder(bottomBorder)}`,
     '',
   ];
   return lines.join('\n');
@@ -193,79 +297,119 @@ export function initCommand(): Command {
     .description('Initialize ArtemisKit in the current directory')
     .option('-f, --force', 'Overwrite existing configuration')
     .option('--skip-env', 'Skip adding environment variables to .env')
-    .action(async (options: { force?: boolean; skipEnv?: boolean }) => {
-      const spinner = createSpinner();
-      try {
-        const cwd = process.cwd();
-        // Show welcome banner
-        console.log(renderWelcomeBanner());
-        // Step 1: Create directories
-        spinner.start('Creating project structure...');
-        await mkdir(join(cwd, 'scenarios'), { recursive: true });
-        await mkdir(join(cwd, 'artemis-runs'), { recursive: true });
-        await mkdir(join(cwd, 'artemis-output'), { recursive: true });
-        spinner.succeed('Created project structure');
-        // Step 2: Write config file
-        const configPath = join(cwd, 'artemis.config.yaml');
-        const configExists = existsSync(configPath);
-        if (configExists && !options.force) {
-          spinner.info('Config file already exists (use --force to overwrite)');
-        } else {
-          spinner.start('Writing configuration...');
-          await writeFile(configPath, DEFAULT_CONFIG);
-          spinner.succeed(
-            configExists ? 'Overwrote artemis.config.yaml' : 'Created artemis.config.yaml'
-          );
-        }
+    .option('-i, --interactive', 'Run interactive setup wizard')
+    .option('-y, --yes', 'Use defaults without prompts (non-interactive)')
+    .action(
+      async (options: {
+        force?: boolean;
+        skipEnv?: boolean;
+        interactive?: boolean;
+        yes?: boolean;
+      }) => {
+        const spinner = createSpinner();
+        try {
+          const cwd = process.cwd();
+          // Show welcome banner
+          console.log(renderWelcomeBanner());
+          // Determine if we should run interactive wizard
+          const shouldRunWizard =
+            options.interactive || (isInteractive() && !options.yes && !options.force);
+          let configContent = DEFAULT_CONFIG;
+          let createExample = true;
+          // Run interactive wizard if applicable
+          if (shouldRunWizard) {
+            try {
+              const wizardResult = await runInitWizard();
+              configContent = generateConfigFromWizard(wizardResult);
+              createExample = wizardResult.createExample;
+              console.log(''); // Add spacing after wizard
+            } catch (wizardError) {
+              // If wizard fails (e.g., user cancels), fall back to defaults
+              if ((wizardError as Error).message?.includes('closed')) {
+                console.log(chalk.yellow('\n  Setup cancelled. Using defaults.\n'));
+              } else {
+                throw wizardError;
+              }
+            }
+          }
-        // Step 3: Write example scenario
-        const scenarioPath = join(cwd, 'scenarios', 'example.yaml');
-        const scenarioExists = existsSync(scenarioPath);
-        if (scenarioExists && !options.force) {
-          spinner.info('Example scenario already exists (use --force to overwrite)');
-        } else {
-          spinner.start('Creating example scenario...');
-          await writeFile(scenarioPath, DEFAULT_SCENARIO);
-          spinner.succeed(
-            scenarioExists ? 'Overwrote scenarios/example.yaml' : 'Created scenarios/example.yaml'
-          );
-        }
+          // Step 1: Create directories
+          spinner.start('Creating project structure...');
+          await mkdir(join(cwd, 'scenarios'), { recursive: true });
+          await mkdir(join(cwd, 'artemis-runs'), { recursive: true });
+          await mkdir(join(cwd, 'artemis-output'), { recursive: true });
+          spinner.succeed('Created project structure');
+          // Step 2: Write config file
+          const configPath = join(cwd, 'artemis.config.yaml');
+          const configExists = existsSync(configPath);
-        // Step 4: Update .env file
-        if (!options.skipEnv) {
-          spinner.start('Updating .env file...');
-          const { added, skipped } = await appendEnvKeys(cwd);
-          if (added.length > 0) {
-            spinner.succeed(`Added ${added.length} environment variable(s) to .env`);
-            if (skipped.length > 0) {
-              console.log(
-                chalk.dim(
-                  `  ${icons.info} Skipped ${skipped.length} existing key(s): ${skipped.join(', ')}`
-                )
+          if (configExists && !options.force) {
+            spinner.info('Config file already exists (use --force to overwrite)');
+          } else {
+            spinner.start('Writing configuration...');
+            await writeFile(configPath, configContent);
+            spinner.succeed(
+              configExists ? 'Overwrote artemis.config.yaml' : 'Created artemis.config.yaml'
+            );
+          }
+          // Step 3: Write example scenario (if requested)
+          if (createExample) {
+            const scenarioPath = join(cwd, 'scenarios', 'example.yaml');
+            const scenarioExists = existsSync(scenarioPath);
+            if (scenarioExists && !options.force) {
+              spinner.info('Example scenario already exists (use --force to overwrite)');
+            } else {
+              spinner.start('Creating example scenario...');
+              await writeFile(scenarioPath, DEFAULT_SCENARIO);
+              spinner.succeed(
+                scenarioExists
+                  ? 'Overwrote scenarios/example.yaml'
+                  : 'Created scenarios/example.yaml'
               );
             }
-          } else if (skipped.length > 0) {
-            spinner.info('All environment variables already exist in .env');
-          } else {
-            spinner.succeed('Created .env with environment variables');
           }
-        }
-        // Show success panel
-        console.log(renderSuccessPanel());
-      } catch (error) {
-        spinner.fail('Error');
-        console.error(chalk.red(`\n${icons.failed} ${(error as Error).message}`));
-        process.exit(1);
+          // Step 4: Update .env file
+          if (!options.skipEnv) {
+            spinner.start('Updating .env file...');
+            const { added, skipped } = await appendEnvKeys(cwd);
+            if (added.length > 0) {
+              spinner.succeed(`Added ${added.length} environment variable(s) to .env`);
+              if (skipped.length > 0) {
+                console.log(
+                  chalk.dim(
+                    `  ${icons.info} Skipped ${skipped.length} existing key(s): ${skipped.join(', ')}`
+                  )
+                );
+              }
+            } else if (skipped.length > 0) {
+              spinner.info('All environment variables already exist in .env');
+            } else {
+              spinner.succeed('Created .env with environment variables');
+            }
+          }
+          // Show success panel
+          console.log(renderSuccessPanel());
+          // Non-blocking update check (fire and forget)
+          checkForUpdateAndNotify();
+        } catch (error) {
+          spinner.fail('Error');
+          console.error(chalk.red(`\n${icons.failed} ${(error as Error).message}`));
+          process.exit(1);
+        }
       }
-    });
+    );
   return cmd;
 }

package/src/commands/redteam.ts CHANGED

@@ -19,14 +19,18 @@ import {
   parseScenarioFile,
 } from '@artemiskit/core';
 import {
+  type ConversationTurn,
   CotInjectionMutation,
+  EncodingMutation,
   InstructionFlipMutation,
+  MultiTurnMutation,
   type Mutation,
   RedTeamGenerator,
   RoleSpoofMutation,
   SeverityMapper,
   TypoMutation,
   UnsafeResponseDetector,
+  loadCustomAttacks,
 } from '@artemiskit/redteam';
 import { generateJSONReport, generateRedTeamHTMLReport } from '@artemiskit/reports';
 import chalk from 'chalk';
@@ -55,6 +59,7 @@ interface RedteamOptions {
   model?: string;
   mutations?: string[];
   count?: number;
+  customAttacks?: string;
   save?: boolean;
   output?: string;
   verbose?: boolean;
@@ -73,9 +78,10 @@ export function redteamCommand(): Command {
     .option('-m, --model <model>', 'Model to use')
     .option(
       '--mutations <mutations...>',
-      'Mutations to apply (typo, role-spoof, instruction-flip, cot-injection)'
+      'Mutations to apply (typo, role-spoof, instruction-flip, cot-injection, encoding, multi-turn)'
     )
     .option('-c, --count <number>', 'Number of mutated prompts per case', '5')
+    .option('--custom-attacks <path>', 'Path to custom attacks YAML file')
     .option('--save', 'Save results to storage')
     .option('-o, --output <dir>', 'Output directory for reports')
     .option('-v, --verbose', 'Verbose output')
@@ -131,7 +137,7 @@ export function redteamCommand(): Command {
         spinner.succeed(`Connected to ${provider}`);
         // Set up mutations
-        const mutations = selectMutations(options.mutations);
+        const mutations = selectMutations(options.mutations, options.customAttacks);
         const generator = new RedTeamGenerator(mutations);
         const detector = new UnsafeResponseDetector();
         const count = Number.parseInt(String(options.count)) || 5;
@@ -179,12 +185,47 @@ export function redteamCommand(): Command {
         for (const testCase of scenario.cases) {
           console.log(chalk.bold(`Testing case: ${testCase.id}`));
-          const originalPrompt =
-            typeof testCase.prompt === 'string'
-              ? testCase.prompt
-              : testCase.prompt.map((m) => m.content).join('\n');
+          // Handle both string and array prompts (consistent with run command)
+          // For array prompts: last user message is the attack target, rest is context
+          let attackPrompt: string;
+          let conversationPrefix: ConversationTurn[] | undefined;
+          if (typeof testCase.prompt === 'string') {
+            // Simple string prompt - use directly
+            attackPrompt = testCase.prompt;
+          } else {
+            // Array prompt - extract last user message as attack, rest as context
+            const messages = testCase.prompt;
+            const lastUserIndex = messages.map((m) => m.role).lastIndexOf('user');
+            if (lastUserIndex === -1) {
+              // No user message found - use concatenated content
+              attackPrompt = messages.map((m) => m.content).join('\n');
+            } else {
+              // Extract attack prompt (last user message)
+              attackPrompt = messages[lastUserIndex].content;
+              // Extract conversation prefix (everything before the last user message)
+              if (lastUserIndex > 0) {
+                conversationPrefix = messages.slice(0, lastUserIndex).map((m) => ({
+                  role: m.role as 'user' | 'assistant' | 'system',
+                  content: m.content,
+                }));
+              }
+            }
+          }
+          // Clear any previous prefix and set new one if applicable
+          for (const mutation of mutations) {
+            if (mutation instanceof MultiTurnMutation) {
+              mutation.clearConversationPrefix();
+              if (conversationPrefix && conversationPrefix.length > 0) {
+                mutation.setConversationPrefix(conversationPrefix);
+              }
+            }
+          }
-          const mutatedPrompts = generator.generate(originalPrompt, count);
+          const mutatedPrompts = generator.generate(attackPrompt, count);
           for (const mutated of mutatedPrompts) {
             completedTests++;
@@ -474,19 +515,31 @@ export function redteamCommand(): Command {
   return cmd;
 }
-function selectMutations(names?: string[]): Mutation[] {
+function selectMutations(names?: string[], customAttacksPath?: string): Mutation[] {
   const allMutations: Record<string, Mutation> = {
     typo: new TypoMutation(),
     'role-spoof': new RoleSpoofMutation(),
     'instruction-flip': new InstructionFlipMutation(),
     'cot-injection': new CotInjectionMutation(),
+    encoding: new EncodingMutation(),
+    'multi-turn': new MultiTurnMutation(),
   };
+  let mutations: Mutation[];
   if (!names || names.length === 0) {
-    return Object.values(allMutations);
+    mutations = Object.values(allMutations);
+  } else {
+    mutations = names.filter((name) => name in allMutations).map((name) => allMutations[name]);
+  }
+  // Load custom attacks if path provided
+  if (customAttacksPath) {
+    const customMutations = loadCustomAttacks(customAttacksPath);
+    mutations.push(...customMutations);
   }
-  return names.filter((name) => name in allMutations).map((name) => allMutations[name]);
+  return mutations;
 }
 /**