npm - @arclabs561/ai-visual-test - Versions diffs - 0.5.1 - Mend

@arclabs561/ai-visual-test 0.5.1

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (93) hide show

package/.secretsignore.example +20 -0
package/CHANGELOG.md +360 -0
package/CONTRIBUTING.md +63 -0
package/DEPLOYMENT.md +80 -0
package/LICENSE +22 -0
package/README.md +142 -0
package/SECURITY.md +108 -0
package/api/health.js +34 -0
package/api/validate.js +252 -0
package/index.d.ts +1221 -0
package/package.json +112 -0
package/public/index.html +149 -0
package/src/batch-optimizer.mjs +451 -0
package/src/bias-detector.mjs +370 -0
package/src/bias-mitigation.mjs +233 -0
package/src/cache.mjs +433 -0
package/src/config.mjs +268 -0
package/src/constants.mjs +80 -0
package/src/context-compressor.mjs +350 -0
package/src/convenience.mjs +617 -0
package/src/cost-tracker.mjs +257 -0
package/src/cross-modal-consistency.mjs +170 -0
package/src/data-extractor.mjs +232 -0
package/src/dynamic-few-shot.mjs +140 -0
package/src/dynamic-prompts.mjs +361 -0
package/src/ensemble/index.mjs +53 -0
package/src/ensemble-judge.mjs +366 -0
package/src/error-handler.mjs +67 -0
package/src/errors.mjs +167 -0
package/src/experience-propagation.mjs +128 -0
package/src/experience-tracer.mjs +487 -0
package/src/explanation-manager.mjs +299 -0
package/src/feedback-aggregator.mjs +248 -0
package/src/game-goal-prompts.mjs +478 -0
package/src/game-player.mjs +548 -0
package/src/hallucination-detector.mjs +155 -0
package/src/helpers/playwright.mjs +80 -0
package/src/human-validation-manager.mjs +516 -0
package/src/index.mjs +364 -0
package/src/judge.mjs +929 -0
package/src/latency-aware-batch-optimizer.mjs +192 -0
package/src/load-env.mjs +159 -0
package/src/logger.mjs +55 -0
package/src/metrics.mjs +187 -0
package/src/model-tier-selector.mjs +221 -0
package/src/multi-modal/index.mjs +36 -0
package/src/multi-modal-fusion.mjs +190 -0
package/src/multi-modal.mjs +524 -0
package/src/natural-language-specs.mjs +1071 -0
package/src/pair-comparison.mjs +277 -0
package/src/persona/index.mjs +42 -0
package/src/persona-enhanced.mjs +200 -0
package/src/persona-experience.mjs +572 -0
package/src/position-counterbalance.mjs +140 -0
package/src/prompt-composer.mjs +375 -0
package/src/render-change-detector.mjs +583 -0
package/src/research-enhanced-validation.mjs +436 -0
package/src/retry.mjs +152 -0
package/src/rubrics.mjs +231 -0
package/src/score-tracker.mjs +277 -0
package/src/smart-validator.mjs +447 -0
package/src/spec-config.mjs +106 -0
package/src/spec-templates.mjs +347 -0
package/src/specs/index.mjs +38 -0
package/src/temporal/index.mjs +102 -0
package/src/temporal-adaptive.mjs +163 -0
package/src/temporal-batch-optimizer.mjs +222 -0
package/src/temporal-constants.mjs +69 -0
package/src/temporal-context.mjs +49 -0
package/src/temporal-decision-manager.mjs +271 -0
package/src/temporal-decision.mjs +669 -0
package/src/temporal-errors.mjs +58 -0
package/src/temporal-note-pruner.mjs +173 -0
package/src/temporal-preprocessor.mjs +543 -0
package/src/temporal-prompt-formatter.mjs +219 -0
package/src/temporal-validation.mjs +159 -0
package/src/temporal.mjs +415 -0
package/src/type-guards.mjs +311 -0
package/src/uncertainty-reducer.mjs +470 -0
package/src/utils/index.mjs +175 -0
package/src/validation-framework.mjs +321 -0
package/src/validation-result-normalizer.mjs +64 -0
package/src/validation.mjs +243 -0
package/src/validators/accessibility-programmatic.mjs +345 -0
package/src/validators/accessibility-validator.mjs +223 -0
package/src/validators/batch-validator.mjs +143 -0
package/src/validators/hybrid-validator.mjs +268 -0
package/src/validators/index.mjs +34 -0
package/src/validators/prompt-builder.mjs +218 -0
package/src/validators/rubric.mjs +85 -0
package/src/validators/state-programmatic.mjs +260 -0
package/src/validators/state-validator.mjs +291 -0
package/vercel.json +27 -0

package/SECURITY.md ADDED Viewed

@@ -0,0 +1,108 @@
+# Security Policy
+## Supported Versions
+| Version | Supported          |
+| ------- | ------------------ |
+| 0.1.x   | :white_check_mark: |
+## Reporting a Vulnerability
+If you discover a security vulnerability, please report it responsibly:
+1. **Email:** security@henrywallace.io
+2. **Include:**
+   - Description of the vulnerability
+   - Steps to reproduce
+   - Potential impact
+   - Suggested fix (if any)
+**Please do not** open a public GitHub issue for security vulnerabilities.
+We will acknowledge receipt within 48 hours and provide an update on the status of the vulnerability within 7 days.
+## Security Best Practices
+### For Package Users
+1. **Always use environment variables** for API keys
+   - Never hardcode secrets in your code
+   - Use `.env` files (not committed to git)
+   - Rotate keys regularly
+2. **Enable secret detection**
+   - Use the provided pre-commit hook
+   - Review `.secretsignore.example` for configuration
+   - Run `node scripts/detect-secrets.mjs --scan-history` periodically
+3. **Validate inputs**
+   - Validate file paths before passing to functions
+   - Sanitize user-provided prompts
+   - Set reasonable size limits on inputs
+4. **Monitor API usage**
+   - Set up rate limiting if using the API
+   - Monitor for unusual patterns
+   - Review error logs regularly
+5. **Keep dependencies updated**
+   - Regularly update `@playwright/test` peer dependency
+   - Run `npm audit` regularly
+   - Review security advisories
+### For Contributors
+1. **Follow secure coding practices**
+   - Never commit secrets
+   - Use the pre-commit hook
+   - Review code for security issues
+2. **Test security features**
+   - Add security-focused tests
+   - Test input validation
+   - Test error handling
+3. **Document security considerations**
+   - Document any security assumptions
+   - Note any known limitations
+   - Update this file for new vulnerabilities
+## Known Security Considerations
+### API Endpoint (`/api/validate`)
+- **Authentication** - Optional API key authentication via `API_KEY` or `VLLM_API_KEY` environment variable
+  - Authentication is enforced by default whenever an API key is configured; set `REQUIRE_AUTH=false` to explicitly disable it
+  - API key can be provided via `X-API-Key` header or `Authorization: Bearer <key>` header
+- **Rate Limiting** - Built-in rate limiting (10 requests/minute by default, configurable via `RATE_LIMIT_MAX_REQUESTS`)
+  - Rate limit headers: `X-RateLimit-Limit`, `X-RateLimit-Remaining`, `X-RateLimit-Reset`
+  - Returns 429 status when limit exceeded
+  - Uses in-memory store (use Redis for production multi-instance deployments)
+- **Error messages** - Sanitized to prevent information leakage
+### File Operations
+- **Path validation** - Always validate file paths before use
+- **Temporary files** - Cleaned up automatically, but ensure proper error handling
+### Environment Variables
+- **No validation** - Environment variables are not validated for you; validate required environment variables at startup
+- **No encryption** - Environment variables are not encrypted; store sensitive values securely
+## Security Features
+- ✅ Pre-commit secret detection (enhanced with red team recommendations)
+- ✅ Git history scanning option
+- ✅ Zero runtime dependencies
+- ✅ Input validation
+- ✅ Error handling with sanitization
+- ✅ Rate limiting (configurable, in-memory or Redis)
+- ✅ Authentication (optional API key)
+- ✅ Path traversal protection
+- ✅ Size limits on all inputs
+## Changelog
+See [CHANGELOG.md](./CHANGELOG.md) for security-related updates.

package/api/health.js ADDED Viewed

@@ -0,0 +1,34 @@
+/**
+ * Health check endpoint
+ *
+ * GET /api/health
+ */
+import { createConfig } from '../src/index.mjs';
+/**
+ * Health check handler (GET /api/health).
+ *
+ * Answers 405 for any method other than GET. Otherwise builds the config via
+ * `createConfig()` and reports its `enabled` and `provider` fields together
+ * with a version string and the current ISO timestamp. Any failure yields a
+ * generic 500 payload.
+ *
+ * NOTE(review): `version` is hard-coded to '0.1.0' while this package is
+ * published as 0.5.1 - confirm whether it should track package.json.
+ *
+ * @param {object} req - Incoming request; only `method` is read.
+ * @param {object} res - Response object exposing chainable `status()` / `json()`.
+ * @returns {Promise<*>} Whatever `res.json()` returns.
+ */
+export default async function handler(req, res) {
+  const isGet = req.method === 'GET';
+  if (!isGet) {
+    return res.status(405).json({ error: 'Method not allowed' });
+  }
+  try {
+    const { enabled, provider } = createConfig();
+    const payload = {
+      status: 'ok',
+      enabled,
+      provider,
+      version: '0.1.0',
+      timestamp: new Date().toISOString()
+    };
+    return res.status(200).json(payload);
+  } catch (error) {
+    // SECURITY: the full error stays in the server log; the client only
+    // ever sees a generic message so internal details are not exposed.
+    console.error('[Health] Error:', error);
+    const failure = {
+      status: 'error',
+      error: 'Health check failed'
+    };
+    return res.status(500).json(failure);
+  }
+}

package/api/validate.js ADDED Viewed

@@ -0,0 +1,252 @@
+/**
+ * Vercel Serverless Function for VLLM Screenshot Validation
+ *
+ * POST /api/validate
+ *
+ * Body:
+ * {
+ *   "image": "data:image/png;base64,<base64 data>" (data URL; png, jpeg, jpg, gif or webp),
+ *   "prompt": "Evaluation prompt",
+ *   "context": { ... }
+ * }
+ *
+ * Returns:
+ * {
+ *   "enabled": boolean,
+ *   "provider": string,
+ *   "score": number|null,
+ *   "issues": string[],
+ *   "assessment": string|null,
+ *   "reasoning": string,
+ *   "estimatedCost": object|null,
+ *   "responseTime": number
+ * }
+ */
+import { validateScreenshot, createConfig, normalizeValidationResult } from '../src/index.mjs';
+import { writeFileSync, unlinkSync } from 'fs';
+import { join } from 'path';
+import { tmpdir } from 'os';
+import { randomBytes, createHash, timingSafeEqual } from 'crypto';
+// Security limits
+const MAX_IMAGE_SIZE = 10 * 1024 * 1024; // 10MB, compared against the length of the encoded `image` string
+const MAX_PROMPT_LENGTH = 5000; // characters
+const MAX_CONTEXT_SIZE = 10000; // characters of JSON-serialized context
+// Rate limiting configuration
+const RATE_LIMIT_WINDOW = 60 * 1000; // 1 minute
+const DEFAULT_RATE_LIMIT_MAX_REQUESTS = 10;
+/**
+ * Parse a positive integer setting.
+ *
+ * A non-numeric value would otherwise become NaN, and every `count >= NaN`
+ * comparison is false, which silently switches the rate limiter off; zero or
+ * negative values are equally unusable as a request budget. All of those fall
+ * back to the default instead.
+ *
+ * @param {string|undefined} raw - Raw setting value (e.g. from process.env).
+ * @param {number} fallback - Value used when `raw` is missing or invalid.
+ * @returns {number} The parsed integer (>= 1) or `fallback`.
+ */
+function parsePositiveInt(raw, fallback) {
+  const parsed = Number.parseInt(raw ?? '', 10);
+  return Number.isInteger(parsed) && parsed >= 1 ? parsed : fallback;
+}
+const RATE_LIMIT_MAX_REQUESTS = parsePositiveInt(
+  process.env.RATE_LIMIT_MAX_REQUESTS,
+  DEFAULT_RATE_LIMIT_MAX_REQUESTS
+);
+const rateLimitStore = new Map(); // In-memory store (use Redis in production)
+// Authentication configuration
+const API_KEY = process.env.API_KEY || process.env.VLLM_API_KEY || null;
+// Default to requiring auth if API key is set (more secure)
+// Set REQUIRE_AUTH=false explicitly to disable
+const REQUIRE_AUTH = process.env.REQUIRE_AUTH !== 'false' && API_KEY !== null;
+/**
+ * Sliding-window rate limiter backed by the in-memory `rateLimitStore`.
+ *
+ * Each call first prunes timestamps older than the window for every stored
+ * identifier (dropping identifiers that end up empty), then decides whether
+ * the given identifier may make another request. An allowed request is
+ * recorded immediately.
+ * For production, use Redis or a dedicated rate limiting service.
+ *
+ * @param {string} identifier - Key identifying the client.
+ * @returns {{allowed: boolean, remaining: number, resetAt: number}}
+ *   `resetAt` is an epoch-millisecond timestamp.
+ */
+function checkRateLimit(identifier) {
+  const now = Date.now();
+  const cutoff = now - RATE_LIMIT_WINDOW;
+  const isLive = (stamp) => stamp > cutoff;
+  // Sweep the whole store so stale clients do not accumulate
+  for (const [clientKey, stamps] of rateLimitStore.entries()) {
+    const live = stamps.filter(isLive);
+    if (live.length > 0) {
+      rateLimitStore.set(clientKey, live);
+    } else {
+      rateLimitStore.delete(clientKey);
+    }
+  }
+  // Requests made by this identifier inside the current window
+  const active = (rateLimitStore.get(identifier) || []).filter(isLive);
+  const withinBudget = !(active.length >= RATE_LIMIT_MAX_REQUESTS);
+  if (withinBudget) {
+    // Record the current request before reporting the remaining budget
+    active.push(now);
+    rateLimitStore.set(identifier, active);
+    return {
+      allowed: true,
+      remaining: RATE_LIMIT_MAX_REQUESTS - active.length,
+      resetAt: now + RATE_LIMIT_WINDOW
+    };
+  }
+  // Over budget: a slot frees up once the oldest recorded request expires
+  return {
+    allowed: false,
+    remaining: 0,
+    resetAt: Math.min(...active) + RATE_LIMIT_WINDOW
+  };
+}
+/**
+ * Get client identifier for rate limiting.
+ *
+ * The client IP is taken from the first `x-forwarded-for` hop, then
+ * `x-real-ip`, then the socket address, falling back to 'unknown'.
+ *
+ * The API key from the request headers is used as the identifier only when
+ * authentication is enforced (`REQUIRE_AUTH`). The handler authenticates the
+ * request before calling this function, so in that mode the key is known to
+ * be valid. When authentication is not enforced the header value is
+ * unverified, and keying on it would let a caller obtain a fresh rate-limit
+ * bucket simply by sending a different header value on every request.
+ *
+ * @param {object} req - Incoming request (`headers`, optional `socket`).
+ * @returns {string} Identifier used as the rate-limit bucket key.
+ */
+function getClientIdentifier(req) {
+  // Try to get IP from various headers (Vercel, Cloudflare, etc.)
+  const forwarded = req.headers['x-forwarded-for'];
+  const realIp = req.headers['x-real-ip'];
+  // Guard the type so an unexpected non-string header cannot throw, and trim
+  // the first hop so "1.2.3.4" and " 1.2.3.4" share one bucket
+  const forwardedIp = typeof forwarded === 'string' ? forwarded.split(',')[0].trim() : '';
+  const ip = forwardedIp || realIp || req.socket?.remoteAddress || 'unknown';
+  if (!REQUIRE_AUTH) {
+    return ip;
+  }
+  // Authenticated mode: the key was verified upstream (more accurate than IP)
+  const apiKey = req.headers['x-api-key'] || req.headers['authorization']?.replace('Bearer ', '');
+  return apiKey || ip;
+}
+/**
+ * Check authentication.
+ *
+ * When authentication is not enforced (`REQUIRE_AUTH` is false or no
+ * `API_KEY` is configured) every request is treated as authenticated.
+ * Otherwise the key must be supplied via the `X-API-Key` header or an
+ * `Authorization: Bearer <key>` header and must match `API_KEY`.
+ *
+ * @param {object} req - Incoming request; only `headers` is read.
+ * @returns {{authenticated: boolean, error?: string}} `error` is set only on failure.
+ */
+function checkAuth(req) {
+  if (!REQUIRE_AUTH || !API_KEY) {
+    return { authenticated: true };
+  }
+  // SECURITY: Only accept API key from headers, not request body
+  // API keys in request bodies are logged, visible in dev tools, and stored in history
+  const headerKey = req.headers['x-api-key'];
+  const authorization = req.headers['authorization'];
+  // The auth scheme name is case-insensitive; strip it only at the start of the value
+  const bearerKey = typeof authorization === 'string'
+    ? authorization.replace(/^Bearer\s+/i, '')
+    : undefined;
+  const providedKey = headerKey || bearerKey;
+  if (!providedKey) {
+    return { authenticated: false, error: 'Authentication required. Provide API key via X-API-Key header or Authorization: Bearer <key>' };
+  }
+  // SECURITY: compare in constant time so response timing does not reveal how
+  // much of the key matched. Hashing first gives timingSafeEqual the
+  // equal-length buffers it requires, whatever the length of the input.
+  const digest = (value) => createHash('sha256').update(String(value)).digest();
+  if (!timingSafeEqual(digest(providedKey), digest(API_KEY))) {
+    return { authenticated: false, error: 'Invalid API key' };
+  }
+  return { authenticated: true };
+}
+/**
+ * POST /api/validate handler.
+ *
+ * Flow: method check -> authentication -> rate limiting -> input validation
+ * -> decode the data-URL image to a temporary file -> `validateScreenshot`
+ * -> normalized JSON response. The temporary file is always removed.
+ *
+ * Responses: 405 (wrong method), 401 (auth failure), 429 (rate limited),
+ * 400 (invalid input), 200 (normalized validation result), 500 (any other
+ * failure, with a sanitized message).
+ *
+ * @param {object} req - Incoming request (`method`, `headers`, `body`).
+ * @param {object} res - Response object exposing `setHeader()`, `status()`, `json()`.
+ * @returns {Promise<*>} Whatever `res.json()` returns.
+ */
+export default async function handler(req, res) {
+  // Only allow POST
+  if (req.method !== 'POST') {
+    return res.status(405).json({ error: 'Method not allowed' });
+  }
+  // Check authentication
+  const authResult = checkAuth(req);
+  if (!authResult.authenticated) {
+    return res.status(401).json({ error: authResult.error });
+  }
+  // Check rate limit
+  const clientId = getClientIdentifier(req);
+  const rateLimit = checkRateLimit(clientId);
+  // Rate limit headers go on every response from here on
+  // (`remaining` is already 0 when the request is rejected)
+  res.setHeader('X-RateLimit-Limit', RATE_LIMIT_MAX_REQUESTS);
+  res.setHeader('X-RateLimit-Remaining', rateLimit.remaining);
+  res.setHeader('X-RateLimit-Reset', new Date(rateLimit.resetAt).toISOString());
+  if (!rateLimit.allowed) {
+    const retryAfter = Math.ceil((rateLimit.resetAt - Date.now()) / 1000);
+    // Standard header so generic HTTP clients can back off without parsing the body
+    res.setHeader('Retry-After', Math.max(retryAfter, 0));
+    return res.status(429).json({
+      error: 'Rate limit exceeded',
+      retryAfter
+    });
+  }
+  try {
+    // A missing or unparsed body must be a client error (400), not a crash (500)
+    const body = req.body;
+    if (body === null || typeof body !== 'object') {
+      return res.status(400).json({ error: 'Invalid request body. Expected a JSON object' });
+    }
+    const { image, prompt } = body;
+    // Treat an absent or null context as empty
+    const context = body.context ?? {};
+    // Validate input presence
+    if (!image) {
+      return res.status(400).json({ error: 'Missing image (base64 encoded)' });
+    }
+    if (!prompt) {
+      return res.status(400).json({ error: 'Missing prompt' });
+    }
+    // Validate input size
+    if (typeof image !== 'string' || image.length > MAX_IMAGE_SIZE) {
+      return res.status(400).json({ error: 'Image too large or invalid format' });
+    }
+    if (typeof prompt !== 'string' || prompt.length > MAX_PROMPT_LENGTH) {
+      return res.status(400).json({ error: 'Prompt too long' });
+    }
+    // A non-object context (e.g. a long string) would otherwise skip the size limit
+    if (typeof context !== 'object') {
+      return res.status(400).json({ error: 'Context must be an object' });
+    }
+    if (JSON.stringify(context).length > MAX_CONTEXT_SIZE) {
+      return res.status(400).json({ error: 'Context too large' });
+    }
+    // Decode base64 image
+    // SECURITY: Whitelist specific MIME types to prevent unexpected formats
+    const dataUrlPrefix = /^data:image\/(?:png|jpeg|jpg|gif|webp);base64,/;
+    if (!dataUrlPrefix.test(image)) {
+      return res.status(400).json({ error: 'Invalid image MIME type. Supported: image/png, image/jpeg, image/jpg, image/gif, image/webp' });
+    }
+    // Buffer.from() does not throw on malformed base64; it silently skips what
+    // it cannot decode. An empty result means there was no usable image data.
+    const imageBuffer = Buffer.from(image.replace(dataUrlPrefix, ''), 'base64');
+    if (imageBuffer.length === 0) {
+      return res.status(400).json({ error: 'Invalid base64 image' });
+    }
+    // Additional validation: check decoded buffer size matches expected
+    // Base64 encoding increases size by ~33%, so decoded should be smaller
+    const expectedMaxDecoded = Math.floor(MAX_IMAGE_SIZE * 0.75); // Conservative estimate
+    if (imageBuffer.length > expectedMaxDecoded) {
+      return res.status(400).json({ error: 'Decoded image exceeds maximum size' });
+    }
+    // Save to temporary file with secure random name (prevents race conditions and information disclosure)
+    // SECURITY: Use cryptographically secure random suffix to prevent collisions
+    // NOTE(review): the file is always named .png, even for JPEG/GIF/WebP payloads -
+    // confirm validateScreenshot does not infer the image type from the extension.
+    const randomSuffix = randomBytes(16).toString('hex');
+    const tempPath = join(tmpdir(), `vllm-validate-${randomSuffix}.png`);
+    let result;
+    try {
+      // RESOURCE PROTECTION: this write is bounded by the rate limit above,
+      // the size limits, and the serverless timeout.
+      // Owner-only permissions: the screenshot may contain sensitive content.
+      writeFileSync(tempPath, imageBuffer, { mode: 0o600 });
+      // Validate screenshot
+      result = await validateScreenshot(tempPath, prompt, context);
+    } finally {
+      // Clean up temp file on success and on error alike. Cleanup is best
+      // effort: a failed unlink must not turn a successful validation into a 500.
+      try {
+        unlinkSync(tempPath);
+      } catch (cleanupError) {
+        if (cleanupError?.code !== 'ENOENT') {
+          console.warn('[VLLM API] Failed to remove temp file:', cleanupError);
+        }
+      }
+    }
+    // Normalize result structure before returning (ensures consistent API response)
+    const normalizedResult = normalizeValidationResult(result, 'api/validate');
+    // Return normalized result
+    return res.status(200).json(normalizedResult);
+  } catch (error) {
+    // Log full error for debugging (server-side only)
+    console.error('[VLLM API] Error:', error);
+    // Return sanitized error to client (don't leak internal details)
+    // Never expose: file paths, API keys, internal structure, stack traces
+    const sanitizedError = error instanceof Error
+      ? 'Validation failed. Please check your input and try again.'
+      : 'Validation failed';
+    return res.status(500).json({
+      error: sanitizedError
+    });
+  }
+}