npm - agentic-qe - Versions diffs - 2.0.0 → 2.1.0 - Mend

agentic-qe 2.0.0 → 2.1.0

This diff shows the changes between two publicly available versions of a package, as released to one of the supported registries. It is provided for informational purposes only and reflects the package contents exactly as they appear in the public registry.

Files changed (116)

package/.claude/agents/qx-partner.md +17 -4
package/.claude/skills/accessibility-testing/SKILL.md +144 -692
package/.claude/skills/agentic-quality-engineering/SKILL.md +176 -529
package/.claude/skills/api-testing-patterns/SKILL.md +180 -560
package/.claude/skills/brutal-honesty-review/SKILL.md +113 -603
package/.claude/skills/bug-reporting-excellence/SKILL.md +116 -517
package/.claude/skills/chaos-engineering-resilience/SKILL.md +127 -72
package/.claude/skills/cicd-pipeline-qe-orchestrator/SKILL.md +209 -404
package/.claude/skills/code-review-quality/SKILL.md +158 -608
package/.claude/skills/compatibility-testing/SKILL.md +148 -38
package/.claude/skills/compliance-testing/SKILL.md +132 -63
package/.claude/skills/consultancy-practices/SKILL.md +114 -446
package/.claude/skills/context-driven-testing/SKILL.md +117 -381
package/.claude/skills/contract-testing/SKILL.md +176 -141
package/.claude/skills/database-testing/SKILL.md +137 -130
package/.claude/skills/exploratory-testing-advanced/SKILL.md +160 -629
package/.claude/skills/holistic-testing-pact/SKILL.md +140 -188
package/.claude/skills/localization-testing/SKILL.md +145 -33
package/.claude/skills/mobile-testing/SKILL.md +132 -448
package/.claude/skills/mutation-testing/SKILL.md +147 -41
package/.claude/skills/performance-testing/SKILL.md +200 -546
package/.claude/skills/quality-metrics/SKILL.md +164 -519
package/.claude/skills/refactoring-patterns/SKILL.md +132 -699
package/.claude/skills/regression-testing/SKILL.md +120 -926
package/.claude/skills/risk-based-testing/SKILL.md +157 -660
package/.claude/skills/security-testing/SKILL.md +199 -538
package/.claude/skills/sherlock-review/SKILL.md +163 -699
package/.claude/skills/shift-left-testing/SKILL.md +161 -465
package/.claude/skills/shift-right-testing/SKILL.md +161 -519
package/.claude/skills/six-thinking-hats/SKILL.md +175 -1110
package/.claude/skills/skills-manifest.json +71 -20
package/.claude/skills/tdd-london-chicago/SKILL.md +131 -448
package/.claude/skills/technical-writing/SKILL.md +103 -154
package/.claude/skills/test-automation-strategy/SKILL.md +166 -772
package/.claude/skills/test-data-management/SKILL.md +126 -910
package/.claude/skills/test-design-techniques/SKILL.md +179 -89
package/.claude/skills/test-environment-management/SKILL.md +136 -91
package/.claude/skills/test-reporting-analytics/SKILL.md +169 -92
package/.claude/skills/testability-scoring/SKILL.md +172 -538
package/.claude/skills/testability-scoring/scripts/generate-html-report.js +0 -0
package/.claude/skills/visual-testing-advanced/SKILL.md +155 -78
package/.claude/skills/xp-practices/SKILL.md +151 -587
package/CHANGELOG.md +48 -0
package/README.md +23 -16
package/dist/agents/QXPartnerAgent.d.ts +8 -1
package/dist/agents/QXPartnerAgent.d.ts.map +1 -1
package/dist/agents/QXPartnerAgent.js +1174 -112
package/dist/agents/QXPartnerAgent.js.map +1 -1
package/dist/agents/lifecycle/AgentLifecycleManager.d.ts.map +1 -1
package/dist/agents/lifecycle/AgentLifecycleManager.js +34 -31
package/dist/agents/lifecycle/AgentLifecycleManager.js.map +1 -1
package/dist/cli/commands/init-claude-md-template.d.ts.map +1 -1
package/dist/cli/commands/init-claude-md-template.js +14 -0
package/dist/cli/commands/init-claude-md-template.js.map +1 -1
package/dist/core/SwarmCoordinator.d.ts +180 -0
package/dist/core/SwarmCoordinator.d.ts.map +1 -0
package/dist/core/SwarmCoordinator.js +473 -0
package/dist/core/SwarmCoordinator.js.map +1 -0
package/dist/core/metrics/MetricsAggregator.d.ts +228 -0
package/dist/core/metrics/MetricsAggregator.d.ts.map +1 -0
package/dist/core/metrics/MetricsAggregator.js +482 -0
package/dist/core/metrics/MetricsAggregator.js.map +1 -0
package/dist/core/metrics/index.d.ts +5 -0
package/dist/core/metrics/index.d.ts.map +1 -0
package/dist/core/metrics/index.js +11 -0
package/dist/core/metrics/index.js.map +1 -0
package/dist/core/optimization/SwarmOptimizer.d.ts +5 -0
package/dist/core/optimization/SwarmOptimizer.d.ts.map +1 -1
package/dist/core/optimization/SwarmOptimizer.js +17 -0
package/dist/core/optimization/SwarmOptimizer.js.map +1 -1
package/dist/core/orchestration/AdaptiveScheduler.d.ts +190 -0
package/dist/core/orchestration/AdaptiveScheduler.d.ts.map +1 -0
package/dist/core/orchestration/AdaptiveScheduler.js +460 -0
package/dist/core/orchestration/AdaptiveScheduler.js.map +1 -0
package/dist/core/orchestration/WorkflowOrchestrator.d.ts +13 -0
package/dist/core/orchestration/WorkflowOrchestrator.d.ts.map +1 -1
package/dist/core/orchestration/WorkflowOrchestrator.js +32 -0
package/dist/core/orchestration/WorkflowOrchestrator.js.map +1 -1
package/dist/core/recovery/CircuitBreaker.d.ts +176 -0
package/dist/core/recovery/CircuitBreaker.d.ts.map +1 -0
package/dist/core/recovery/CircuitBreaker.js +382 -0
package/dist/core/recovery/CircuitBreaker.js.map +1 -0
package/dist/core/recovery/RecoveryOrchestrator.d.ts +186 -0
package/dist/core/recovery/RecoveryOrchestrator.d.ts.map +1 -0
package/dist/core/recovery/RecoveryOrchestrator.js +476 -0
package/dist/core/recovery/RecoveryOrchestrator.js.map +1 -0
package/dist/core/recovery/RetryStrategy.d.ts +127 -0
package/dist/core/recovery/RetryStrategy.d.ts.map +1 -0
package/dist/core/recovery/RetryStrategy.js +314 -0
package/dist/core/recovery/RetryStrategy.js.map +1 -0
package/dist/core/recovery/index.d.ts +8 -0
package/dist/core/recovery/index.d.ts.map +1 -0
package/dist/core/recovery/index.js +27 -0
package/dist/core/recovery/index.js.map +1 -0
package/dist/core/skills/DependencyResolver.d.ts +99 -0
package/dist/core/skills/DependencyResolver.d.ts.map +1 -0
package/dist/core/skills/DependencyResolver.js +260 -0
package/dist/core/skills/DependencyResolver.js.map +1 -0
package/dist/core/skills/ManifestGenerator.d.ts +114 -0
package/dist/core/skills/ManifestGenerator.d.ts.map +1 -0
package/dist/core/skills/ManifestGenerator.js +449 -0
package/dist/core/skills/ManifestGenerator.js.map +1 -0
package/dist/core/skills/index.d.ts +9 -0
package/dist/core/skills/index.d.ts.map +1 -0
package/dist/core/skills/index.js +24 -0
package/dist/core/skills/index.js.map +1 -0
package/dist/mcp/server.d.ts +9 -9
package/dist/mcp/server.d.ts.map +1 -1
package/dist/mcp/server.js +1 -2
package/dist/mcp/server.js.map +1 -1
package/dist/types/qx.d.ts +39 -7
package/dist/types/qx.d.ts.map +1 -1
package/dist/types/qx.js.map +1 -1
package/dist/visualization/api/RestEndpoints.js +1 -1
package/dist/visualization/api/RestEndpoints.js.map +1 -1
package/package.json +13 -55

package/.claude/skills/performance-testing/SKILL.md (changed)

@@ -1,297 +1,149 @@
 ---
 name: performance-testing
-description: Test application performance, scalability, and resilience. Use when planning load testing, stress testing, or optimizing system performance.
+description: "Test application performance, scalability, and resilience. Use when planning load testing, stress testing, or optimizing system performance."
+category: specialized-testing
+priority: high
+tokenEstimate: 1100
+agents: [qe-performance-tester, qe-quality-analyzer, qe-production-intelligence]
+implementation_status: optimized
+optimization_version: 1.0
+last_optimized: 2025-12-02
+dependencies: []
+quick_reference_card: true
+tags: [performance, load-testing, stress-testing, scalability, k6, bottlenecks]
 ---
 # Performance Testing
-## Core Principle
+<default_to_action>
+When testing performance or planning load tests:
+1. DEFINE SLOs: p95 response time, throughput, error rate targets
+2. IDENTIFY critical paths: revenue flows, high-traffic pages, key APIs
+3. CREATE realistic scenarios: user journeys, think time, varied data
+4. EXECUTE with monitoring: CPU, memory, DB queries, network
+5. ANALYZE bottlenecks and fix before production
+**Quick Test Type Selection:**
+- Expected load validation → Load testing
+- Find breaking point → Stress testing
+- Sudden traffic spike → Spike testing
+- Memory leaks, resource exhaustion → Endurance/soak testing
+- Horizontal/vertical scaling → Scalability testing
+**Critical Success Factors:**
+- Performance is a feature, not an afterthought
+- Test early and often, not just before release
+- Focus on user-impacting bottlenecks
+</default_to_action>
+## Quick Reference Card
+### When to Use
+- Before major releases
+- After infrastructure changes
+- Before scaling events (Black Friday)
+- When setting SLAs/SLOs
+### Test Types
+| Type | Purpose | When |
+|------|---------|------|
+| **Load** | Expected traffic | Every release |
+| **Stress** | Beyond capacity | Quarterly |
+| **Spike** | Sudden surge | Before events |
+| **Endurance** | Memory leaks | After code changes |
+| **Scalability** | Scaling validation | Infrastructure changes |
-**Performance is a feature, not an afterthought.**
-Test performance like you test functionality: continuously, automatically, and with clear acceptance criteria.
-## Why Performance Testing Matters
-### User Impact
-- 100ms delay = 1% drop in conversions (Amazon)
-- 53% of mobile users abandon sites taking > 3 seconds (Google)
-- Slow = Broken (in users' eyes)
-### Business Impact
-- Lost revenue from abandoned transactions
-- Increased infrastructure costs
-- Degraded user experience
-- Reputation damage
-### Technical Impact
-- Scalability limits
-- Infrastructure bottlenecks
-- Hidden architectural problems
-## Types of Performance Testing
-### 1. Load Testing
-**What**: System behavior under expected load
-**Goal**: Verify the system handles typical usage
-**Example**:
-- E-commerce site handling 1,000 concurrent users
-- API serving 10,000 requests/minute
-- Database processing 500 transactions/second
-**When**: Before every major release
-**Tools**: k6, JMeter, Gatling, Artillery
-### 2. Stress Testing
-**What**: System behavior under extreme load (beyond capacity)
-**Goal**: Find breaking point, see how system fails
-**Example**:
-- Ramping up from 1,000 to 10,000 concurrent users
-- Pushing API until response time degrades
-- Filling database until queries slow
-**When**: Before scaling infrastructure, quarterly at minimum
-**What to look for**: Graceful degradation, not catastrophic failure
-### 3. Spike Testing
-**What**: System behavior under sudden load increase
-**Goal**: Test auto-scaling, handling unexpected traffic
-**Example**:
-- Black Friday sale announcement
-- Viral social media post
-- Marketing campaign launch
-**When**: Before major events, after infrastructure changes
-**Pattern**: Instant ramp from normal to 5-10x load
-### 4. Endurance/Soak Testing
-**What**: System behavior over extended time
-**Goal**: Find memory leaks, resource exhaustion, gradual degradation
-**Example**:
-- Run at normal load for 24-72 hours
-- Monitor memory, connections, file handles
-- Check for resource leaks
-**When**: After significant code changes, quarterly
-**What to look for**: Stable resource usage over time
-### 5. Scalability Testing
-**What**: How system performs as load increases
-**Goal**: Validate horizontal/vertical scaling
-**Example**:
-- Add servers, measure throughput improvement
-- Test auto-scaling triggers
-- Find scaling limits
-**When**: Before capacity planning, infrastructure changes
-## Performance Testing Strategy
-### Start with Requirements
-**Bad**: "The system should be fast"
-**Good**: "95th percentile response time < 200ms under 1,000 concurrent users"
-**Define SLOs (Service Level Objectives)**:
-- **Response Time**: 95th percentile < 200ms
-- **Throughput**: 10,000 requests/minute minimum
-- **Error Rate**: < 0.1% under load
-- **Resource Usage**: CPU < 70%, Memory < 80%
-### Identify Critical Paths
-Don't test everything equally. Focus on:
-- Revenue-generating flows (checkout, payment)
-- High-traffic pages (homepage, product pages)
-- Critical APIs (authentication, data access)
-- Resource-intensive operations (search, reports)
-### Realistic Scenarios
-**Bad**: Every user hits homepage repeatedly
-**Good**:
-- 40% browse products
-- 30% search
-- 20% view product details
-- 10% checkout
-Include:
-- Think time (users don't click instantly)
-- Varied data (different products, users, queries)
-- Realistic workflows (browse → search → add to cart → checkout)
-## Setting Up Performance Tests
-### Test Environment
-**Ideal**: Production-like infrastructure
-- Same server specs
-- Same database size
-- Same network topology
-- Same third-party integrations (or mocks)
+### Key Metrics
+| Metric | Target | Why |
+|--------|--------|-----|
+| p95 response | < 200ms | User experience |
+| Throughput | 10k req/min | Capacity |
+| Error rate | < 0.1% | Reliability |
+| CPU | < 70% | Headroom |
+| Memory | < 80% | Stability |
+### Tools
+- **k6**: Modern, JS-based, CI/CD friendly
+- **JMeter**: Enterprise, feature-rich
+- **Artillery**: Simple YAML configs
+- **Gatling**: Scala, great reporting
+### Agent Coordination
+- `qe-performance-tester`: Load test orchestration
+- `qe-quality-analyzer`: Results analysis
+- `qe-production-intelligence`: Production comparison
-**Reality**: Often scaled-down version
-- Document differences
-- Extrapolate results carefully
-- Validate with production monitoring
+---
-### Test Data
+## Defining SLOs
-**Requirements**:
-- Realistic volume (don't test with 100 users when you have 10M)
-- Varied data (avoid cache hits skewing results)
-- Production-like distribution (80/20 rule applies)
+**Bad:** "The system should be fast"
+**Good:** "p95 response time < 200ms under 1,000 concurrent users"
-**Example**:
-```
-Products: 100,000 (matching production)
-Users: 50,000 test accounts
-Orders: 1M historical orders
-Search queries: Real query distribution
+```javascript
+export const options = {
+  thresholds: {
+    http_req_duration: ['p(95)<200'],  // 95% < 200ms
+    http_req_failed: ['rate<0.01'],     // < 1% failures
+  },
+};
 ```
-### Monitoring During Tests
+---
-**Essential metrics**:
-- Response time (avg, 50th, 95th, 99th percentile)
-- Throughput (requests/second)
-- Error rate
-- CPU, memory, disk I/O
-- Database query time
-- Network latency
+## Realistic Scenarios
-**Tools**:
-- Application: New Relic, Datadog, Dynatrace
-- Infrastructure: Prometheus, Grafana
-- Database: Query analyzers, slow query logs
+**Bad:** Every user hits homepage repeatedly
+**Good:** Model actual user behavior
-## Common Performance Bottlenecks
+```javascript
+// Realistic distribution
+// 40% browse, 30% search, 20% details, 10% checkout
+export default function () {
+  const action = Math.random();
+  if (action < 0.4) browse();
+  else if (action < 0.7) search();
+  else if (action < 0.9) viewProduct();
+  else checkout();
-### 1. Database
+  sleep(randomInt(1, 5)); // Think time
+}
+```
-**Symptoms**:
-- Slow queries under load
-- Connection pool exhaustion
-- Lock contention
+---
-**Solutions**:
-- Add indexes on filtered columns
-- Optimize N+1 queries
-- Increase connection pool size
-- Add read replicas
-- Implement caching
+## Common Bottlenecks
-### 2. N+1 Queries
+### Database
+**Symptoms:** Slow queries under load, connection pool exhaustion
+**Fixes:** Add indexes, optimize N+1 queries, increase pool size, read replicas
-**Problem**:
+### N+1 Queries
 ```javascript
-// Load 100 orders
+// BAD: 100 orders = 101 queries
 const orders = await Order.findAll();
-// For each order, load customer (100 queries!)
 for (const order of orders) {
   const customer = await Customer.findById(order.customerId);
 }
-```
-**Fix**:
-```javascript
-// Load orders with customers in one query
-const orders = await Order.findAll({
-  include: [Customer]
-});
+// GOOD: 1 query
+const orders = await Order.findAll({ include: [Customer] });
 ```
-### 3. Synchronous Processing
-**Problem**: Blocking operations in request path
-**Example**: Sending email during checkout
-**Fix**:
-- Use message queues (RabbitMQ, SQS)
-- Process asynchronously
-- Return response immediately
-### 4. Memory Leaks
+### Synchronous Processing
+**Problem:** Blocking operations in request path (sending email during checkout)
+**Fix:** Use message queues, process async, return immediately
-**Symptoms**:
-- Memory usage grows over time
-- Performance degrades gradually
-- Eventually crashes
+### Memory Leaks
+**Detection:** Endurance testing, memory profiling
+**Common causes:** Event listeners not cleaned, caches without eviction
-**Detection**:
-- Endurance testing
-- Memory profiling (heap dumps)
-- Monitor garbage collection
+### External Dependencies
+**Solutions:** Aggressive timeouts, circuit breakers, caching, graceful degradation
-**Common causes**:
-- Event listeners not cleaned up
-- Caches without eviction
-- Circular references
-- Global state accumulation
-### 5. Inadequate Caching
-**Problem**: Recalculating same results repeatedly
-**Strategy**:
-- Cache expensive operations
-- Use CDN for static assets
-- Implement application-level caching (Redis)
-- Browser caching (Cache-Control headers)
-**Balance**: Cache hit rate vs. memory usage
-### 6. External Dependencies
-**Problem**: Third-party APIs slow or unavailable
-**Solutions**:
-- Set aggressive timeouts
-- Implement circuit breakers
-- Cache responses when possible
-- Degrade gracefully if unavailable
-## Performance Testing in CI/CD
-### Continuous Performance Testing
-**Approach 1: Smoke Tests**
-- Run small load test on every commit
-- 10 concurrent users for 1 minute
-- Catch major regressions quickly
-**Approach 2: Nightly Tests**
-- Full load test overnight
-- More comprehensive scenarios
-- Trend analysis over time
-**Approach 3: Pre-Production Gate**
-- Load test before production deploy
-- Automated pass/fail criteria
-- Block deployment if performance degrades
+---
-### Example: k6 in CI/CD
+## k6 CI/CD Example
 ```javascript
 // performance-test.js
@@ -301,275 +153,76 @@ import { check, sleep } from 'k6';
 export const options = {
   stages: [
     { duration: '1m', target: 50 },   // Ramp up
-    { duration: '3m', target: 50 },   // Stay at 50 users
+    { duration: '3m', target: 50 },   // Steady
     { duration: '1m', target: 0 },    // Ramp down
   ],
   thresholds: {
-    http_req_duration: ['p(95)<200'],  // 95% of requests < 200ms
-    http_req_failed: ['rate<0.01'],    // < 1% failures
+    http_req_duration: ['p(95)<200'],
+    http_req_failed: ['rate<0.01'],
   },
 };
 export default function () {
   const res = http.get('https://api.example.com/products');
   check(res, {
     'status is 200': (r) => r.status === 200,
     'response time < 200ms': (r) => r.timings.duration < 200,
   });
   sleep(1);
 }
 ```
 ```yaml
-# .github/workflows/performance.yml
-name: Performance Tests
-on:
-  pull_request:
-    branches: [main]
-jobs:
-  performance:
-    runs-on: ubuntu-latest
-    steps:
-      - uses: actions/checkout@v2
-      - name: Run k6 test
-        uses: grafana/k6-action@v0.3.0
-        with:
-          filename: performance-test.js
-      - name: Upload results
-        uses: actions/upload-artifact@v2
-        with:
-          name: k6-results
-          path: results.json
+# GitHub Actions
+- name: Run k6 test
+  uses: grafana/k6-action@v0.3.0
+  with:
+    filename: performance-test.js
 ```
-## Analyzing Performance Test Results
-### Key Metrics
-**Response Time Distribution**:
-- **Average**: Misleading (outliers skew it)
-- **Median (50th percentile)**: Typical user experience
-- **95th percentile**: "Slow but acceptable"
-- **99th percentile**: Worst user experience
-**Throughput**:
-- Requests/second sustained
-- How it changes with load
-- Where it plateaus (capacity)
-**Error Rate**:
-- Should stay flat as load increases
-- Spike indicates breaking point
+---
-### Interpreting Results
+## Analyzing Results
-**Good**:
+### Good Results
 ```
-Load: 1,000 users
-Response time p95: 180ms
-Throughput: 5,000 req/s
-Error rate: 0.05%
-CPU: 65%, Memory: 70%
+Load: 1,000 users | p95: 180ms | Throughput: 5,000 req/s
+Error rate: 0.05% | CPU: 65% | Memory: 70%
 ```
-**Problems**:
+### Problems
 ```
-Load: 1,000 users
-Response time p95: 3,500ms ❌ (too slow)
-Throughput: 500 req/s ❌ (way below target)
-Error rate: 5% ❌ (too many errors)
-CPU: 95%, Memory: 90% ❌ (maxed out)
+Load: 1,000 users | p95: 3,500ms ❌ | Throughput: 500 req/s ❌
+Error rate: 5% ❌ | CPU: 95% ❌ | Memory: 90% ❌
 ```
 ### Root Cause Analysis
+1. Correlate metrics: When response time spikes, what changes?
+2. Check logs: Errors, warnings, slow queries
+3. Profile code: Where is time spent?
+4. Monitor resources: CPU, memory, disk
+5. Trace requests: End-to-end flow
-1. **Correlate metrics**: When response time spikes, what else changes?
-2. **Check logs**: Errors, warnings, slow queries
-3. **Profile code**: Where is time spent?
-4. **Monitor resources**: CPU, memory, network, disk
-5. **Trace requests**: End-to-end request flow
-## Production Performance Monitoring
-### Synthetic Monitoring
-**What**: Automated tests hitting production
-**Example**:
-- Every 5 minutes, test critical flows
-- Measure response time from multiple locations
-- Alert if degradation detected
-**Tools**: Pingdom, Datadog Synthetics, New Relic Synthetics
-### Real User Monitoring (RUM)
-**What**: Measure actual user experience
-**Metrics**:
-- Page load time
-- Time to interactive
-- API response times
-- Error rates
-**Tools**: Google Analytics, New Relic Browser, Datadog RUM
-### Alerting
-**Set alerts on**:
-- p95 response time > threshold
-- Error rate > 1%
-- Throughput drops suddenly
-- Queue depth growing
-**Don't alert on**:
-- Average response time (too noisy)
-- Single slow request (outliers happen)
-## Performance Testing Anti-Patterns
-### ❌ Testing Too Late
-**Problem**: Find performance issues in production
-**Fix**: Test early and often, catch issues before release
-### ❌ Unrealistic Scenarios
-**Problem**: Test doesn't match real usage
-**Example**: All users hitting same endpoint simultaneously
-**Fix**: Model realistic user journeys, think time, data distribution
-### ❌ Ignoring Ramp-Up
-**Problem**: 0 to 1,000 users instantly
-**Real world**: Traffic grows gradually (usually)
-**Fix**: Ramp up over time, see how system adapts
-### ❌ Testing Without Monitoring
-**Problem**: Can't see what's happening during test
-**Fix**: Monitor everything during tests
-### ❌ No Baseline
-**Problem**: Don't know if results are good or bad
-**Fix**: Establish baseline, track trends over time
-### ❌ One-Time Testing
-**Problem**: Test once before launch, never again
-**Fix**: Continuous performance testing, trend monitoring
-## Tools Overview
-### Load Testing Tools
-**k6**: Modern, developer-friendly, JavaScript-based
-- Good for: CI/CD integration, API testing
-- Learning curve: Low
-**JMeter**: Mature, feature-rich, GUI-based
-- Good for: Complex scenarios, extensive protocols
-- Learning curve: Medium
-**Gatling**: Scala-based, great reporting
-- Good for: High load, detailed metrics
-- Learning curve: Medium
-**Artillery**: Node.js, simple YAML configs
-- Good for: Quick tests, simple scenarios
-- Learning curve: Very low
-**Locust**: Python-based, distributed testing
-- Good for: Custom user behavior, Python ecosystems
-- Learning curve: Low-Medium
-### APM (Application Performance Monitoring)
-- **New Relic**: Comprehensive, expensive
-- **Datadog**: Infrastructure + APM combined
-- **Dynatrace**: AI-powered root cause analysis
-- **AppDynamics**: Enterprise-focused
-### Database Profiling
-- **pg_stat_statements** (PostgreSQL)
-- **MySQL slow query log**
-- **MongoDB profiler**
-- **Redis SLOWLOG**
-## Real-World Example
-### Scenario: E-Commerce Checkout Slow
-**Problem**: Checkout taking 5+ seconds under load
-**Investigation**:
-1. Load test: Reproduce issue
-2. Monitor: Database CPU at 95%
-3. Profile: Slow query on order creation
-4. Root cause: Missing index on `orders.user_id`
-**Fix**:
-```sql
-CREATE INDEX idx_orders_user_id ON orders(user_id);
-```
-**Result**:
-- Checkout time: 5s → 300ms
-- Database CPU: 95% → 40%
-- Throughput: 5x improvement
-## When NOT to Performance Test
-- **MVPs/Prototypes**: Focus on validating idea first
-- **Internal tools**: With < 10 users, performance rarely matters
-- **One-time scripts**: Not worth the effort
-- **Before optimization**: Profile first, optimize second, then test
-## Checklist: Before Going to Production
-- [ ] Load test passed (expected traffic)
-- [ ] Stress test passed (2-3x expected traffic)
-- [ ] Spike test passed (sudden traffic surge)
-- [ ] Endurance test passed (24+ hours)
-- [ ] Database indexes in place
-- [ ] Caching configured
-- [ ] Monitoring and alerting set up
-- [ ] Auto-scaling configured (if applicable)
-- [ ] Performance baseline established
+---
-## Remember
+## Anti-Patterns
-**Performance is a feature**: Test it like functionality
-**Test continuously**: Not just before launch
-**Monitor production**: Synthetic + real user monitoring
-**Set realistic goals**: Based on business requirements
-**Fix what matters**: Focus on user-impacting bottlenecks
-**Trend over time**: Performance degrades gradually, catch it early
+| ❌ Anti-Pattern | ✅ Better |
+|----------------|-----------|
+| Testing too late | Test early and often |
+| Unrealistic scenarios | Model real user behavior |
+| 0 to 1,000 users instantly | Ramp up gradually |
+| No monitoring during tests | Monitor everything |
+| No baseline | Establish and track trends |
+| One-time testing | Continuous performance testing |
-## Using with QE Agents
+---
-### Automated Performance Testing
+## Agent-Assisted Performance Testing
-**qe-performance-tester** orchestrates load testing:
 ```typescript
-// Agent runs comprehensive load test
-const perfTest = await agent.runLoadTest({
+// Comprehensive load test
+const perfTest = await Task("Load Test", {
   target: 'https://api.example.com',
   scenarios: {
     checkout: { vus: 100, duration: '5m' },
@@ -578,57 +231,47 @@ const perfTest = await agent.runLoadTest({
   },
   thresholds: {
     'http_req_duration': ['p(95)<200'],
-    'http_req_failed': ['rate<0.01'],
-    'http_reqs': ['rate>100']
+    'http_req_failed': ['rate<0.01']
   }
-});
-// Returns detailed performance report
-```
+}, "qe-performance-tester");
-### Bottleneck Analysis
-```typescript
-// Agent identifies performance bottlenecks
-const analysis = await qe-performance-tester.analyzeBottlenecks({
+// Bottleneck analysis
+await Task("Analyze Bottlenecks", {
   testResults: perfTest,
-  metrics: ['cpu', 'memory', 'db_queries', 'network', 'cache_hits']
-});
-// Returns:
-// {
-//   bottlenecks: [
-//     { component: 'database', severity: 'high', suggestion: 'Add index on orders.created_at' },
-//     { component: 'api', severity: 'medium', suggestion: 'Enable response caching' }
-//   ]
-// }
-```
+  metrics: ['cpu', 'memory', 'db_queries', 'network']
+}, "qe-performance-tester");
-### Continuous Performance Monitoring
-```typescript
-// Agent integrates performance testing in CI/CD
-const ciPerformance = await qe-performance-tester.ciIntegration({
-  mode: 'smoke',  // Quick test on every commit
+// CI integration
+await Task("CI Performance Gate", {
+  mode: 'smoke',
   duration: '1m',
   vus: 10,
-  failOn: {
-    'p95_response_time': 300,  // ms
-    'error_rate': 0.01         // 1%
-  }
-});
+  failOn: { 'p95_response_time': 300, 'error_rate': 0.01 }
+}, "qe-performance-tester");
 ```
-### Fleet Coordination for Performance
+---
+## Agent Coordination Hints
+### Memory Namespace
+```
+aqe/performance/
+├── results/*       - Test execution results
+├── baselines/*     - Performance baselines
+├── bottlenecks/*   - Identified bottlenecks
+└── trends/*        - Historical trends
+```
+### Fleet Coordination
 ```typescript
-const performanceFleet = await FleetManager.coordinate({
+const perfFleet = await FleetManager.coordinate({
   strategy: 'performance-testing',
   agents: [
-    'qe-performance-tester',       // Run load tests
-    'qe-quality-analyzer',         // Analyze results
-    'qe-production-intelligence',  // Compare to production
-    'qe-deployment-readiness'      // Go/no-go decision
+    'qe-performance-tester',
+    'qe-quality-analyzer',
+    'qe-production-intelligence',
+    'qe-deployment-readiness'
   ],
   topology: 'sequential'
 });
@@ -636,21 +279,32 @@ const performanceFleet = await FleetManager.coordinate({
 ---
-## Related Skills
+## Pre-Production Checklist
+- [ ] Load test passed (expected traffic)
+- [ ] Stress test passed (2-3x expected)
+- [ ] Spike test passed (sudden surge)
+- [ ] Endurance test passed (24+ hours)
+- [ ] Database indexes in place
+- [ ] Caching configured
+- [ ] Monitoring and alerting set up
+- [ ] Performance baseline established
-**Testing:**
+---
+## Related Skills
 - [agentic-quality-engineering](../agentic-quality-engineering/) - Agent coordination
-- [api-testing-patterns](../api-testing-patterns/) - API performance testing
+- [api-testing-patterns](../api-testing-patterns/) - API performance
+- [chaos-engineering-resilience](../chaos-engineering-resilience/) - Resilience testing
-**Quality:**
-- [quality-metrics](../quality-metrics/) - Performance metrics tracking
-- [risk-based-testing](../risk-based-testing/) - Performance risk assessment
+---
-## Resources
+## Remember
-- **k6 Documentation**: k6.io/docs
-- **Google Web Fundamentals**: Performance optimization guides
-- **"Release It!"** by Michael Nygard: Production-ready patterns
-- **High Performance Browser Networking** by Ilya Grigorik
+**Performance is a feature:** Test it like functionality
+**Test continuously:** Not just before launch
+**Monitor production:** Synthetic + real user monitoring
+**Fix what matters:** Focus on user-impacting bottlenecks
+**Trend over time:** Catch degradation early
-Performance testing isn't optional—it's how you ensure your system works when it matters most.
+**With Agents:** Agents automate load testing, analyze bottlenecks, and compare with production. Use agents to maintain performance at scale.