Load Testing and Performance Benchmarking Guide

Load testing validates that your application handles expected (and unexpected) traffic levels. Without it, you're hoping your system works—with it, you know.

Types of Performance Testing

Load Testing:
- Expected traffic levels
- Verify system meets requirements
- Find bottlenecks at expected load

Stress Testing:
- Beyond normal capacity
- Find system limits
- Observe failure modes

Spike Testing:
- Sudden traffic bursts
- Flash sale scenarios
- Viral content handling

Soak Testing:
- Extended duration
- Memory leaks
- Resource exhaustion

Load Testing Tools

k6 (Recommended)

// k6 script: load-test.js
import http from 'k6/http';
import { check, sleep } from 'k6';

// Load profile as [duration, target VUs] pairs:
// ramp to 100 users, hold, ramp to 200 users, hold, then ramp down.
const RAMP = '2m';
const HOLD = '5m';
const loadProfile = [
  [RAMP, 100],
  [HOLD, 100],
  [RAMP, 200],
  [HOLD, 200],
  [RAMP, 0],
];

// Pass/fail criteria for the run.
const passCriteria = {
  http_req_duration: ['p(95)<500'], // 95th percentile latency below 500 ms
  http_req_failed: ['rate<0.01'],   // fewer than 1% failed requests
};

export const options = {
  stages: loadProfile.map(([duration, target]) => ({ duration, target })),
  thresholds: passCriteria,
};

/**
 * Default k6 entry point: requests the product list, records two checks on
 * the response (HTTP 200 and a duration below 500 ms), then pauses for one
 * second before the next iteration.
 */
export default function () {
  const productsUrl = 'https://api.example.com/products';
  const response = http.get(productsUrl);

  const expectations = {
    'status is 200': (r) => r.status === 200,
    'response time < 500ms': (r) => r.timings.duration < 500,
  };
  check(response, expectations);

  sleep(1); // pacing between iterations
}

Artillery

# artillery.yml
config:
  target: "https://api.example.com"
  # Phases run one after another. Per the Artillery docs, duration is in
  # seconds and arrivalRate is the number of new virtual users per second.
  phases:
    - { name: "Warm up", duration: 120, arrivalRate: 10 }
    - { name: "Sustained load", duration: 300, arrivalRate: 50 }
    - { name: "Spike", duration: 60, arrivalRate: 100 }

scenarios:
  # Weights are relative: roughly 70% of virtual users run this flow
  # and 30% run "Search".
  - name: "Browse and purchase"
    weight: 70
    flow:
      - get: { url: "/products" }
      - think: 2
      - get: { url: "/products/{{ $randomNumber(1, 100) }}" }
      - think: 3
      # NOTE(review): productId is drawn independently of the product viewed
      # above, so the two ids usually differ - confirm this is intended.
      - post:
          url: "/cart"
          json: { productId: "{{ $randomNumber(1, 100) }}", quantity: 1 }

  - name: "Search"
    weight: 30
    flow:
      - get: { url: "/search?q={{ $randomString(5) }}" }

Autocannon (Node.js)

const autocannon = require('autocannon');

/**
 * Runs a 30-second autocannon benchmark against the local users endpoint
 * and prints the formatted result summary to stdout.
 *
 * @returns {Promise<void>} resolves once the summary has been printed;
 *   rejects if autocannon fails.
 */
async function runBenchmark() {
  const result = await autocannon({
    url: 'http://localhost:3000/api/users',
    connections: 100, // concurrent connections
    duration: 30,     // seconds
    pipelining: 10,   // pipelined requests per connection
    headers: {
      'Authorization': 'Bearer token',
    },
  });

  console.log(autocannon.printResult(result));
}

// Report failures explicitly and signal them through the exit code instead of
// leaving the returned promise unhandled.
runBenchmark().catch((err) => {
  console.error('Benchmark failed:', err);
  process.exitCode = 1;
});

Realistic Load Patterns

User Journey Simulation

// k6: Simulate real user behavior
import http from 'k6/http';
import { group, sleep } from 'k6';

const SITE = 'https://example.com';

// Pauses for a random think time in the range [min, min + spread) seconds.
const think = (min, spread) => sleep(min + Math.random() * spread);

// Sends `payload` as a JSON body to `path` on the site under test.
const postJson = (path, payload) =>
  http.post(`${SITE}${path}`, JSON.stringify(payload), {
    headers: { 'Content-Type': 'application/json' },
  });

/**
 * One simulated shopper session: homepage, product browsing, add to cart and
 * checkout, with randomized pauses between the steps. Each stage is wrapped
 * in its own k6 group.
 */
export default function () {
  group('Homepage', () => {
    http.get(`${SITE}/`);
    think(2, 3); // 2-5 seconds think time
  });

  group('Browse products', () => {
    http.get(`${SITE}/products`);
    think(1, 2);

    http.get(`${SITE}/products/123`);
    think(3, 5);
  });

  group('Add to cart', () => {
    postJson('/cart', { productId: '123', quantity: 1 });
    sleep(1);
  });

  group('Checkout', () => {
    http.get(`${SITE}/checkout`);
    think(5, 10); // Filling form

    postJson('/orders', { paymentMethod: 'card' });
  });
}

Traffic Distribution

// Different endpoints have different traffic
// Builds a ten-minute constant-VU scenario. `exec` is the name of the
// function the scenario runs; the script is expected to export a function
// under that name.
const steadyScenario = (vus, exec) => ({
  executor: 'constant-vus',
  vus,
  duration: '10m',
  exec,
});

// 100 virtual users in total, split 80 / 15 / 5 across the three traffic types.
export const options = {
  scenarios: {
    browse: steadyScenario(80, 'browseScenario'),
    purchase: steadyScenario(15, 'purchaseScenario'),
    admin: steadyScenario(5, 'adminScenario'),
  },
};

Measuring Results

Key Metrics

Response Time:
- Average: Overall performance (can hide slow outliers)
- p50 (median): Typical user experience
- p95: 95% of requests are at least this fast
- p99: Tail latency; only 1% of requests are slower
- Max: Absolute worst case

Throughput:
- Requests per second (RPS)
- Transactions per second (TPS)
- Data transferred per second

Errors:
- Error rate percentage
- Error types distribution
- Errors under load vs normal

Resources:
- CPU utilization
- Memory usage
- Network I/O
- Database connections

Setting Targets

// Define acceptable thresholds
// Response time targets
const latencyTargets = [
  'p(50)<200',   // median under 200 ms
  'p(95)<500',   // 95th percentile under 500 ms
  'p(99)<1000',  // 99th percentile under 1 s
];

// Error rate target: fewer than 1% failed requests
const errorRateTargets = ['rate<0.01'];

// Throughput target: more than 100 requests per second
const throughputTargets = ['rate>100'];

export const options = {
  thresholds: {
    http_req_duration: latencyTargets,
    http_req_failed: errorRateTargets,
    http_reqs: throughputTargets,

    // Custom metrics
    // NOTE(review): nothing in this snippet registers a metric with this name.
    // k6 is expected to reject a threshold on an unknown metric, so the script
    // presumably also needs e.g. `new Trend('my_custom_metric')` from
    // 'k6/metrics' - confirm.
    my_custom_metric: ['avg<100'],
  },
};

Database Load Testing

// Test database queries under load
import sql from 'k6/x/sql';

// Database handle opened once in the init stage and reused by every iteration.
const db = sql.open('postgres', 'postgres://user:pass@localhost/db');

/**
 * Closes the database handle when the test run ends so connections are not
 * left open on the server.
 */
export function teardown() {
  db.close();
}

/**
 * One iteration: reads the 100 most recent orders of the last 7 days, then
 * inserts a single `page_view` event for a random user id below 10000.
 */
export default function () {
  // Read-heavy scenario (the rows are fetched but not inspected)
  sql.query(db, `
    SELECT * FROM orders
    WHERE created_at > NOW() - INTERVAL '7 days'
    ORDER BY created_at DESC
    LIMIT 100
  `);

  // Write scenario: `exec` is used because the statement returns no rows.
  // Bind values are passed as separate arguments, one per placeholder;
  // wrapping them in an array would supply a single value for $1 and none for $2.
  const userId = Math.floor(Math.random() * 10000);
  db.exec(`
    INSERT INTO events (user_id, event_type, created_at)
    VALUES ($1, $2, NOW())
  `, userId, 'page_view');
}

CI/CD Integration

# .github/workflows/load-test.yml
name: Load Test

on:
  push:
    branches: [main]
  schedule:
    - cron: '0 2 * * *'  # Daily at 02:00 UTC

jobs:
  load-test:
    runs-on: ubuntu-latest
    steps:
      - uses: actions/checkout@v4

      - name: Setup k6
        uses: grafana/setup-k6-action@v1

      # k6 exits with a non-zero status when any threshold defined in
      # load-test.js fails, so this step fails the job by itself. No separate
      # check step is needed: results.json holds line-delimited metric samples,
      # not a threshold summary, so searching it for threshold results would
      # never match.
      - name: Run load test
        run: k6 run --out json=results.json load-test.js

      # Always upload, so the raw results are available for failed runs too.
      - name: Upload results
        if: always()
        uses: actions/upload-artifact@v4
        with:
          name: load-test-results
          path: results.json

Analyzing Results

Finding Bottlenecks

Symptoms → Likely Causes

High CPU:
- Inefficient algorithms
- Missing caching
- Synchronous operations

High Memory:
- Memory leaks
- Large object retention
- Missing cleanup

High Latency:
- Database queries
- External API calls
- Network issues

High Error Rate:
- Resource exhaustion
- Timeout misconfigurations
- Connection pool limits

Performance Profiling

// Add profiling to identify slow code
const { performance } = require('perf_hooks');

async function profiledEndpoint(req, res) {
  const marks = {};

  marks.start = performance.now();

  // Database query
  marks.dbStart = performance.now();
  const data = await db.query('SELECT * FROM users');
  marks.dbEnd = performance.now();

  // Processing
  marks.processStart = performance.now();
  const processed = processData(data);
  marks.processEnd = performance.now();

  // Response
  marks.end = performance.now();

  // Log timings
  console.log({
    total: marks.end - marks.start,
    database: marks.dbEnd - marks.dbStart,
    processing: marks.processEnd - marks.processStart,
  });

  res.json(processed);
}

Optimization Strategies

Quick Wins

// 1. Add caching
/** Resolved values by key. Entries are never evicted, so the map grows with the key space. */
const cache = new Map<string, Data>();

/** Fetches currently in progress, so concurrent misses for one key share a single call. */
const inFlight = new Map<string, Promise<Data>>();

/**
 * Returns the data for `key`, fetching it at most once.
 *
 * Concurrent callers that miss the cache for the same key all wait on the
 * same `fetchData` call instead of each starting their own, which matters
 * most under load. A failed fetch is not cached: the rejection is passed to
 * every waiting caller and the next call retries.
 *
 * @param key lookup key passed through to `fetchData`
 * @returns the cached or freshly fetched value
 * @throws whatever `fetchData` rejects with
 */
async function getCachedData(key: string): Promise<Data> {
  // `has` rather than a truthiness test, so cached falsy values still count as hits.
  if (cache.has(key)) return cache.get(key) as Data;

  let pending = inFlight.get(key);
  if (pending === undefined) {
    pending = fetchData(key)
      .then((data) => {
        cache.set(key, data);
        return data;
      })
      .finally(() => {
        // Runs on success and failure alike, so a rejected fetch can be retried.
        inFlight.delete(key);
      });
    inFlight.set(key, pending);
  }
  return pending;
}

// 2. Connection pooling
// Pool settings, named separately from construction so they are easy to tune.
// NOTE(review): `Pool` is presumably node-postgres (`pg`); if so, `max` caps
// the number of pooled clients and both timeouts are in milliseconds - confirm.
const poolSettings = {
  max: 20,
  idleTimeoutMillis: 30000,
  connectionTimeoutMillis: 2000,
};

const pool = new Pool(poolSettings);

// 3. Batch operations
/**
 * Loads all users whose id is in `ids` with a single query instead of one
 * query per id.
 *
 * @param ids user ids to look up
 * @returns the matching users; an empty array when `ids` is empty
 */
async function getUsersOptimized(ids: string[]): Promise<User[]> {
  // Nothing to look up: skip the database round trip entirely.
  if (ids.length === 0) return [];

  // Instead of N queries, do 1
  return db.users.findMany({ where: { id: { in: ids } } });
}

// 4. Async where possible
// Creates the order and responds as soon as it exists; the confirmation email
// and analytics update run in the background and do not delay the response.
app.post('/order', async (req, res, next) => {
  try {
    const order = await createOrder(req.body);

    // Don't wait for these: failures are logged and never affect the response.
    // `void` marks the promises as intentionally not awaited.
    void sendConfirmationEmail(order).catch(console.error);
    void updateAnalytics(order).catch(console.error);

    res.json(order);
  } catch (err) {
    // Hand the failure to the framework's error handling instead of leaving
    // the rejection unhandled and the request without a response.
    next(err);
  }
});

Load testing is essential for production confidence. Test regularly, set realistic thresholds, and integrate load tests into your CI/CD pipeline. The goal isn't just finding limits—it's understanding your system's behavior under stress.

Remember: test in an environment as close to production as possible. Load test results are only as good as the environment they're run in.