API Rate Limiting: Protecting Your Services

Rate limiting protects your API from abuse and ensures fair usage. This guide covers algorithms, implementation patterns, and best practices.

Why Rate Limiting?

Prevent abuse: Stop malicious actors from overwhelming your service
Ensure fairness: Distribute resources fairly among users
Protect infrastructure: Prevent cascading failures
Cost control: Limit expensive operations

Rate Limiting Algorithms

Fixed Window

Simple, but a client can send up to twice the limit in a short burst that straddles a window boundary:

/**
 * In-memory fixed-window rate limiter.
 *
 * Each key gets a counter that starts when a request arrives for a key with
 * no live window, and is replaced once `windowMs` milliseconds have passed.
 * At most `limit` requests are admitted per window.
 *
 * An entry is only replaced when the same key is seen again, so the map holds
 * one entry per distinct key for the lifetime of the instance.
 */
class FixedWindowRateLimiter {
  private windows: Map<string, { count: number; resetAt: number }> = new Map();

  /**
   * @param limit Maximum number of requests admitted per window.
   * @param windowMs Window length in milliseconds.
   */
  constructor(private limit: number, private windowMs: number) {}

  /**
   * Records a request for `key` and reports whether it fits in the current window.
   *
   * @param key Identifier of the client being limited.
   * @returns `true` if the request is admitted, `false` if the window is full.
   */
  isAllowed(key: string): boolean {
    const now = Date.now();
    let window = this.windows.get(key);

    // Unknown key or expired window: start a fresh, empty window.
    if (!window || now >= window.resetAt) {
      window = { count: 0, resetAt: now + this.windowMs };
      this.windows.set(key, window);
    }

    // The first request of a window goes through the same check as every
    // later one, so a limit of 0 (or less) admits nothing.
    if (window.count < this.limit) {
      window.count++;
      return true;
    }

    return false;
  }
}

Sliding Window Log

More accurate, but memory-intensive because it stores a timestamp for every admitted request:

/**
 * In-memory sliding-window-log rate limiter.
 *
 * Keeps the timestamp of every admitted request per key and admits a new
 * request only while fewer than `limit` timestamps fall inside the last
 * `windowMs` milliseconds.
 */
class SlidingWindowLogRateLimiter {
  private requests: Map<string, number[]> = new Map();

  /**
   * @param limit Maximum number of requests admitted within any window.
   * @param windowMs Window length in milliseconds.
   */
  constructor(private limit: number, private windowMs: number) {}

  /**
   * Records a request for `key` if it fits inside the sliding window.
   *
   * @param key Identifier of the client being limited.
   * @returns `true` if the request is admitted, `false` otherwise.
   */
  isAllowed(key: string): boolean {
    const now = Date.now();
    const cutoff = now - this.windowMs;

    // Keep only the timestamps strictly newer than the start of the window.
    const recent: number[] = [];
    for (const stamp of this.requests.get(key) ?? []) {
      if (stamp > cutoff) {
        recent.push(stamp);
      }
    }

    const hasRoom = recent.length < this.limit;
    if (!hasRoom) {
      // Denied requests leave the stored log untouched.
      return false;
    }

    recent.push(now);
    this.requests.set(key, recent);
    return true;
  }
}

Sliding Window Counter

Hybrid approach: approximates a sliding window from the current and previous fixed-window counters, so it stores only a few numbers per key:

/**
 * In-memory sliding-window-counter rate limiter.
 *
 * Time is divided into fixed windows of `windowMs` milliseconds. For each key
 * the limiter keeps the request count of the current window and of the one
 * before it, and estimates the sliding-window load by weighting the previous
 * count by the share of the current window that has not elapsed yet.
 */
class SlidingWindowCounterRateLimiter {
  private windows: Map<string, {
    current: number;
    previous: number;
    currentStart: number;
  }> = new Map();

  /**
   * @param limit Upper bound for the weighted request estimate.
   * @param windowMs Window length in milliseconds.
   */
  constructor(private limit: number, private windowMs: number) {}

  /**
   * Records a request for `key` if the weighted estimate is below the limit.
   *
   * @param key Identifier of the client being limited.
   * @returns `true` if the request is admitted, `false` otherwise.
   */
  isAllowed(key: string): boolean {
    const now = Date.now();
    const slot = Math.floor(now / this.windowMs);

    const existing = this.windows.get(key);
    let state: { current: number; previous: number; currentStart: number };

    if (existing === undefined || existing.currentStart < slot - 1) {
      // Unknown key, or more than one full window of silence: start clean.
      state = { current: 0, previous: 0, currentStart: slot };
      this.windows.set(key, state);
    } else {
      state = existing;
      if (state.currentStart < slot) {
        // Moved into the next window: the current count becomes the previous one.
        state.previous = state.current;
        state.current = 0;
        state.currentStart = slot;
      }
    }

    // Fraction of the current window that has already passed (0 inclusive to 1 exclusive).
    const fraction = (now % this.windowMs) / this.windowMs;
    const estimate = state.current + state.previous * (1 - fraction);

    const hasRoom = estimate < this.limit;
    if (!hasRoom) {
      return false;
    }

    state.current += 1;
    return true;
  }
}

Token Bucket

Allows bursts while maintaining average rate:

/**
 * In-memory token-bucket rate limiter.
 *
 * Every key owns a bucket that starts full (`capacity` tokens) and is topped
 * up at `refillRate` tokens per second, never exceeding `capacity`. A request
 * is admitted when the bucket holds at least as many tokens as it costs.
 */
class TokenBucketRateLimiter {
  private buckets: Map<string, { tokens: number; lastRefill: number }> = new Map();

  /**
   * @param capacity Maximum number of tokens a bucket can hold (the burst size).
   * @param refillRate Tokens added per second.
   */
  constructor(
    private capacity: number,
    private refillRate: number, // tokens per second
  ) {}

  /**
   * Tries to take `tokens` tokens from the bucket belonging to `key`.
   *
   * @param key Identifier of the client being limited.
   * @param tokens Cost of the request; defaults to 1. A cost larger than
   *   `capacity` can never be satisfied.
   * @returns `true` if the tokens were taken, `false` if the bucket is too empty.
   */
  isAllowed(key: string, tokens: number = 1): boolean {
    const now = Date.now();
    let bucket = this.buckets.get(key);

    if (!bucket) {
      bucket = { tokens: this.capacity, lastRefill: now };
      this.buckets.set(key, bucket);
    }

    // Date.now() is wall-clock time and may step backwards (e.g. after a clock
    // adjustment). Clamp at zero so a backwards step cannot drain the bucket.
    const elapsedSeconds = Math.max(0, now - bucket.lastRefill) / 1000;
    bucket.tokens = Math.min(
      this.capacity,
      bucket.tokens + elapsedSeconds * this.refillRate
    );
    bucket.lastRefill = now;

    if (bucket.tokens >= tokens) {
      bucket.tokens -= tokens;
      return true;
    }

    return false;
  }
}

Redis Implementation

Distributed rate limiting with Redis:

import Redis from 'ioredis';

/**
 * Fixed-window rate limiter backed by Redis.
 *
 * Each key gets one Redis counter per window, named
 * `ratelimit:<key>:<window index>`, where the window index is
 * `floor(now / windowMs)`. The counter is incremented on every call and its
 * TTL is set to `windowMs` on every call.
 */
class RedisRateLimiter {
  /**
   * @param redis ioredis client used to run the commands.
   * @param limit Maximum number of requests admitted per window. Public and
   *   read-only so callers can report it (e.g. in an `X-RateLimit-Limit` header).
   * @param windowMs Window length in milliseconds.
   */
  constructor(
    private redis: Redis,
    public readonly limit: number,
    private windowMs: number
  ) {}

  /**
   * Counts a request for `key` in the current window.
   *
   * @param key Identifier of the client being limited.
   * @returns `allowed` — whether the request is within the limit;
   *   `remaining` — requests left in this window (never negative);
   *   `resetAt` — epoch milliseconds at which the next window starts.
   * @throws Error if the transaction yields no result, the `INCR` command
   *   fails, or its reply is not a finite number.
   */
  async isAllowed(key: string): Promise<{ allowed: boolean; remaining: number; resetAt: number }> {
    const now = Date.now();
    const windowIndex = Math.floor(now / this.windowMs);
    const windowKey = `ratelimit:${key}:${windowIndex}`;

    const results = await this.redis
      .multi()
      .incr(windowKey)
      .pexpire(windowKey, this.windowMs)
      .exec();

    // exec() resolves to one [error, reply] pair per queued command, or to
    // null when the transaction did not run. Fail loudly instead of turning a
    // missing count into NaN.
    const incrReply = results?.[0];
    if (!incrReply) {
      throw new Error('Rate limiter: Redis transaction returned no result');
    }
    const [incrError, rawCount] = incrReply;
    if (incrError) {
      throw incrError;
    }
    const count = Number(rawCount);
    if (!Number.isFinite(count)) {
      throw new Error('Rate limiter: unexpected reply from Redis INCR');
    }

    const allowed = count <= this.limit;
    const remaining = Math.max(0, this.limit - count);
    const resetAt = (windowIndex + 1) * this.windowMs;

    return { allowed, remaining, resetAt };
  }
}

// Sliding window with Redis sorted sets
/**
 * Sliding-window-log rate limiter backed by a Redis sorted set.
 *
 * Every admitted request is stored as a member of the sorted set
 * `ratelimit:sliding:<key>`, scored with its timestamp in milliseconds.
 * Trimming expired members, counting the rest and adding the new member all
 * happen inside one Lua script, which Redis executes atomically, so
 * concurrent callers cannot both pass the check and exceed the limit.
 */
class RedisSlidingWindowLimiter {
  /**
   * KEYS[1] = sorted-set key
   * ARGV[1] = current time (ms), ARGV[2] = window length (ms),
   * ARGV[3] = limit, ARGV[4] = unique member for this request.
   * Returns 1 when the request was recorded, 0 when it was rejected.
   */
  private static readonly ADMIT_SCRIPT = `
local now = tonumber(ARGV[1])
local window = tonumber(ARGV[2])
local limit = tonumber(ARGV[3])
redis.call('ZREMRANGEBYSCORE', KEYS[1], 0, now - window)
if redis.call('ZCARD', KEYS[1]) < limit then
  redis.call('ZADD', KEYS[1], now, ARGV[4])
  redis.call('PEXPIRE', KEYS[1], window)
  return 1
end
return 0
`;

  /**
   * @param redis ioredis client used to run the script.
   * @param limit Maximum number of requests admitted within any window.
   * @param windowMs Window length in milliseconds.
   */
  constructor(
    private redis: Redis,
    private limit: number,
    private windowMs: number
  ) {}

  /**
   * Records a request for `key` if it fits inside the sliding window.
   *
   * @param key Identifier of the client being limited.
   * @returns `true` if the request is admitted, `false` otherwise.
   */
  async isAllowed(key: string): Promise<boolean> {
    const now = Date.now();
    const setKey = `ratelimit:sliding:${key}`;
    // The random suffix keeps members unique when several requests share a millisecond.
    const member = `${now}-${Math.random()}`;

    const reply = await this.redis.eval(
      RedisSlidingWindowLimiter.ADMIT_SCRIPT,
      1,
      setKey,
      now,
      this.windowMs,
      this.limit,
      member
    );

    return Number(reply) === 1;
  }
}

Express Middleware

import { Request, Response, NextFunction } from 'express';

/**
 * Builds an Express middleware that rate-limits requests per client address.
 *
 * The limiter is expected to expose a `limit` property and an
 * `isAllowed(key)` method resolving to `{ allowed, remaining, resetAt }`,
 * with `resetAt` in epoch milliseconds.
 *
 * Every response carries `X-RateLimit-Limit`, `X-RateLimit-Remaining` and
 * `X-RateLimit-Reset`. Rejected requests get status 429 with a `Retry-After`
 * header (seconds) and a JSON body carrying the same value as `retryAfter`.
 *
 * @param limiter Limiter consulted for every request.
 * @returns An async Express request handler.
 */
function rateLimitMiddleware(limiter: RateLimiter) {
  return async (req: Request, res: Response, next: NextFunction) => {
    try {
      // `x-forwarded-for` may be absent, a single string, or an array of
      // strings; its first comma-separated entry is the original client.
      // NOTE(review): the header is client-controlled. Prefer configuring
      // Express "trust proxy" so that `req.ip` is authoritative.
      const forwarded = req.headers['x-forwarded-for'];
      const forwardedFor = Array.isArray(forwarded) ? forwarded[0] : forwarded;
      const key = req.ip || forwardedFor?.split(',')[0]?.trim() || 'unknown';

      const result = await limiter.isAllowed(key);

      // Set rate limit headers
      res.set({
        'X-RateLimit-Limit': limiter.limit.toString(),
        'X-RateLimit-Remaining': result.remaining.toString(),
        'X-RateLimit-Reset': result.resetAt.toString(),
      });

      if (!result.allowed) {
        // Clamp at zero: the window may have rolled over while we were waiting.
        const retryAfter = Math.max(0, Math.ceil((result.resetAt - Date.now()) / 1000));
        res.set('Retry-After', retryAfter.toString());
        res.status(429).json({
          error: 'Too Many Requests',
          retryAfter,
        });
        return;
      }

      next();
    } catch (err) {
      // Hand limiter failures to Express' error handling instead of leaving
      // the promise rejection unhandled and the request hanging.
      next(err);
    }
  };
}

// Usage
// Shared limiter for every route under /api: 100 requests per minute.
const apiRateLimiter = new RedisRateLimiter(redis, 100, 60000);

app.use('/api', rateLimitMiddleware(apiRateLimiter));

Tiered Rate Limits

Different limits for different users:

/** Request quotas attached to a subscription plan. */
interface RateLimitTier {
  /** Display name of the tier. */
  name: string;
  /** Maximum number of requests per one-minute window. */
  requestsPerMinute: number;
  /** Maximum number of requests per 24-hour window. */
  requestsPerDay: number;
}

/**
 * Quotas for each plan, keyed by plan identifier.
 * `free` doubles as the fallback when a user's plan has no entry here.
 */
const tiers: Record<string, RateLimitTier> = {
  free: { name: 'Free', requestsPerMinute: 10, requestsPerDay: 1000 },
  pro: { name: 'Pro', requestsPerMinute: 100, requestsPerDay: 50000 },
  enterprise: { name: 'Enterprise', requestsPerMinute: 1000, requestsPerDay: 1000000 },
};

/**
 * Looks up the rate-limit tier for a user.
 *
 * Falls back to the free tier when the user record is missing, has no plan,
 * or names a plan that is not an own key of `tiers`.
 *
 * @param userId Identifier passed to `db.users.findById`.
 * @returns The tier matching the user's plan, or `tiers.free`.
 */
async function getTierForUser(userId: string): Promise<RateLimitTier> {
  const user = await db.users.findById(userId);
  const plan = user?.plan;

  // Own-property check: a plan called e.g. "toString" or "constructor" must
  // not resolve to a member inherited from Object.prototype.
  if (typeof plan === 'string' && Object.prototype.hasOwnProperty.call(tiers, plan)) {
    return tiers[plan];
  }

  return tiers.free;
}

/**
 * Builds an Express middleware that enforces per-minute and per-day quotas
 * taken from the caller's tier.
 *
 * Authenticated requests are counted under `<userId>:minute` and
 * `<userId>:day`. Requests without a user are counted per client address
 * under `anon:<ip>:minute` and `anon:<ip>:day`, using the free tier.
 *
 * @returns An async Express request handler that answers 429 when either
 *   quota is exhausted and calls `next()` otherwise.
 */
function tieredRateLimitMiddleware() {
  return async (req: Request, res: Response, next: NextFunction) => {
    try {
      const userId = req.user?.id;

      // Without this split every anonymous request would share the single
      // bucket "undefined:minute" and trigger a user lookup with `undefined`.
      const subject = userId ? `${userId}` : `anon:${req.ip}`;
      const tier = userId ? await getTierForUser(userId) : tiers.free;

      const minuteKey = `${subject}:minute`;
      const dayKey = `${subject}:day`;

      const [minuteAllowed, dayAllowed] = await Promise.all([
        limiter.isAllowed(minuteKey, tier.requestsPerMinute, 60000),
        limiter.isAllowed(dayKey, tier.requestsPerDay, 86400000),
      ]);

      if (!minuteAllowed.allowed || !dayAllowed.allowed) {
        return res.status(429).json({ error: 'Rate limit exceeded' });
      }

      next();
    } catch (err) {
      // Forward lookup/limiter failures to Express' error handling instead of
      // leaving the promise rejection unhandled.
      next(err);
    }
  };
}

Best Practices

Clear error messages: Tell users when they can retry
Rate limit headers: Include X-RateLimit-* headers
Gradual backoff: Increase limits for good actors
Multiple dimensions: Limit by IP, user, and endpoint
Monitoring: Alert on unusual patterns

Conclusion

Choose the right algorithm based on your needs: token bucket for APIs allowing bursts, sliding window for strict limits. Implement at multiple layers and provide clear feedback to API consumers.

Share this article