Rate Limiting Algorithms Explained

Rate limiting protects APIs from abuse and ensures fair resource usage. Different algorithms offer different trade-offs between accuracy, memory, and performance.

Rate Limiting Algorithms

Token Bucket:
- Tokens added at fixed rate
- Requests consume tokens
- Allows bursts up to bucket size

Sliding Window Log:
- Stores timestamp of each request
- Counts requests in sliding window
- Most accurate, highest memory

Sliding Window Counter:
- Combines fixed and sliding windows: weights the previous fixed window's count by how much of it still overlaps the sliding window
- Good accuracy with less memory
- Best overall choice

Fixed Window Counter:
- Counts requests per time window
- Simple but allows boundary bursts (up to twice the limit across a window boundary)
- Simplest implementation

Token Bucket Implementation

import Redis from 'ioredis';

/**
 * Redis-backed token bucket.
 *
 * Each bucket is a Redis hash with the fields `tokens` and `last_refill`.
 * A bucket that does not exist yet is treated as full. Refill and debit run
 * inside one Lua script so concurrent callers cannot interleave.
 */
class TokenBucket {
  /**
   * Atomic refill-and-consume script.
   *
   * KEYS[1] = bucket hash.
   * ARGV    = max tokens, refill rate (tokens/second), caller clock (ms),
   *           tokens requested.
   * Returns {allowed (1|0), tokens left, max tokens}.
   */
  private static readonly CONSUME_SCRIPT = `
      local key = KEYS[1]
      local max_tokens = tonumber(ARGV[1])
      local refill_rate = tonumber(ARGV[2])
      local now = tonumber(ARGV[3])
      local requested = tonumber(ARGV[4])

      local data = redis.call('HMGET', key, 'tokens', 'last_refill')
      local tokens = tonumber(data[1]) or max_tokens
      -- Clamp to now: a timestamp written by a caller whose clock runs ahead
      -- must never yield a negative elapsed time, which would remove tokens.
      local last_refill = math.min(tonumber(data[2]) or now, now)

      -- Credit whole tokens only, and advance last_refill only by the time
      -- those tokens cost. The leftover fraction stays banked, so callers
      -- polling faster than one token interval still get refilled.
      local elapsed_ms = now - last_refill
      local refill = math.floor(elapsed_ms * refill_rate / 1000)
      if refill > 0 then
        tokens = math.min(max_tokens, tokens + refill)
        last_refill = math.min(now, last_refill + math.ceil(refill * 1000 / refill_rate))
      end
      -- A full bucket has nothing to carry over; restart the clock.
      if tokens >= max_tokens then
        last_refill = now
      end

      local allowed = tokens >= requested
      if allowed then
        tokens = tokens - requested
      end

      redis.call('HMSET', key, 'tokens', tokens, 'last_refill', last_refill)
      -- After this long an untouched bucket would be full again, which is
      -- exactly what a missing key is read as.
      redis.call('EXPIRE', key, math.ceil(max_tokens / refill_rate) + 1)

      return {allowed and 1 or 0, tokens, max_tokens}
  `;

  /**
   * @param redis      Redis client used to run the script.
   * @param maxTokens  Bucket capacity, i.e. the largest possible burst.
   * @param refillRate Tokens added per second.
   * @param prefix     Prepended to every bucket key as `<prefix>:<key>`.
   */
  constructor(
    private redis: Redis,
    private maxTokens: number,
    private refillRate: number, // tokens per second
    private prefix = 'ratelimit'
  ) {}

  /**
   * Tries to take `tokens` tokens from the bucket identified by `key`.
   *
   * @param key    Caller identity (for example an IP address or user id).
   * @param tokens Number of tokens this request costs; defaults to 1.
   * @returns Whether the request is allowed, the tokens left, the bucket
   *          capacity, and `resetAt`: the epoch-millisecond time at which the
   *          bucket would be full again if nothing else is consumed.
   */
  async consume(key: string, tokens = 1): Promise<RateLimitResult> {
    const now = Date.now();
    const redisKey = `${this.prefix}:${key}`;

    const [allowedFlag, remaining, limit] = (await this.redis.eval(
      TokenBucket.CONSUME_SCRIPT,
      1,
      redisKey,
      this.maxTokens,
      this.refillRate,
      now,
      tokens
    )) as [number, number, number];

    const secondsUntilFull = Math.ceil((this.maxTokens - remaining) / this.refillRate);

    return {
      allowed: allowedFlag === 1,
      remaining,
      limit,
      resetAt: now + secondsUntilFull * 1000,
    };
  }
}

// Usage
const bucket = new TokenBucket(redis, 100, 10); // 100 tokens, refill 10/sec

// Per-client limiter: one bucket per remote IP, with the bucket state
// reported back in X-RateLimit-* response headers.
app.use(async (req, res, next) => {
  try {
    // req.ip may be undefined; such requests share a single bucket.
    const result = await bucket.consume(req.ip ?? 'unknown');

    res.setHeader('X-RateLimit-Limit', result.limit);
    res.setHeader('X-RateLimit-Remaining', result.remaining);
    res.setHeader('X-RateLimit-Reset', result.resetAt);

    if (!result.allowed) {
      res.status(429).json({ error: 'Rate limit exceeded' });
      return;
    }

    next();
  } catch (err) {
    // The promise returned by an async middleware is not observed by the
    // framework here, so a failed Redis call has to be forwarded explicitly
    // or the request would never receive a response.
    next(err);
  }
});

Sliding Window Counter

/**
 * Redis-backed sliding window counter.
 *
 * Each caller has one Redis hash whose fields are fixed-window numbers
 * (`floor(now / windowMs)`) and whose values are request counts. The rate
 * is estimated as the current window's count plus the previous window's
 * count scaled by the share of the current window that has not elapsed yet.
 */
class SlidingWindowCounter {
  /**
   * Atomic check-and-increment script.
   *
   * KEYS[1] = counter hash.
   * ARGV    = current window number, previous window number, caller clock
   *           (ms), window length (ms), limit.
   * Returns {allowed (1|0), limit - weighted count, limit}.
   */
  private static readonly CHECK_SCRIPT = `
      local key = KEYS[1]
      local current_window = ARGV[1]
      local previous_window = ARGV[2]
      local now = tonumber(ARGV[3])
      local window_ms = tonumber(ARGV[4])
      local limit = tonumber(ARGV[5])

      -- Get counts
      local current_count = tonumber(redis.call('HGET', key, current_window)) or 0
      local previous_count = tonumber(redis.call('HGET', key, previous_window)) or 0

      -- Calculate weighted count
      local window_start = math.floor(now / window_ms) * window_ms
      local elapsed = now - window_start
      local weight = (window_ms - elapsed) / window_ms
      local weighted_count = current_count + math.floor(previous_count * weight)

      local allowed = weighted_count < limit

      if allowed then
        -- Every allowed request refreshes the TTL below, so a busy key never
        -- expires on its own. Drop counters older than the previous window
        -- here, otherwise the hash gains one field per window forever.
        local oldest_needed = tonumber(previous_window)
        for _, field in ipairs(redis.call('HKEYS', key)) do
          local window_number = tonumber(field)
          if window_number and window_number < oldest_needed then
            redis.call('HDEL', key, field)
          end
        end

        redis.call('HINCRBY', key, current_window, 1)
        redis.call('EXPIRE', key, math.ceil(window_ms / 1000) * 2)
        weighted_count = weighted_count + 1
      end

      return {allowed and 1 or 0, limit - weighted_count, limit}
  `;

  /**
   * @param redis    Redis client used to run the script.
   * @param limit    Maximum weighted request count per window.
   * @param windowMs Window length in milliseconds.
   * @param prefix   Prepended to every counter key as `<prefix>:<key>`.
   */
  constructor(
    private redis: Redis,
    private limit: number,
    private windowMs: number,
    private prefix = 'ratelimit'
  ) {}

  /**
   * Records one request for `key` if it fits under the limit.
   *
   * @param key Caller identity (for example an IP address or user id).
   * @returns Whether the request is allowed, the remaining allowance
   *          (never negative), the limit, and `resetAt`: the
   *          epoch-millisecond start of the next fixed window.
   */
  async check(key: string): Promise<RateLimitResult> {
    const now = Date.now();
    const currentWindow = Math.floor(now / this.windowMs);
    const previousWindow = currentWindow - 1;

    const redisKey = `${this.prefix}:${key}`;

    const [allowedFlag, remaining, limit] = (await this.redis.eval(
      SlidingWindowCounter.CHECK_SCRIPT,
      1,
      redisKey,
      currentWindow.toString(),
      previousWindow.toString(),
      now,
      this.windowMs,
      this.limit
    )) as [number, number, number];

    return {
      allowed: allowedFlag === 1,
      // The script reports limit - count, which is negative once over limit.
      remaining: Math.max(0, remaining),
      limit,
      resetAt: (currentWindow + 1) * this.windowMs,
    };
  }
}

// Usage: allow at most 100 requests per 60-second window
const limiter = new SlidingWindowCounter(redis, 100, 60 * 1000);

Fixed Window Counter

/**
 * Redis-backed fixed window counter.
 *
 * Every (caller, window) pair has its own Redis key
 * `<prefix>:<key>:<window number>`, incremented once per request,
 * including requests that end up rejected.
 */
class FixedWindowCounter {
  /**
   * Increments the counter and, when this call created it, attaches the TTL
   * in the same atomic step. Issuing INCR and EXPIRE as two separate
   * commands can leave a counter without a TTL if the caller fails between
   * them.
   *
   * KEYS[1] = counter key, ARGV[1] = TTL in seconds. Returns the new count.
   */
  private static readonly INCREMENT_SCRIPT = `
      local current = redis.call('INCR', KEYS[1])
      if current == 1 then
        redis.call('EXPIRE', KEYS[1], ARGV[1])
      end
      return current
  `;

  /**
   * @param redis    Redis client used to run the script.
   * @param limit    Maximum number of requests per window.
   * @param windowMs Window length in milliseconds.
   * @param prefix   First segment of every counter key.
   */
  constructor(
    private redis: Redis,
    private limit: number,
    private windowMs: number,
    private prefix = 'ratelimit'
  ) {}

  /**
   * Counts one request for `key` in the current window.
   *
   * @param key Caller identity (for example an IP address or user id).
   * @returns Whether the request is within the limit, the remaining
   *          allowance (never negative), the limit, and `resetAt`: the
   *          epoch-millisecond start of the next window.
   */
  async check(key: string): Promise<RateLimitResult> {
    const window = Math.floor(Date.now() / this.windowMs);
    const redisKey = `${this.prefix}:${key}:${window}`;
    const ttlSeconds = Math.ceil(this.windowMs / 1000);

    const current = Number(
      await this.redis.eval(FixedWindowCounter.INCREMENT_SCRIPT, 1, redisKey, ttlSeconds)
    );

    return {
      allowed: current <= this.limit,
      remaining: Math.max(0, this.limit - current),
      limit: this.limit,
      resetAt: (window + 1) * this.windowMs,
    };
  }
}

Tiered Rate Limiting

/** Request quotas that apply to one subscription tier. */
interface RateLimitTier {
  /** Tier identifier; the same string is the tier's key in `tiers`. */
  name: string;
  /** Requests allowed per minute. */
  requestsPerMinute: number;
  /** Requests allowed per hour. */
  requestsPerHour: number;
  /** Requests allowed per day. */
  requestsPerDay: number;
}

/** Quota table, one entry per tier, in ascending order of allowance. */
const tierDefinitions: RateLimitTier[] = [
  { name: 'free', requestsPerMinute: 10, requestsPerHour: 100, requestsPerDay: 1000 },
  { name: 'basic', requestsPerMinute: 60, requestsPerHour: 1000, requestsPerDay: 10000 },
  { name: 'pro', requestsPerMinute: 300, requestsPerHour: 5000, requestsPerDay: 50000 },
];

/** Tier lookup keyed by tier name. */
const tiers: Record<string, RateLimitTier> = Object.fromEntries(
  tierDefinitions.map((tier): [string, RateLimitTier] => [tier.name, tier])
);

/**
 * Applies a tier's per-minute, per-hour and per-day quotas to each caller.
 *
 * One SlidingWindowCounter per quota is created lazily for every tier and
 * cached by tier name.
 */
class TieredRateLimiter {
  private limiters: Map<string, SlidingWindowCounter[]> = new Map();

  constructor(private redis: Redis) {}

  /**
   * Returns the cached counters for `tier`, creating them on first use.
   * They are ordered from shortest to longest window; `check` relies on
   * that order.
   */
  private getLimiters(tier: RateLimitTier): SlidingWindowCounter[] {
    let limiters = this.limiters.get(tier.name);
    if (!limiters) {
      limiters = [
        new SlidingWindowCounter(this.redis, tier.requestsPerMinute, 60000, `rl:${tier.name}:min`),
        new SlidingWindowCounter(this.redis, tier.requestsPerHour, 3600000, `rl:${tier.name}:hour`),
        new SlidingWindowCounter(this.redis, tier.requestsPerDay, 86400000, `rl:${tier.name}:day`),
      ];
      this.limiters.set(tier.name, limiters);
    }
    return limiters;
  }

  /**
   * Checks `key` against every quota of the named tier.
   *
   * @param key      Caller identity.
   * @param tierName Name of the caller's tier; anything that is not a
   *                 configured tier falls back to `free`.
   * @returns The result of the first quota that rejects the request, or,
   *          when all quotas accept it, the result with the smallest
   *          remaining/limit ratio.
   */
  async check(key: string, tierName: string): Promise<RateLimitResult> {
    // Own-property lookup only: a plain index would also resolve inherited
    // keys such as "constructor" and yield a bogus tier.
    const tier =
      (Object.prototype.hasOwnProperty.call(tiers, tierName) && tiers[tierName]) || tiers.free;

    // Each counter's check() records the request when it accepts it, so the
    // quotas are consulted one at a time, shortest window first, stopping at
    // the first rejection. A request refused by the per-minute quota then
    // uses up no hourly or daily allowance. A rejection by a longer window
    // still leaves the shorter windows incremented.
    const results: RateLimitResult[] = [];
    for (const limiter of this.getLimiters(tier)) {
      const result = await limiter.check(key);
      if (!result.allowed) {
        return result;
      }
      results.push(result);
    }

    // Return the limit closest to being exceeded
    return results.reduce((min, r) =>
      r.remaining / r.limit < min.remaining / min.limit ? r : min
    );
  }
}

Distributed Rate Limiting

// Cluster-aware rate limiting with Redis
/**
 * Fixed-window limiter that batches writes to Redis.
 *
 * Each instance counts hits locally and pushes them to a shared Redis
 * counter (`ratelimit:<key>:<window>`) on every 10th pending hit or when
 * more than `syncInterval` milliseconds have passed since the last push for
 * that window. Decisions use the shared count plus this instance's hits that
 * have not been pushed yet, so the result is approximate: hits still pending
 * on other instances are not visible.
 */
class DistributedRateLimiter {
  /** Pending local hits that force a push to Redis. */
  private static readonly SYNC_BATCH_SIZE = 10;

  /**
   * Adds ARGV[1] to the counter KEYS[1] and, if the key has no TTL yet,
   * gives it one of ARGV[2] milliseconds in the same atomic step. Returns
   * the new total.
   */
  private static readonly SYNC_SCRIPT = `
      local total = redis.call('INCRBY', KEYS[1], ARGV[1])
      if redis.call('PTTL', KEYS[1]) < 0 then
        redis.call('PEXPIRE', KEYS[1], ARGV[2])
      end
      return total
  `;

  /** Hits per `<key>:<window>` not yet pushed to Redis. */
  private localCounts = new Map<string, number>();
  /** Time of the last push per `<key>:<window>` (epoch ms). */
  private lastSync = new Map<string, number>();
  /** End of the window per `<key>:<window>` (epoch ms); drives pruning. */
  private windowEnds = new Map<string, number>();
  /** Time of the last pruning pass (epoch ms). */
  private lastPrune = 0;

  /**
   * @param redis        Redis client holding the shared counters.
   * @param syncInterval Maximum age in milliseconds of unsynced local hits
   *                     before the next request pushes them.
   */
  constructor(
    private redis: Redis,
    private syncInterval = 1000
  ) {}

  /**
   * Counts one request for `key` and decides whether it is within `limit`
   * for the current window of `windowMs` milliseconds.
   *
   * @returns Whether the request is allowed (the request itself is included
   *          in the count), the remaining allowance (never negative), the
   *          limit, and `resetAt`: the epoch-millisecond start of the next
   *          window.
   */
  async checkWithSync(
    key: string,
    limit: number,
    windowMs: number
  ): Promise<RateLimitResult> {
    const now = Date.now();
    const window = Math.floor(now / windowMs);
    const localKey = `${key}:${window}`;
    const resetAt = (window + 1) * windowMs;

    this.pruneFinishedWindows(now);
    this.windowEnds.set(localKey, resetAt);

    // Local counter for this instance
    const pending = this.incrementLocal(localKey);

    // Sync to Redis periodically. The push already returns the new shared
    // total, so a separate read is only needed when nothing was pushed.
    const dueForSync =
      pending % DistributedRateLimiter.SYNC_BATCH_SIZE === 0 || this.shouldSync(localKey);
    const globalCount = dueForSync
      ? await this.syncToRedis(key, window, pending, windowMs)
      : await this.getGlobalCount(key, window);

    // Hits that are still only known locally count as well; otherwise this
    // instance could exceed the limit by a whole batch between pushes.
    const used = globalCount + (this.localCounts.get(localKey) ?? 0);

    return {
      allowed: used <= limit,
      remaining: Math.max(0, limit - used),
      limit,
      resetAt,
    };
  }

  /** Adds one pending hit for `key` and returns the new pending total. */
  private incrementLocal(key: string): number {
    const count = (this.localCounts.get(key) ?? 0) + 1;
    this.localCounts.set(key, count);
    return count;
  }

  /** True when `key` was last pushed more than `syncInterval` ms ago (or never). */
  private shouldSync(key: string): boolean {
    const last = this.lastSync.get(key) ?? 0;
    return Date.now() - last > this.syncInterval;
  }

  /**
   * Pushes `count` pending hits to the shared counter and returns the new
   * shared total. The pending count is claimed before the network call so
   * hits recorded while the call is in flight are neither lost nor pushed
   * twice; if the call fails the claimed hits are put back.
   */
  private async syncToRedis(
    key: string,
    window: number,
    count: number,
    windowMs: number
  ): Promise<number> {
    const localKey = `${key}:${window}`;
    const redisKey = `ratelimit:${localKey}`;

    this.localCounts.delete(localKey);
    this.lastSync.set(localKey, Date.now());

    try {
      const total = await this.redis.eval(
        DistributedRateLimiter.SYNC_SCRIPT,
        1,
        redisKey,
        count,
        // A key created at any point inside the window then outlives it.
        Math.max(1, Math.ceil(windowMs))
      );
      return Number(total);
    } catch (err) {
      // Restore the hits unless the window was pruned in the meantime.
      if (this.windowEnds.has(localKey)) {
        this.localCounts.set(localKey, (this.localCounts.get(localKey) ?? 0) + count);
      }
      throw err;
    }
  }

  /** Reads the shared counter for `key` in `window`; a missing key is 0. */
  private async getGlobalCount(key: string, window: number): Promise<number> {
    const redisKey = `ratelimit:${key}:${window}`;
    const count = await this.redis.get(redisKey);
    return parseInt(count || '0', 10);
  }

  /**
   * Forgets local state of windows that have ended, at most once per
   * `syncInterval`, so the maps do not grow with every window that passes.
   */
  private pruneFinishedWindows(now: number): void {
    if (now - this.lastPrune < this.syncInterval) {
      return;
    }
    this.lastPrune = now;

    for (const [localKey, endsAt] of this.windowEnds) {
      if (endsAt <= now) {
        this.windowEnds.delete(localKey);
        this.localCounts.delete(localKey);
        this.lastSync.delete(localKey);
      }
    }
  }
}

Middleware Integration

import rateLimit from 'express-rate-limit';
import RedisStore from 'rate-limit-redis';

// Express middleware with Redis store
const apiWindowMs = 60 * 1000;

// General API limiter: 100 requests per minute, keyed by the authenticated
// user id when there is one and by client IP otherwise. The health check
// path is exempt.
const apiLimiter = rateLimit({
  store: new RedisStore({
    client: redis,
    prefix: 'rl:api:',
  }),
  windowMs: apiWindowMs,
  max: 100,
  standardHeaders: true,
  legacyHeaders: false,
  keyGenerator: (req) => req.user?.id || req.ip,
  handler: (req, res) => {
    // resetTime is the absolute moment the window resets. Clients need the
    // number of seconds to wait, so subtract the current time instead of
    // converting the timestamp itself. If the store does not report a reset
    // time, fall back to one full window.
    const resetTime = req.rateLimit?.resetTime;
    const msUntilReset = resetTime
      ? new Date(resetTime).getTime() - Date.now()
      : apiWindowMs;

    res.status(429).json({
      error: 'Too many requests',
      retryAfter: Math.max(0, Math.ceil(msUntilReset / 1000)),
    });
  },
  skip: (req) => req.path === '/health',
});

// Stricter, endpoint-specific limit for logins: at most 5 counted attempts
// per 15-minute window. With skipSuccessfulRequests enabled,
// express-rate-limit leaves successful responses out of the count.
// No `store` is given, so the library's default store is used.
const authLimiter = rateLimit({
  max: 5,
  windowMs: 15 * 60 * 1000, // 15 minutes
  skipSuccessfulRequests: true,
});

// The general limiter covers everything under /api/; the login route is
// additionally guarded by the stricter limiter.
app.use('/api/', apiLimiter);
app.use('/api/auth/login', authLimiter);

Best Practices

Algorithm Selection:
✓ Token bucket for bursty traffic
✓ Sliding window for accuracy
✓ Fixed window for simplicity

Implementation:
✓ Use Redis for distributed systems
✓ Return rate limit headers
✓ Provide clear error messages
✓ Allow for bursts when appropriate

Operations:
✓ Monitor rate limit hits
✓ Alert on sustained limit hits
✓ Provide upgrade paths
✓ Document limits clearly

Choose the right rate limiting algorithm based on your needs. Token bucket allows bursts, sliding window is most accurate, and fixed window is simplest. Use Redis for distributed systems and always return informative headers to clients.