Database Design Patterns for Applications

Good database design is the foundation of a scalable application. Here are patterns that solve common problems.

Normalization vs Denormalization

-- Normalized schema: favours data integrity and keeps redundancy low.
-- Good fit for: OLTP workloads and data that is updated frequently.

-- Accounts. email is mandatory and must be unique across rows.
CREATE TABLE users (
  id    UUID,
  email VARCHAR(255) NOT NULL,
  name  VARCHAR(100) NOT NULL,
  PRIMARY KEY (id),
  UNIQUE (email)
);

-- Orders. user_id points at users.id; created_at defaults to insert time.
CREATE TABLE orders (
  id         UUID,
  user_id    UUID,
  total      DECIMAL(10,2) NOT NULL,
  created_at TIMESTAMP DEFAULT NOW(),
  PRIMARY KEY (id),
  FOREIGN KEY (user_id) REFERENCES users (id)
);

-- Order lines. product_id references products(id), so a products table
-- must already exist when this statement runs.
CREATE TABLE order_items (
  id         UUID,
  order_id   UUID,
  product_id UUID,
  quantity   INT NOT NULL,
  price      DECIMAL(10,2) NOT NULL,
  PRIMARY KEY (id),
  FOREIGN KEY (order_id) REFERENCES orders (id),
  FOREIGN KEY (product_id) REFERENCES products (id)
);

-- Denormalized table: trades data redundancy for faster reads.
-- Good fit for: read-heavy workloads, analytics, caching.

-- No foreign keys are declared here; user_id is a plain UUID column.
CREATE TABLE order_summary (
  id         UUID,
  user_id    UUID,
  user_name  VARCHAR(100),   -- denormalized (presumably copied from users.name)
  user_email VARCHAR(255),   -- denormalized (presumably copied from users.email)
  total      DECIMAL(10,2),
  item_count INT,            -- computed value stored alongside the order
  created_at TIMESTAMP,
  PRIMARY KEY (id)
);

Soft Deletes

-- Soft delete with timestamp: rows are never physically removed; a non-NULL
-- deleted_at marks a row as deleted.
CREATE TABLE posts (
  id UUID PRIMARY KEY,
  title VARCHAR(255) NOT NULL,
  content TEXT,
  created_at TIMESTAMP DEFAULT NOW(),
  updated_at TIMESTAMP DEFAULT NOW(),
  deleted_at TIMESTAMP NULL      -- NULL = not deleted
);

-- Query active records
SELECT id, title, content, created_at, updated_at, deleted_at
FROM posts
WHERE deleted_at IS NULL;

-- Query deleted records
SELECT id, title, content, created_at, updated_at, deleted_at
FROM posts
WHERE deleted_at IS NOT NULL;

-- Soft delete.
-- The deleted_at guard makes the statement idempotent: running it against a
-- post that is already deleted keeps the original deletion time instead of
-- overwriting it with a newer one.
UPDATE posts
SET deleted_at = NOW()
WHERE id = ?
  AND deleted_at IS NULL;

-- Restore.
-- Only touches rows that are actually deleted, so restoring an active post
-- is a no-op rather than a redundant write.
UPDATE posts
SET deleted_at = NULL
WHERE id = ?
  AND deleted_at IS NOT NULL;

// Prisma implementation
// (Prisma schema files use // for comments, not the SQL -- marker.)
model Post {
  id        String    @id @default(cuid())
  title     String
  // Optional: null means the post has not been soft-deleted.
  deletedAt DateTime?

  // Index on the column used to separate active from deleted posts.
  @@index([deletedAt])
}

// Middleware for automatic filtering: hides soft-deleted posts from
// Post.findMany unless the caller filters on deletedAt explicitly.
prisma.$use(async (params, next) => {
  if (params.model === 'Post' && params.action === 'findMany') {
    // findMany() called with no arguments leaves params.args undefined;
    // assigning params.args.where would then throw a TypeError.
    params.args = params.args || {};

    const where = params.args.where || {};
    // Only add the default filter when the caller did not ask for a specific
    // deletedAt value, so deleted posts can still be listed on request.
    if (where.deletedAt === undefined) {
      params.args.where = { ...where, deletedAt: null };
    }
  }
  return next(params);
});

Polymorphic Associations

-- Option 1: Single Table Inheritance (STI)
-- Every notification kind shares this one table. The type column names the
-- kind, and the kind-specific columns are nullable.
CREATE TABLE notifications (
  id            UUID,
  type          VARCHAR(50) NOT NULL,   -- 'email', 'sms', 'push'
  user_id       UUID,
  message       TEXT NOT NULL,
  email_subject VARCHAR(255),           -- email-specific
  phone_number  VARCHAR(20),            -- SMS-specific
  device_token  VARCHAR(255),           -- push-specific
  created_at    TIMESTAMP DEFAULT NOW(),
  PRIMARY KEY (id),
  FOREIGN KEY (user_id) REFERENCES users (id)
);

-- Option 2: Class Table Inheritance
-- Shared columns live in the base table; each kind gets its own table whose
-- primary key is also a foreign key to the base row.
CREATE TABLE notifications (
  id         UUID,
  user_id    UUID,
  message    TEXT NOT NULL,
  created_at TIMESTAMP DEFAULT NOW(),
  PRIMARY KEY (id),
  FOREIGN KEY (user_id) REFERENCES users (id)
);

-- Email-only columns, keyed by the base notification id.
CREATE TABLE email_notifications (
  id              UUID,
  subject         VARCHAR(255),
  recipient_email VARCHAR(255),
  PRIMARY KEY (id),
  FOREIGN KEY (id) REFERENCES notifications (id)
);

-- SMS-only columns, keyed by the base notification id.
CREATE TABLE sms_notifications (
  id           UUID,
  phone_number VARCHAR(20),
  PRIMARY KEY (id),
  FOREIGN KEY (id) REFERENCES notifications (id)
);

-- Option 3: Polymorphic with reference
-- A (commentable_type, commentable_id) pair identifies the target row.
-- No foreign key is declared on commentable_id, so the database does not
-- check that the target exists.
CREATE TABLE comments (
  id               UUID,
  content          TEXT NOT NULL,
  commentable_type VARCHAR(50) NOT NULL,  -- 'Post', 'Photo', 'Video'
  commentable_id   UUID NOT NULL,
  created_at       TIMESTAMP DEFAULT NOW(),
  PRIMARY KEY (id)
);

-- Index for polymorphic lookups (type first, then id)
CREATE INDEX idx_comments_polymorphic
  ON comments (commentable_type, commentable_id);

Temporal Data (History)

-- Audit trail with triggers
-- Live table holding the current state of each user.
CREATE TABLE users (
  id         UUID,
  email      VARCHAR(255),
  name       VARCHAR(100),
  updated_at TIMESTAMP DEFAULT NOW(),
  PRIMARY KEY (id)
);

-- History table: one row per recorded change to a users row.
-- user_id carries no foreign key, so history rows can outlive the user.
CREATE TABLE users_history (
  id         UUID DEFAULT gen_random_uuid(),
  user_id    UUID NOT NULL,
  email      VARCHAR(255),
  name       VARCHAR(100),
  changed_at TIMESTAMP DEFAULT NOW(),
  changed_by UUID,
  operation  VARCHAR(10),  -- 'INSERT', 'UPDATE', 'DELETE'
  PRIMARY KEY (id)
);

-- Trigger function
-- Writes one users_history row per affected users row. INSERT and UPDATE
-- record the NEW values with TG_OP as the operation; DELETE records the OLD
-- values. id and changed_at come from column defaults, and changed_by is
-- not set here.
CREATE OR REPLACE FUNCTION audit_users()
RETURNS TRIGGER
LANGUAGE plpgsql
AS $audit$
BEGIN
  IF TG_OP <> 'DELETE' THEN
    INSERT INTO users_history (user_id, email, name, operation)
    VALUES (NEW.id, NEW.email, NEW.name, TG_OP);
    RETURN NEW;
  END IF;

  -- Only DELETE reaches this point; NEW is not available, so use OLD.
  INSERT INTO users_history (user_id, email, name, operation)
  VALUES (OLD.id, OLD.email, OLD.name, 'DELETE');
  RETURN OLD;
END;
$audit$;

-- Fire the audit function once per row, after the change has been applied.
CREATE TRIGGER users_audit_trigger
  AFTER INSERT OR UPDATE OR DELETE
  ON users
  FOR EACH ROW
  EXECUTE FUNCTION audit_users();

-- Bitemporal: Track valid time AND transaction time
CREATE TABLE prices (
  id            UUID,
  product_id    UUID,
  amount        DECIMAL(10,2),
  -- Presumably the valid-time range; valid_to is nullable.
  valid_from    DATE NOT NULL,
  valid_to      DATE,
  -- Presumably the transaction-time range; recorded_at defaults to insert time.
  recorded_at   TIMESTAMP DEFAULT NOW(),
  superseded_at TIMESTAMP,
  PRIMARY KEY (id)
);

Tree Structures

-- Adjacency List (simple, recursive queries needed)
-- Each row stores a reference to its parent row; parent_id is nullable.
CREATE TABLE categories (
  id        UUID,
  name      VARCHAR(100),
  parent_id UUID,
  PRIMARY KEY (id),
  FOREIGN KEY (parent_id) REFERENCES categories (id)
);

-- Get descendants (PostgreSQL recursive CTE)
-- The anchor member selects the category bound to ?, so that starting row is
-- part of the result together with everything below it.
WITH RECURSIVE subtree AS (
  SELECT root.id, root.name, root.parent_id
  FROM categories AS root
  WHERE root.id = ?
  UNION ALL
  SELECT child.id, child.name, child.parent_id
  FROM categories AS child
  INNER JOIN subtree AS node
    ON child.parent_id = node.id
)
SELECT id, name, parent_id
FROM subtree;

-- Materialized Path (fast reads)
-- Each row stores its full path as '/'-separated segments.
CREATE TABLE categories (
  id UUID PRIMARY KEY,
  name VARCHAR(100),
  path VARCHAR(1000)  -- '1/5/12/45'
);

-- Get all descendants of the node whose path is '1/5'.
-- The '/' before '%' keeps unrelated paths such as '1/50' out of the result.
SELECT id, name, path
FROM categories
WHERE path LIKE '1/5/%';

-- Get ancestors of the node whose path is '1/5/12/45', root first.
-- The '/' before '%' forces the match to end on a segment boundary. With a
-- bare '%' a row whose path is '1/5/1' would be reported as an ancestor,
-- because '1/5/12/45' starts with that string.
-- The node itself is not returned; add OR path = '1/5/12/45' to include it.
SELECT id, name, path
FROM categories
WHERE '1/5/12/45' LIKE path || '/%'
ORDER BY LENGTH(path);

-- Nested Sets (fast subtree queries, slow updates)
-- Each node stores a left/right bound; a descendant's bounds lie strictly
-- inside its ancestor's bounds.
CREATE TABLE categories (
  id UUID PRIMARY KEY,
  name VARCHAR(100),
  lft INT NOT NULL,
  rgt INT NOT NULL
);

-- Get all descendants of the category whose id is bound to ?.
-- The parent row has to be joined in explicitly: a bare reference to
-- parent.lft / parent.rgt has no table behind it and is rejected.
SELECT child.id, child.name, child.lft, child.rgt
FROM categories AS parent
INNER JOIN categories AS child
  ON child.lft > parent.lft
 AND child.rgt < parent.rgt
WHERE parent.id = ?;

Many-to-Many with Metadata

-- Join table with additional data
-- The composite primary key allows each (product, category) pair once; the
-- remaining columns describe the link itself.
CREATE TABLE product_categories (
  product_id  UUID,
  category_id UUID,
  is_primary  BOOLEAN DEFAULT FALSE,
  sort_order  INT DEFAULT 0,
  added_at    TIMESTAMP DEFAULT NOW(),
  added_by    UUID,
  PRIMARY KEY (product_id, category_id),
  FOREIGN KEY (product_id) REFERENCES products (id),
  FOREIGN KEY (category_id) REFERENCES categories (id),
  FOREIGN KEY (added_by) REFERENCES users (id)
);

-- Ensure only one primary category per product: the unique index covers
-- only the rows flagged as primary, so other rows are unrestricted.
CREATE UNIQUE INDEX idx_primary_category
  ON product_categories (product_id)
  WHERE is_primary = TRUE;

Tagging Pattern

-- Tag dictionary: both the display name and the slug must be unique.
CREATE TABLE tags (
  id   UUID,
  name VARCHAR(100) NOT NULL,
  slug VARCHAR(100) NOT NULL,
  PRIMARY KEY (id),
  UNIQUE (name),
  UNIQUE (slug)
);

-- Link table between posts and tags. Deleting a post or a tag removes its
-- link rows, and the composite key allows each pair only once.
CREATE TABLE post_tags (
  post_id UUID,
  tag_id  UUID,
  PRIMARY KEY (post_id, tag_id),
  FOREIGN KEY (post_id) REFERENCES posts (id) ON DELETE CASCADE,
  FOREIGN KEY (tag_id) REFERENCES tags (id) ON DELETE CASCADE
);

-- Find posts with ALL specified tags
-- The constant in HAVING must equal the number of tag ids bound in the IN
-- list (three here). A (post_id, tag_id) pair can occur only once, so the
-- count reaches 3 only when every listed tag is attached.
SELECT p.*
FROM posts AS p
WHERE p.id IN (
  SELECT pt.post_id
  FROM post_tags AS pt
  WHERE pt.tag_id IN (?, ?, ?)
  GROUP BY pt.post_id
  HAVING COUNT(*) = 3
);

-- Find posts with ANY specified tags
-- EXISTS yields each post at most once, however many of the tags match.
SELECT p.*
FROM posts AS p
WHERE EXISTS (
  SELECT 1
  FROM post_tags AS pt
  WHERE pt.post_id = p.id
    AND pt.tag_id IN (?, ?, ?)
);

-- PostgreSQL: Use array for simpler queries
-- Tags are stored inline on the post as a text array (empty by default)
-- instead of in a separate link table.
CREATE TABLE posts (
  id    UUID,
  title VARCHAR(255),
  tags  TEXT[] DEFAULT '{}',
  PRIMARY KEY (id)
);

-- Posts carrying the single tag 'javascript'.
SELECT id, title, tags
FROM posts
WHERE 'javascript' = ANY (tags);

-- Posts whose tags contain both 'javascript' and 'react'.
SELECT id, title, tags
FROM posts
WHERE tags @> ARRAY['javascript', 'react'];

JSON/JSONB Columns

-- Flexible schema for metadata: fixed columns for the core fields plus a
-- JSONB document (empty object by default) for everything else.
CREATE TABLE products (
  id         UUID,
  name       VARCHAR(255) NOT NULL,
  price      DECIMAL(10,2) NOT NULL,
  attributes JSONB DEFAULT '{}',
  PRIMARY KEY (id)
);

-- Index for JSON queries
CREATE INDEX idx_products_attributes
  ON products USING GIN (attributes);

-- Query JSON

-- Rows whose "color" value, extracted as text, equals 'red'.
-- NOTE(review): the default GIN operator class is documented for @> and ?,
-- not for ->> comparisons; confirm with EXPLAIN whether this predicate
-- needs an expression index.
SELECT id, name, price, attributes
FROM products
WHERE attributes ->> 'color' = 'red';

-- Rows whose document contains the pair "size": "large".
SELECT id, name, price, attributes
FROM products
WHERE attributes @> '{"size": "large"}';

-- Rows whose document has a top-level "warranty" key.
-- NOTE(review): this ? is the jsonb key-exists operator, not a bind
-- placeholder; drivers that use ? for parameters may need it escaped.
SELECT id, name, price, attributes
FROM products
WHERE attributes ? 'warranty';

-- Update JSON: merge a key into the existing document.
-- attributes has a default but no NOT NULL constraint, and NULL || jsonb
-- yields NULL. COALESCE keeps the merge from being silently lost on rows
-- whose attributes is NULL.
UPDATE products
SET attributes = COALESCE(attributes, '{}'::jsonb) || '{"featured": true}'::jsonb
WHERE id = ?;

-- Remove key
-- Removing a key from a NULL document leaves it NULL, so no guard is needed.
UPDATE products
SET attributes = attributes - 'temp_field'
WHERE id = ?;

Best Practices

Design:
✓ Normalize first, denormalize when needed
✓ Use appropriate data types
✓ Add indexes for query patterns
✓ Plan for growth

Integrity:
✓ Use foreign keys
✓ Add constraints (NOT NULL, CHECK)
✓ Consider soft deletes for audit
✓ Use transactions

Performance:
✓ Index foreign keys
✓ Avoid over-indexing
✓ Partition large tables
✓ Monitor query plans

Choose database patterns based on your access patterns. Normalize for data integrity, denormalize for read performance. Use appropriate patterns for hierarchies, temporal data, and flexible schemas. Always index based on actual query patterns and monitor performance.