mirror of
https://github.com/harivansh-afk/url-shortner.git
synced 2026-04-15 05:02:12 +00:00
nginx load balancer and api
This commit is contained in:
parent
1a980a7a70
commit
3469c7c83e
5 changed files with 502 additions and 0 deletions
0
app/__init__.py
Normal file
0
app/__init__.py
Normal file
52
app/encoding.py
Normal file
52
app/encoding.py
Normal file
|
|
@ -0,0 +1,52 @@
|
|||
"""
|
||||
Base62 encoding for short URL generation.
|
||||
|
||||
- Uses 0-9, A-Z, a-z (62 characters)
|
||||
- URL-safe (no special characters)
|
||||
- More compact than hex (base16) or base64
|
||||
|
||||
Length vs Capacity:
|
||||
- 6 chars: 62^6 = 56.8 billion unique URLs
|
||||
- 7 chars: 62^7 = 3.5 trillion unique URLs
|
||||
"""
|
||||
|
||||
CHARSET = "0123456789ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz"
|
||||
BASE = len(CHARSET) # 62
|
||||
|
||||
|
||||
def base62_encode(num: int) -> str:
|
||||
"""
|
||||
Encode an integer to a base62 string.
|
||||
"""
|
||||
if num < 0:
|
||||
raise ValueError("Cannot encode negative numbers")
|
||||
if num == 0:
|
||||
return CHARSET[0]
|
||||
|
||||
result = []
|
||||
while num:
|
||||
result.append(CHARSET[num % BASE])
|
||||
num //= BASE
|
||||
|
||||
return "".join(reversed(result))
|
||||
|
||||
|
||||
def base62_decode(encoded: str) -> int:
|
||||
"""
|
||||
Decode a base62 string back to an integer.
|
||||
"""
|
||||
if not encoded:
|
||||
raise ValueError("Cannot decode empty string")
|
||||
|
||||
num = 0
|
||||
for char in encoded:
|
||||
if char not in CHARSET:
|
||||
raise ValueError(f"Invalid character: {char}")
|
||||
num = num * BASE + CHARSET.index(char)
|
||||
|
||||
return num
|
||||
|
||||
|
||||
def pad_to_length(encoded: str, length: int = 7) -> str:
|
||||
"""Pad encoded string to minimum length with leading zeros."""
|
||||
return encoded.zfill(length)[-length:] if len(encoded) < length else encoded
|
||||
253
app/main.py
Normal file
253
app/main.py
Normal file
|
|
@ -0,0 +1,253 @@
|
|||
"""
|
||||
URL Shortener API
|
||||
|
||||
Endpoints:
|
||||
- POST /shorten - Create a short URL
|
||||
- GET /{code} - Redirect to original URL
|
||||
- GET /stats/{code} - Get click statistics
|
||||
"""
|
||||
|
||||
import os
|
||||
import asyncio
|
||||
from contextlib import asynccontextmanager
|
||||
from urllib.parse import urlparse
|
||||
|
||||
import asyncpg
|
||||
import redis.asyncio as redis
|
||||
from fastapi import FastAPI, HTTPException, Request
|
||||
from fastapi.responses import RedirectResponse
|
||||
from pydantic import BaseModel, HttpUrl
|
||||
|
||||
from app.encoding import base62_encode
|
||||
from app.snowflake import init_generator, generate_id
|
||||
|
||||
|
||||
# Configuration from environment (defaults are for local development only).
DATABASE_URL = os.getenv("DATABASE_URL", "postgresql://urlshortner:localdev@localhost:5432/urlshortner")
REDIS_URL = os.getenv("REDIS_URL", "redis://localhost:6379")
# Snowflake machine/worker ID for this instance; must be unique per API
# replica (0-1023) or generated IDs can collide.
MACHINE_ID = int(os.getenv("MACHINE_ID", "1"))
# Public base used when building the short URLs returned to clients.
BASE_URL = os.getenv("BASE_URL", "http://localhost")

# Cache TTL in seconds (1 hour) for short_code -> original_url Redis entries.
CACHE_TTL = 3600

# Global connections; created and torn down by the lifespan handler.
db_pool: asyncpg.Pool | None = None
redis_client: redis.Redis | None = None
|
||||
|
||||
|
||||
@asynccontextmanager
async def lifespan(app: FastAPI):
    """Manage database and Redis connections.

    FastAPI lifespan hook: code before `yield` runs once at startup,
    code after it runs once at shutdown.
    """
    global db_pool, redis_client

    # Startup: seed the Snowflake ID generator, then open shared clients.
    init_generator(MACHINE_ID)
    db_pool = await asyncpg.create_pool(DATABASE_URL, min_size=5, max_size=20)
    redis_client = redis.from_url(REDIS_URL, decode_responses=True)

    print(f"[Startup] Connected to PostgreSQL and Redis. Machine ID: {MACHINE_ID}")

    yield

    # Shutdown: release pooled connections.
    if db_pool:
        await db_pool.close()
    if redis_client:
        # NOTE(review): redis-py 5.x deprecates Redis.close() in favor of
        # aclose() — confirm against the pinned client version.
        await redis_client.close()

    print("[Shutdown] Connections closed.")
|
||||
|
||||
|
||||
# ASGI application; `lifespan` wires DB/Redis setup and teardown around it.
app = FastAPI(
    title="URL Shortener",
    description="Distributed URL shortening service",
    version="1.0.0",
    lifespan=lifespan,
)
|
||||
|
||||
|
||||
# Request/Response models
|
||||
class ShortenRequest(BaseModel):
    """Request body for POST /shorten."""

    url: HttpUrl  # target URL; pydantic validates scheme and host
    custom_code: str | None = None  # Optional custom short code (vanity URL)
|
||||
|
||||
|
||||
class ShortenResponse(BaseModel):
    """Response body for POST /shorten."""

    short_url: str  # full shortened URL: f"{BASE_URL}/{short_code}"
    short_code: str  # the base62 or custom code on its own
    original_url: str  # the URL that was shortened
|
||||
|
||||
|
||||
class StatsResponse(BaseModel):
    """Response body for GET /stats/{code}."""

    short_code: str
    original_url: str
    click_count: int  # total redirects recorded for this code
    created_at: str  # ISO-8601 string from the urls table timestamp
|
||||
|
||||
|
||||
# Endpoints
|
||||
@app.get("/health")
|
||||
async def health_check():
|
||||
"""Health check for load balancer."""
|
||||
return {"status": "healthy", "machine_id": MACHINE_ID}
|
||||
|
||||
|
||||
@app.post("/shorten", response_model=ShortenResponse)
|
||||
async def shorten_url(request: ShortenRequest, req: Request):
|
||||
"""
|
||||
Create a shortened URL.
|
||||
|
||||
Process:
|
||||
1. Generate unique ID using Snowflake
|
||||
2. Encode as base62 for short code
|
||||
3. Store in PostgreSQL
|
||||
4. Cache in Redis
|
||||
"""
|
||||
original_url = str(request.url)
|
||||
|
||||
# Validate URL has a valid domain
|
||||
parsed = urlparse(original_url)
|
||||
if not parsed.netloc:
|
||||
raise HTTPException(status_code=400, detail="Invalid URL")
|
||||
|
||||
# Generate short code
|
||||
if request.custom_code:
|
||||
short_code = request.custom_code
|
||||
# Check if custom code already exists
|
||||
existing = await redis_client.get(f"url:{short_code}")
|
||||
if existing:
|
||||
raise HTTPException(status_code=409, detail="Custom code already in use")
|
||||
else:
|
||||
# Generate using Snowflake + base62
|
||||
snowflake_id = generate_id()
|
||||
short_code = base62_encode(snowflake_id)
|
||||
|
||||
# Get client info
|
||||
client_ip = req.headers.get("X-Real-IP", req.client.host if req.client else "unknown")
|
||||
user_agent = req.headers.get("User-Agent", "")
|
||||
|
||||
# Store in database
|
||||
try:
|
||||
await db_pool.execute(
|
||||
"""
|
||||
INSERT INTO urls (short_code, original_url, ip_address, user_agent)
|
||||
VALUES ($1, $2, $3, $4)
|
||||
""",
|
||||
short_code,
|
||||
original_url,
|
||||
client_ip,
|
||||
user_agent,
|
||||
)
|
||||
except asyncpg.UniqueViolationError:
|
||||
raise HTTPException(status_code=409, detail="Short code collision. Please retry.")
|
||||
|
||||
# Cache in Redis
|
||||
await redis_client.setex(f"url:{short_code}", CACHE_TTL, original_url)
|
||||
|
||||
return ShortenResponse(
|
||||
short_url=f"{BASE_URL}/{short_code}",
|
||||
short_code=short_code,
|
||||
original_url=original_url,
|
||||
)
|
||||
|
||||
|
||||
@app.get("/{short_code}")
|
||||
async def redirect_to_url(short_code: str, req: Request):
|
||||
"""
|
||||
Redirect to the original URL.
|
||||
|
||||
Process:
|
||||
1. Check Redis cache first (fast path)
|
||||
2. If cache miss, query PostgreSQL
|
||||
3. Update cache on miss
|
||||
4. Track click asynchronously (fire and forget)
|
||||
"""
|
||||
# Try cache first
|
||||
original_url = await redis_client.get(f"url:{short_code}")
|
||||
|
||||
if not original_url:
|
||||
# Cache miss - query database
|
||||
row = await db_pool.fetchrow(
|
||||
"SELECT original_url FROM urls WHERE short_code = $1",
|
||||
short_code,
|
||||
)
|
||||
|
||||
if not row:
|
||||
raise HTTPException(status_code=404, detail="Short URL not found")
|
||||
|
||||
original_url = row["original_url"]
|
||||
|
||||
# Populate cache
|
||||
await redis_client.setex(f"url:{short_code}", CACHE_TTL, original_url)
|
||||
|
||||
# Track click asynchronously (don't slow down redirect)
|
||||
asyncio.create_task(
|
||||
track_click(
|
||||
short_code,
|
||||
req.headers.get("X-Real-IP", req.client.host if req.client else None),
|
||||
req.headers.get("User-Agent"),
|
||||
req.headers.get("Referer"),
|
||||
)
|
||||
)
|
||||
|
||||
# 301 = permanent redirect (cacheable by browsers)
|
||||
# 302 = temporary redirect (not cached, better for analytics)
|
||||
return RedirectResponse(url=original_url, status_code=302)
|
||||
|
||||
|
||||
@app.get("/stats/{short_code}", response_model=StatsResponse)
|
||||
async def get_stats(short_code: str):
|
||||
"""Get statistics for a short URL."""
|
||||
row = await db_pool.fetchrow(
|
||||
"""
|
||||
SELECT short_code, original_url, click_count, created_at
|
||||
FROM urls WHERE short_code = $1
|
||||
""",
|
||||
short_code,
|
||||
)
|
||||
|
||||
if not row:
|
||||
raise HTTPException(status_code=404, detail="Short URL not found")
|
||||
|
||||
return StatsResponse(
|
||||
short_code=row["short_code"],
|
||||
original_url=row["original_url"],
|
||||
click_count=row["click_count"],
|
||||
created_at=row["created_at"].isoformat(),
|
||||
)
|
||||
|
||||
|
||||
async def track_click(
    short_code: str,
    ip_address: str | None,
    user_agent: str | None,
    referer: str | None,
):
    """
    Track a click event asynchronously.

    This runs in the background after the redirect is sent,
    so it doesn't slow down the user experience.

    FIX: both writes now run on a single connection inside one transaction,
    so the aggregate click_count can no longer drift from the detailed
    clicks table when the second statement fails partway through.
    """
    try:
        async with db_pool.acquire() as conn:
            async with conn.transaction():
                # Increment click count
                await conn.execute(
                    "UPDATE urls SET click_count = click_count + 1 WHERE short_code = $1",
                    short_code,
                )

                # Store detailed click record
                await conn.execute(
                    """
                    INSERT INTO clicks (short_code, ip_address, user_agent, referer)
                    VALUES ($1, $2, $3, $4)
                    """,
                    short_code,
                    ip_address,
                    user_agent,
                    referer,
                )
    except Exception as e:
        # Log but don't fail - analytics shouldn't break redirects
        print(f"[Warning] Failed to track click: {e}")
|
||||
142
app/snowflake.py
Normal file
142
app/snowflake.py
Normal file
|
|
@ -0,0 +1,142 @@
|
|||
"""
|
||||
Snowflake ID Generator for distributed unique ID generation.
|
||||
|
||||
Structure (64 bits total):
|
||||
- 1 bit: sign (always 0)
|
||||
- 41 bits: timestamp in milliseconds (69 years from epoch)
|
||||
- 10 bits: machine/worker ID (1024 unique machines)
|
||||
- 12 bits: sequence number (4096 IDs per millisecond per machine)
|
||||
|
||||
Benefits:
|
||||
- No coordination needed between machines
|
||||
- Time-sortable (IDs are roughly ordered by creation time)
|
||||
- Guaranteed unique across distributed system
|
||||
- High throughput: 4096 IDs/ms/machine = 4M IDs/second/machine
|
||||
|
||||
Used by: Twitter, Discord, Instagram (with variations)
|
||||
"""
|
||||
|
||||
import time
|
||||
import threading
|
||||
|
||||
|
||||
class SnowflakeGenerator:
    """Thread-safe generator of 64-bit, roughly time-ordered unique IDs.

    Bit layout: 41-bit millisecond timestamp | 10-bit machine ID |
    12-bit per-millisecond sequence.
    """

    # Custom epoch: Jan 1, 2024 00:00:00 UTC (extends usable time range)
    EPOCH = 1704067200000  # milliseconds

    # Bit lengths
    TIMESTAMP_BITS = 41
    MACHINE_ID_BITS = 10
    SEQUENCE_BITS = 12

    # Max values
    MAX_MACHINE_ID = (1 << MACHINE_ID_BITS) - 1  # 1023
    MAX_SEQUENCE = (1 << SEQUENCE_BITS) - 1  # 4095

    # Bit shifts
    TIMESTAMP_SHIFT = MACHINE_ID_BITS + SEQUENCE_BITS  # 22
    MACHINE_ID_SHIFT = SEQUENCE_BITS  # 12

    def __init__(self, machine_id: int):
        """
        Initialize generator with a unique machine ID.

        Args:
            machine_id: Unique identifier for this machine/worker (0-1023).

        Raises:
            ValueError: If machine_id falls outside that range.
        """
        if machine_id < 0 or machine_id > self.MAX_MACHINE_ID:
            raise ValueError(f"machine_id must be between 0 and {self.MAX_MACHINE_ID}")

        self._lock = threading.Lock()
        self.machine_id = machine_id
        # State protected by the lock: last millisecond seen, and the
        # sequence counter within that millisecond.
        self.last_timestamp = -1
        self.sequence = 0

    def _current_timestamp(self) -> int:
        """Milliseconds elapsed since the custom EPOCH."""
        return int(time.time() * 1000) - self.EPOCH

    def _wait_next_millis(self, last_timestamp: int) -> int:
        """Spin (with 0.1 ms sleeps) until the clock moves past last_timestamp."""
        now = self._current_timestamp()
        while now <= last_timestamp:
            time.sleep(0.0001)  # 0.1ms
            now = self._current_timestamp()
        return now

    def generate(self) -> int:
        """
        Generate a unique Snowflake ID.

        Thread-safe: Can be called from multiple threads.

        Returns:
            64-bit unique ID.

        Raises:
            RuntimeError: If the system clock moved backwards.
        """
        with self._lock:
            now = self._current_timestamp()

            # A backwards clock would let us re-issue old timestamps and
            # therefore duplicate IDs, so refuse outright.
            if now < self.last_timestamp:
                raise RuntimeError(
                    f"Clock moved backwards. Refusing to generate ID. "
                    f"Last: {self.last_timestamp}, Current: {now}"
                )

            if now == self.last_timestamp:
                # Same millisecond as last call: bump the sequence counter.
                self.sequence = (self.sequence + 1) & self.MAX_SEQUENCE
                if self.sequence == 0:
                    # All 4096 sequence slots used up - spin to the next ms.
                    now = self._wait_next_millis(self.last_timestamp)
            else:
                # Fresh millisecond: sequence restarts at zero.
                self.sequence = 0

            self.last_timestamp = now

            # Pack timestamp | machine | sequence into one 64-bit integer.
            return (
                (now << self.TIMESTAMP_SHIFT)
                | (self.machine_id << self.MACHINE_ID_SHIFT)
                | self.sequence
            )

    def parse(self, snowflake_id: int) -> dict:
        """
        Parse a Snowflake ID into its components.

        Useful for debugging and understanding ID generation.
        """
        # Shift the custom-epoch offset back to a Unix-epoch millisecond value.
        unix_ms = (snowflake_id >> self.TIMESTAMP_SHIFT) + self.EPOCH
        return {
            "timestamp_ms": unix_ms,
            "timestamp_iso": time.strftime(
                "%Y-%m-%d %H:%M:%S", time.gmtime(unix_ms / 1000)
            ),
            "machine_id": (snowflake_id >> self.MACHINE_ID_SHIFT) & self.MAX_MACHINE_ID,
            "sequence": snowflake_id & self.MAX_SEQUENCE,
        }
|
||||
|
||||
|
||||
# Module-level generator (initialized in main.py)
_generator: SnowflakeGenerator | None = None


def init_generator(machine_id: int) -> None:
    """Initialize the global Snowflake generator."""
    global _generator
    _generator = SnowflakeGenerator(machine_id)


def generate_id() -> int:
    """Generate a unique Snowflake ID using the global generator."""
    gen = _generator
    if gen is None:
        raise RuntimeError("Snowflake generator not initialized. Call init_generator() first.")
    return gen.generate()
|
||||
55
nginx/nginx.conf
Normal file
55
nginx/nginx.conf
Normal file
|
|
@ -0,0 +1,55 @@
|
|||
events {
    worker_connections 1024;
}

http {
    # Upstream API servers - Docker will resolve 'api' to all instances
    upstream api_servers {
        # Load balancing method: least_conn sends to least busy server
        # Other options: round_robin (default), ip_hash, random
        least_conn;

        # Docker Compose service discovery
        server api:8000;

        # When scaling manually, you'd list servers like:
        # server api_1:8000;
        # server api_2:8000;
        # server api_3:8000;
    }

    # Rate limiting zone: 10 requests per second per client IP, keyed on the
    # compact binary address; the 10m shared-memory zone bounds how many
    # distinct client states are tracked at once.
    limit_req_zone $binary_remote_addr zone=api_limit:10m rate=10r/s;

    server {
        listen 80;
        server_name localhost;

        # Health check endpoint, answered by nginx itself (never proxied),
        # so the balancer reports up even while backends restart.
        location /health {
            access_log off;
            return 200 "OK\n";
            add_header Content-Type text/plain;
        }

        # API endpoints
        location / {
            # Apply rate limiting with burst: up to 20 excess requests are
            # admitted immediately (nodelay) before clients get rejected.
            limit_req zone=api_limit burst=20 nodelay;

            proxy_pass http://api_servers;
            # NOTE(review): with HTTP/1.1 to the upstream, consider adding
            # 'proxy_set_header Connection ""' here and a 'keepalive'
            # directive in the upstream block to reuse backend connections
            # - confirm against the nginx upstream keepalive docs.
            proxy_http_version 1.1;

            # Pass client info to backend (the API reads X-Real-IP)
            proxy_set_header Host $host;
            proxy_set_header X-Real-IP $remote_addr;
            proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
            proxy_set_header X-Forwarded-Proto $scheme;

            # Timeouts
            proxy_connect_timeout 5s;
            proxy_send_timeout 10s;
            proxy_read_timeout 10s;
        }
    }
}
|
||||
Loading…
Add table
Add a link
Reference in a new issue