chore: create script for selfhosted reflector (#866)
* self-hosted with own GPU
* add optional Ollama model
* Garage ports
* expose ports and change curl
* custom domain
* try to fix worker
* build locally
* documentation
* docs format
* pre-commit
committed by GitHub
parent a8ad237d85
commit cdd974b935

scripts/setup-selfhosted.sh (executable file, 945 lines added)
@@ -0,0 +1,945 @@
#!/usr/bin/env bash
#
# Self-hosted production setup for Reflector.
# Single script to configure and launch everything on one server.
#
# Usage:
#   ./scripts/setup-selfhosted.sh <--gpu|--cpu> [--ollama-gpu|--ollama-cpu] [--llm-model MODEL] [--garage] [--caddy] [--domain DOMAIN] [--build]
#
# Specialized models (pick ONE — required):
#   --gpu              NVIDIA GPU for transcription/diarization/translation
#   --cpu              CPU-only for transcription/diarization/translation (slower)
#
# Local LLM (optional — for summarization & topic detection):
#   --ollama-gpu       Local Ollama with NVIDIA GPU acceleration
#   --ollama-cpu       Local Ollama on CPU only
#   --llm-model MODEL  Ollama model to use (default: qwen2.5:14b)
#                      (If omitted, configure an external OpenAI-compatible LLM in server/.env)
#
# Optional flags:
#   --garage           Use Garage for local S3-compatible storage
#   --caddy            Enable Caddy reverse proxy with auto-SSL
#   --domain DOMAIN    Use a real domain for Caddy (enables Let's Encrypt auto-HTTPS)
#                      Requires: DNS pointing to this server + ports 80/443 open
#                      Without --domain: Caddy uses self-signed cert for IP access
#   --build            Build backend and frontend images from source instead of pulling
#
# Examples:
#   ./scripts/setup-selfhosted.sh --gpu --ollama-gpu --garage --caddy
#   ./scripts/setup-selfhosted.sh --gpu --ollama-gpu --garage --caddy --domain reflector.example.com
#   ./scripts/setup-selfhosted.sh --cpu --ollama-cpu --garage --caddy
#   ./scripts/setup-selfhosted.sh --gpu --ollama-gpu --llm-model mistral --garage --caddy
#   ./scripts/setup-selfhosted.sh --gpu --garage --caddy
#   ./scripts/setup-selfhosted.sh --cpu
#
# Idempotent — safe to re-run at any time.
#
set -euo pipefail

SCRIPT_DIR="$(cd "$(dirname "${BASH_SOURCE[0]}")" && pwd)"
ROOT_DIR="$(cd "$SCRIPT_DIR/.." && pwd)"

COMPOSE_FILE="$ROOT_DIR/docker-compose.selfhosted.yml"
SERVER_ENV="$ROOT_DIR/server/.env"
WWW_ENV="$ROOT_DIR/www/.env"

OLLAMA_MODEL="qwen2.5:14b"
OS="$(uname -s)"

# --- Colors ---
RED='\033[0;31m'
GREEN='\033[0;32m'
YELLOW='\033[1;33m'
CYAN='\033[0;36m'
NC='\033[0m'

info() { echo -e "${CYAN}==>${NC} $*"; }
ok()   { echo -e "${GREEN} ✓${NC} $*"; }
warn() { echo -e "${YELLOW} !${NC} $*"; }
err()  { echo -e "${RED} ✗${NC} $*" >&2; }

# --- Helpers ---

dump_diagnostics() {
    local failed_svc="${1:-}"
    echo ""
    err "========== DIAGNOSTICS =========="

    err "Container status:"
    compose_cmd ps -a --format "table {{.Name}}\t{{.Status}}" 2>/dev/null || true
    echo ""

    local stopped
    stopped=$(compose_cmd ps -a --format '{{.Name}}\t{{.Status}}' 2>/dev/null \
        | grep -iv 'up\|running' | awk -F'\t' '{print $1}' || true)
    for c in $stopped; do
        err "--- Logs for $c (exited/unhealthy) ---"
        docker logs --tail 30 "$c" 2>&1 || true
        echo ""
    done

    if [[ -n "$failed_svc" ]]; then
        err "--- Logs for $failed_svc (last 40) ---"
        compose_cmd logs "$failed_svc" --tail 40 2>&1 || true
    fi

    err "================================="
}

trap 'dump_diagnostics' ERR

detect_lan_ip() {
    case "$OS" in
        Darwin)
            for iface in en0 en1 en2 en3; do
                local ip
                ip=$(ipconfig getifaddr "$iface" 2>/dev/null || true)
                if [[ -n "$ip" ]]; then
                    echo "$ip"
                    return
                fi
            done
            ;;
        Linux)
            ip route get 1.1.1.1 2>/dev/null | sed -n 's/.*src \([^ ]*\).*/\1/p'
            return
            ;;
    esac
    echo ""
}

wait_for_url() {
    local url="$1" label="$2" retries="${3:-30}" interval="${4:-2}"
    for i in $(seq 1 "$retries"); do
        if curl -sf "$url" > /dev/null 2>&1; then
            return 0
        fi
        echo -ne "\r Waiting for $label... ($i/$retries)"
        sleep "$interval"
    done
    echo ""
    err "$label not responding at $url after $retries attempts"
    return 1
}

env_has_key() {
    local file="$1" key="$2"
    grep -q "^${key}=" "$file" 2>/dev/null
}

env_get() {
    local file="$1" key="$2"
    grep "^${key}=" "$file" 2>/dev/null | head -1 | cut -d= -f2-
}

env_set() {
    local file="$1" key="$2" value="$3"
    if env_has_key "$file" "$key"; then
        if [[ "$OS" == "Darwin" ]]; then
            sed -i '' "s|^${key}=.*|${key}=${value}|" "$file"
        else
            sed -i "s|^${key}=.*|${key}=${value}|" "$file"
        fi
    else
        echo "${key}=${value}" >> "$file"
    fi
}
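
# Illustrative usage of the env helpers above (a sketch, not executed by the script):
# env_set upserts KEY=VALUE lines, which is what makes re-running the setup safe.
#   env_set "$SERVER_ENV" "REDIS_HOST" "redis"    # appends REDIS_HOST=redis if absent
#   env_set "$SERVER_ENV" "REDIS_HOST" "redis2"   # rewrites the existing line in place
#   env_get "$SERVER_ENV" "REDIS_HOST"            # prints "redis2"
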
compose_cmd() {
    local profiles=""
    for p in "${COMPOSE_PROFILES[@]}"; do
        profiles="$profiles --profile $p"
    done
    docker compose -f "$COMPOSE_FILE" $profiles "$@"
}

# Compose command with only garage profile (for garage-only operations before full stack start)
compose_garage_cmd() {
    docker compose -f "$COMPOSE_FILE" --profile garage "$@"
}
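
# For example, with COMPOSE_PROFILES=(gpu ollama-gpu garage), `compose_cmd up -d`
# expands to (roughly):
#   docker compose -f docker-compose.selfhosted.yml \
#     --profile gpu --profile ollama-gpu --profile garage up -d
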
# --- Parse arguments ---
MODEL_MODE=""        # gpu or cpu (required, mutually exclusive)
OLLAMA_MODE=""       # ollama-gpu or ollama-cpu (optional)
USE_GARAGE=false
USE_CADDY=false
CUSTOM_DOMAIN=""     # optional domain for Let's Encrypt HTTPS
BUILD_IMAGES=false   # build backend/frontend from source

SKIP_NEXT=false
ARGS=("$@")
for i in "${!ARGS[@]}"; do
    if [[ "$SKIP_NEXT" == "true" ]]; then
        SKIP_NEXT=false
        continue
    fi
    arg="${ARGS[$i]}"
    case "$arg" in
        --gpu)
            [[ -n "$MODEL_MODE" ]] && { err "Cannot combine --gpu and --cpu. Pick one."; exit 1; }
            MODEL_MODE="gpu" ;;
        --cpu)
            [[ -n "$MODEL_MODE" ]] && { err "Cannot combine --gpu and --cpu. Pick one."; exit 1; }
            MODEL_MODE="cpu" ;;
        --ollama-gpu)
            [[ -n "$OLLAMA_MODE" ]] && { err "Cannot combine --ollama-gpu and --ollama-cpu. Pick one."; exit 1; }
            OLLAMA_MODE="ollama-gpu" ;;
        --ollama-cpu)
            [[ -n "$OLLAMA_MODE" ]] && { err "Cannot combine --ollama-gpu and --ollama-cpu. Pick one."; exit 1; }
            OLLAMA_MODE="ollama-cpu" ;;
        --llm-model)
            next_i=$((i + 1))
            if [[ $next_i -ge ${#ARGS[@]} ]] || [[ "${ARGS[$next_i]}" == --* ]]; then
                err "--llm-model requires a model name (e.g. --llm-model mistral)"
                exit 1
            fi
            OLLAMA_MODEL="${ARGS[$next_i]}"
            SKIP_NEXT=true ;;
        --garage) USE_GARAGE=true ;;
        --caddy) USE_CADDY=true ;;
        --build) BUILD_IMAGES=true ;;
        --domain)
            next_i=$((i + 1))
            if [[ $next_i -ge ${#ARGS[@]} ]] || [[ "${ARGS[$next_i]}" == --* ]]; then
                err "--domain requires a domain name (e.g. --domain reflector.example.com)"
                exit 1
            fi
            CUSTOM_DOMAIN="${ARGS[$next_i]}"
            USE_CADDY=true # --domain implies --caddy
            SKIP_NEXT=true ;;
        *)
            err "Unknown argument: $arg"
            err "Usage: $0 <--gpu|--cpu> [--ollama-gpu|--ollama-cpu] [--llm-model MODEL] [--garage] [--caddy] [--domain DOMAIN] [--build]"
            exit 1
            ;;
    esac
done

if [[ -z "$MODEL_MODE" ]]; then
    err "No model mode specified. You must choose --gpu or --cpu."
    err ""
    err "Usage: $0 <--gpu|--cpu> [--ollama-gpu|--ollama-cpu] [--llm-model MODEL] [--garage] [--caddy] [--domain DOMAIN] [--build]"
    err ""
    err "Specialized models (required):"
    err "  --gpu              NVIDIA GPU for transcription/diarization/translation"
    err "  --cpu              CPU-only (slower but works without GPU)"
    err ""
    err "Local LLM (optional):"
    err "  --ollama-gpu       Local Ollama with GPU (for summarization/topics)"
    err "  --ollama-cpu       Local Ollama on CPU (for summarization/topics)"
    err "  --llm-model MODEL  Ollama model to download (default: qwen2.5:14b)"
    err "                     (omit --ollama-* for external OpenAI-compatible LLM)"
    err ""
    err "Other options:"
    err "  --garage           Local S3-compatible storage (Garage)"
    err "  --caddy            Caddy reverse proxy with self-signed cert"
    err "  --domain DOMAIN    Use a real domain with Let's Encrypt HTTPS (implies --caddy)"
    err "  --build            Build backend/frontend images from source instead of pulling"
    exit 1
fi

# Build profiles list — one profile per feature
COMPOSE_PROFILES=("$MODEL_MODE")
[[ -n "$OLLAMA_MODE" ]] && COMPOSE_PROFILES+=("$OLLAMA_MODE")
[[ "$USE_GARAGE" == "true" ]] && COMPOSE_PROFILES+=("garage")
[[ "$USE_CADDY" == "true" ]] && COMPOSE_PROFILES+=("caddy")
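
# For example, `./scripts/setup-selfhosted.sh --gpu --ollama-gpu --garage --caddy`
# yields COMPOSE_PROFILES=(gpu ollama-gpu garage caddy); `--cpu` alone yields
# COMPOSE_PROFILES=(cpu).
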
# Derived flags
NEEDS_NVIDIA=false
[[ "$MODEL_MODE" == "gpu" ]] && NEEDS_NVIDIA=true
[[ "$OLLAMA_MODE" == "ollama-gpu" ]] && NEEDS_NVIDIA=true

USES_OLLAMA=false
OLLAMA_SVC=""
[[ "$OLLAMA_MODE" == "ollama-gpu" ]] && USES_OLLAMA=true && OLLAMA_SVC="ollama"
[[ "$OLLAMA_MODE" == "ollama-cpu" ]] && USES_OLLAMA=true && OLLAMA_SVC="ollama-cpu"

# Human-readable mode string for display
MODE_DISPLAY="$MODEL_MODE"
[[ -n "$OLLAMA_MODE" ]] && MODE_DISPLAY="$MODEL_MODE + $OLLAMA_MODE"

# =========================================================
# Step 0: Prerequisites
# =========================================================
step_prerequisites() {
    info "Step 0: Checking prerequisites"

    # Docker
    if ! docker compose version 2>/dev/null | grep -qi compose; then
        err "Docker Compose V2 not found."
        err "Install Docker with Compose V2: https://docs.docker.com/engine/install/"
        exit 1
    fi
    if ! docker info &>/dev/null; then
        err "Docker daemon not running."
        exit 1
    fi
    ok "Docker + Compose V2 ready"

    # NVIDIA GPU check
    if [[ "$NEEDS_NVIDIA" == "true" ]]; then
        if ! command -v nvidia-smi &>/dev/null || ! nvidia-smi &>/dev/null; then
            err "NVIDIA GPU required (model=$MODEL_MODE, ollama=$OLLAMA_MODE) but nvidia-smi failed."
            err "Install NVIDIA drivers and nvidia-container-toolkit."
            exit 1
        fi
        ok "NVIDIA GPU detected"
    fi

    # Compose file
    if [[ ! -f "$COMPOSE_FILE" ]]; then
        err "docker-compose.selfhosted.yml not found at $COMPOSE_FILE"
        err "Run this script from the repo root: ./scripts/setup-selfhosted.sh"
        exit 1
    fi

    ok "Prerequisites OK (models=$MODEL_MODE, ollama=$OLLAMA_MODE, garage=$USE_GARAGE, caddy=$USE_CADDY)"
}

# =========================================================
# Step 1: Generate secrets
# =========================================================
step_secrets() {
    info "Step 1: Generating secrets"

    # These are used in later steps — generate once, reuse
    if [[ -f "$SERVER_ENV" ]] && env_has_key "$SERVER_ENV" "SECRET_KEY"; then
        SECRET_KEY=$(env_get "$SERVER_ENV" "SECRET_KEY")
        if [[ "$SECRET_KEY" != "changeme"* ]]; then
            ok "SECRET_KEY already set"
        else
            SECRET_KEY=$(openssl rand -hex 32)
        fi
    else
        SECRET_KEY=$(openssl rand -hex 32)
    fi

    if [[ -f "$WWW_ENV" ]] && env_has_key "$WWW_ENV" "NEXTAUTH_SECRET"; then
        NEXTAUTH_SECRET=$(env_get "$WWW_ENV" "NEXTAUTH_SECRET")
        if [[ "$NEXTAUTH_SECRET" != "changeme"* ]]; then
            ok "NEXTAUTH_SECRET already set"
        else
            NEXTAUTH_SECRET=$(openssl rand -hex 32)
        fi
    else
        NEXTAUTH_SECRET=$(openssl rand -hex 32)
    fi

    ok "Secrets ready"
}

# =========================================================
# Step 2: Generate server/.env
# =========================================================
step_server_env() {
    info "Step 2: Generating server/.env"

    if [[ -f "$SERVER_ENV" ]]; then
        ok "server/.env already exists — ensuring required vars"
    else
        cp "$ROOT_DIR/server/.env.selfhosted.example" "$SERVER_ENV"
        ok "Created server/.env from template"
    fi

    # Core infrastructure
    env_set "$SERVER_ENV" "DATABASE_URL" "postgresql+asyncpg://reflector:reflector@postgres:5432/reflector"
    env_set "$SERVER_ENV" "REDIS_HOST" "redis"
    env_set "$SERVER_ENV" "CELERY_BROKER_URL" "redis://redis:6379/1"
    env_set "$SERVER_ENV" "CELERY_RESULT_BACKEND" "redis://redis:6379/1"
    env_set "$SERVER_ENV" "SECRET_KEY" "$SECRET_KEY"
    env_set "$SERVER_ENV" "AUTH_BACKEND" "none"
    env_set "$SERVER_ENV" "PUBLIC_MODE" "true"

    # Public-facing URLs
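    # For example: --domain reflector.example.com gives https://reflector.example.com,
    # --caddy without a domain gives https://<detected LAN IP>, and with neither the
    # API stays plain HTTP (http://<detected LAN IP> or http://localhost:1250).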
    local server_base_url
    if [[ -n "$CUSTOM_DOMAIN" ]]; then
        server_base_url="https://$CUSTOM_DOMAIN"
    elif [[ "$USE_CADDY" == "true" ]]; then
        if [[ -n "$PRIMARY_IP" ]]; then
            server_base_url="https://$PRIMARY_IP"
        else
            server_base_url="https://localhost"
        fi
    else
        if [[ -n "$PRIMARY_IP" ]]; then
            server_base_url="http://$PRIMARY_IP"
        else
            server_base_url="http://localhost:1250"
        fi
    fi
    env_set "$SERVER_ENV" "BASE_URL" "$server_base_url"
    env_set "$SERVER_ENV" "CORS_ORIGIN" "$server_base_url"

    # WebRTC: advertise host IP in ICE candidates so browsers can reach the server
    if [[ -n "$PRIMARY_IP" ]]; then
        env_set "$SERVER_ENV" "WEBRTC_HOST" "$PRIMARY_IP"
    fi

    # Specialized models (always via gpu/cpu container aliased as "transcription")
    env_set "$SERVER_ENV" "TRANSCRIPT_BACKEND" "modal"
    env_set "$SERVER_ENV" "TRANSCRIPT_URL" "http://transcription:8000"
    env_set "$SERVER_ENV" "TRANSCRIPT_MODAL_API_KEY" "selfhosted"
    env_set "$SERVER_ENV" "DIARIZATION_ENABLED" "true"
    env_set "$SERVER_ENV" "DIARIZATION_BACKEND" "modal"
    env_set "$SERVER_ENV" "DIARIZATION_URL" "http://transcription:8000"
    env_set "$SERVER_ENV" "TRANSLATION_BACKEND" "modal"
    env_set "$SERVER_ENV" "TRANSLATE_URL" "http://transcription:8000"

    # HuggingFace token for gated models (pyannote diarization)
    # Written to root .env so docker compose picks it up for gpu/cpu containers
    local root_env="$ROOT_DIR/.env"
    local current_hf_token="${HF_TOKEN:-}"
    if [[ -f "$root_env" ]] && env_has_key "$root_env" "HF_TOKEN"; then
        current_hf_token=$(env_get "$root_env" "HF_TOKEN")
    fi
    if [[ -z "$current_hf_token" ]]; then
        echo ""
        warn "HF_TOKEN not set. Diarization will use a public model fallback."
        warn "For best results, get a token at https://huggingface.co/settings/tokens"
        warn "and accept pyannote licenses at https://huggingface.co/pyannote/speaker-diarization-3.1"
        read -rp " HuggingFace token (or press Enter to skip): " current_hf_token
    fi
    if [[ -n "$current_hf_token" ]]; then
        touch "$root_env"
        env_set "$root_env" "HF_TOKEN" "$current_hf_token"
        export HF_TOKEN="$current_hf_token"
        ok "HF_TOKEN configured"
    else
        touch "$root_env"
        env_set "$root_env" "HF_TOKEN" ""
        ok "HF_TOKEN skipped (using public model fallback)"
    fi

    # LLM configuration
    if [[ "$USES_OLLAMA" == "true" ]]; then
        local llm_host="$OLLAMA_SVC"
        env_set "$SERVER_ENV" "LLM_URL" "http://${llm_host}:11434/v1"
        env_set "$SERVER_ENV" "LLM_MODEL" "$OLLAMA_MODEL"
        env_set "$SERVER_ENV" "LLM_API_KEY" "not-needed"
        ok "LLM configured for local Ollama ($llm_host, model=$OLLAMA_MODEL)"
    else
        # Check if user already configured LLM
        local current_llm_url=""
        if env_has_key "$SERVER_ENV" "LLM_URL"; then
            current_llm_url=$(env_get "$SERVER_ENV" "LLM_URL")
        fi
        if [[ -z "$current_llm_url" ]] || [[ "$current_llm_url" == "http://host.docker.internal"* ]]; then
            warn "LLM not configured. Summarization and topic detection will NOT work."
            warn "Edit server/.env and set LLM_URL, LLM_API_KEY, LLM_MODEL"
            warn "Example: LLM_URL=https://api.openai.com/v1 LLM_MODEL=gpt-4o-mini"
        else
            ok "LLM already configured: $current_llm_url"
        fi
    fi

    ok "server/.env ready"
}

# =========================================================
# Step 3: Generate www/.env
# =========================================================
step_www_env() {
    info "Step 3: Generating www/.env"

    if [[ -f "$WWW_ENV" ]]; then
        ok "www/.env already exists — ensuring required vars"
    else
        cp "$ROOT_DIR/www/.env.selfhosted.example" "$WWW_ENV"
        ok "Created www/.env from template"
    fi

    # Public-facing URL for frontend
    local base_url
    if [[ -n "$CUSTOM_DOMAIN" ]]; then
        base_url="https://$CUSTOM_DOMAIN"
    elif [[ "$USE_CADDY" == "true" ]]; then
        if [[ -n "$PRIMARY_IP" ]]; then
            base_url="https://$PRIMARY_IP"
        else
            base_url="https://localhost"
        fi
    else
        # No Caddy — user's proxy handles SSL. Use http for now, they'll override.
        if [[ -n "$PRIMARY_IP" ]]; then
            base_url="http://$PRIMARY_IP"
        else
            base_url="http://localhost"
        fi
    fi

    env_set "$WWW_ENV" "SITE_URL" "$base_url"
    env_set "$WWW_ENV" "NEXTAUTH_URL" "$base_url"
    env_set "$WWW_ENV" "NEXTAUTH_SECRET" "$NEXTAUTH_SECRET"
    env_set "$WWW_ENV" "API_URL" "$base_url"
    env_set "$WWW_ENV" "WEBSOCKET_URL" "auto"
    env_set "$WWW_ENV" "SERVER_API_URL" "http://server:1250"
    env_set "$WWW_ENV" "KV_URL" "redis://redis:6379"
    env_set "$WWW_ENV" "FEATURE_REQUIRE_LOGIN" "false"

    ok "www/.env ready (URL=$base_url)"
}

# =========================================================
# Step 4: Storage setup
# =========================================================
step_storage() {
    info "Step 4: Storage setup"

    if [[ "$USE_GARAGE" == "true" ]]; then
        step_garage
    else
        step_external_s3
    fi
}

step_garage() {
    info "Configuring Garage (local S3)"

    # Generate garage.toml from template
    local garage_toml="$ROOT_DIR/scripts/garage.toml"
    local garage_runtime="$ROOT_DIR/data/garage.toml"
    mkdir -p "$ROOT_DIR/data"

    if [[ -d "$garage_runtime" ]]; then
        rm -rf "$garage_runtime"
    fi
    if [[ ! -f "$garage_runtime" ]]; then
        local rpc_secret
        rpc_secret=$(openssl rand -hex 32)
        sed "s|__GARAGE_RPC_SECRET__|${rpc_secret}|" "$garage_toml" > "$garage_runtime"
        ok "Generated data/garage.toml"
    else
        ok "data/garage.toml already exists"
    fi

    # Start garage container only
    compose_garage_cmd up -d garage

    # Wait for admin API (port 3903 exposed to host for health checks)
    local garage_ready=false
    for i in $(seq 1 30); do
        if curl -sf http://localhost:3903/metrics > /dev/null 2>&1; then
            garage_ready=true
            break
        fi
        echo -ne "\r Waiting for Garage admin API... ($i/30)"
        sleep 2
    done
    echo ""
    if [[ "$garage_ready" != "true" ]]; then
        err "Garage not responding. Check: docker compose logs garage"
        exit 1
    fi

    # Layout
    local node_id
    node_id=$(compose_garage_cmd exec -T garage /garage node id -q 2>/dev/null | tr -d '[:space:]')
    local layout_status
    layout_status=$(compose_garage_cmd exec -T garage /garage layout show 2>&1 || true)
    if echo "$layout_status" | grep -q "No nodes"; then
        compose_garage_cmd exec -T garage /garage layout assign "$node_id" -c 1G -z dc1
        compose_garage_cmd exec -T garage /garage layout apply --version 1
    fi

    # Bucket
    if ! compose_garage_cmd exec -T garage /garage bucket info reflector-media &>/dev/null; then
        compose_garage_cmd exec -T garage /garage bucket create reflector-media
    fi

    # Key
    local created_key=false
    if compose_garage_cmd exec -T garage /garage key info reflector &>/dev/null; then
        ok "Key 'reflector' already exists"
    else
        KEY_OUTPUT=$(compose_garage_cmd exec -T garage /garage key create reflector)
        created_key=true
    fi

    # Permissions
    compose_garage_cmd exec -T garage /garage bucket allow reflector-media --read --write --key reflector

    # Write S3 credentials to server/.env
    env_set "$SERVER_ENV" "TRANSCRIPT_STORAGE_BACKEND" "aws"
    env_set "$SERVER_ENV" "TRANSCRIPT_STORAGE_AWS_ENDPOINT_URL" "http://garage:3900"
    env_set "$SERVER_ENV" "TRANSCRIPT_STORAGE_AWS_BUCKET_NAME" "reflector-media"
    env_set "$SERVER_ENV" "TRANSCRIPT_STORAGE_AWS_REGION" "garage"
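    # The block below scrapes the new credentials out of `garage key create` output;
    # it assumes lines of the form "Key ID: GK..." and "Secret key: ..." (typical
    # Garage CLI output, though the exact wording may vary between Garage versions).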
    if [[ "$created_key" == "true" ]]; then
        local key_id key_secret
        key_id=$(echo "$KEY_OUTPUT" | grep -i "key id" | awk '{print $NF}')
        key_secret=$(echo "$KEY_OUTPUT" | grep -i "secret key" | awk '{print $NF}')
        env_set "$SERVER_ENV" "TRANSCRIPT_STORAGE_AWS_ACCESS_KEY_ID" "$key_id"
        env_set "$SERVER_ENV" "TRANSCRIPT_STORAGE_AWS_SECRET_ACCESS_KEY" "$key_secret"
    fi

    ok "Garage storage ready"
}

step_external_s3() {
    info "Checking external S3 configuration"

    env_set "$SERVER_ENV" "TRANSCRIPT_STORAGE_BACKEND" "aws"

    local s3_vars=("TRANSCRIPT_STORAGE_AWS_ACCESS_KEY_ID" "TRANSCRIPT_STORAGE_AWS_SECRET_ACCESS_KEY" "TRANSCRIPT_STORAGE_AWS_BUCKET_NAME" "TRANSCRIPT_STORAGE_AWS_REGION")
    local missing=()

    for var in "${s3_vars[@]}"; do
        if ! env_has_key "$SERVER_ENV" "$var" || [[ -z "$(env_get "$SERVER_ENV" "$var")" ]]; then
            missing+=("$var")
        fi
    done

    if [[ ${#missing[@]} -gt 0 ]]; then
        warn "S3 storage is REQUIRED. The following vars are missing in server/.env:"
        for var in "${missing[@]}"; do
            warn " $var"
        done
        echo ""
        info "Enter S3 credentials (or press Ctrl+C to abort and edit server/.env manually):"
        echo ""

        for var in "${missing[@]}"; do
            local prompt_label
            case "$var" in
                *ACCESS_KEY_ID) prompt_label="Access Key ID" ;;
                *SECRET_ACCESS_KEY) prompt_label="Secret Access Key" ;;
                *BUCKET_NAME) prompt_label="Bucket Name" ;;
                *REGION) prompt_label="Region (e.g. us-east-1)" ;;
            esac
            local value=""
            while [[ -z "$value" ]]; do
                read -rp " $prompt_label: " value
            done
            env_set "$SERVER_ENV" "$var" "$value"
        done

        # Optional: endpoint URL for non-AWS S3
        echo ""
        read -rp " S3 Endpoint URL (leave empty for AWS, or enter for MinIO/etc.): " endpoint_url
        if [[ -n "$endpoint_url" ]]; then
            env_set "$SERVER_ENV" "TRANSCRIPT_STORAGE_AWS_ENDPOINT_URL" "$endpoint_url"
        fi
    fi

    ok "S3 storage configured"
}

# =========================================================
# Step 5: Caddyfile
# =========================================================
step_caddyfile() {
    if [[ "$USE_CADDY" != "true" ]]; then
        return
    fi

    info "Step 5: Caddyfile setup"

    local caddyfile="$ROOT_DIR/Caddyfile"
    if [[ -d "$caddyfile" ]]; then
        rm -rf "$caddyfile"
    fi

    if [[ -n "$CUSTOM_DOMAIN" ]]; then
        # Real domain: Caddy auto-provisions Let's Encrypt certificate
        cat > "$caddyfile" << CADDYEOF
# Generated by setup-selfhosted.sh — Let's Encrypt HTTPS for $CUSTOM_DOMAIN
$CUSTOM_DOMAIN {
    handle /v1/* {
        reverse_proxy server:1250
    }
    handle /health {
        reverse_proxy server:1250
    }
    handle {
        reverse_proxy web:3000
    }
}
CADDYEOF
        ok "Created Caddyfile for $CUSTOM_DOMAIN (Let's Encrypt auto-HTTPS)"
    elif [[ -n "$PRIMARY_IP" ]]; then
        # No domain, IP only: catch-all :443 with self-signed cert
        # (IP connections don't send SNI, so we can't match by address)
        cat > "$caddyfile" << CADDYEOF
# Generated by setup-selfhosted.sh — self-signed cert for IP access
:443 {
    tls internal
    handle /v1/* {
        reverse_proxy server:1250
    }
    handle /health {
        reverse_proxy server:1250
    }
    handle {
        reverse_proxy web:3000
    }
}
CADDYEOF
        ok "Created Caddyfile for $PRIMARY_IP (catch-all :443 with self-signed cert)"
    elif [[ ! -f "$caddyfile" ]]; then
        cp "$ROOT_DIR/Caddyfile.selfhosted.example" "$caddyfile"
        ok "Created Caddyfile from template"
    else
        ok "Caddyfile already exists"
    fi
}

# =========================================================
# Step 6: Start services
# =========================================================
step_services() {
    info "Step 6: Starting Docker services"

    # Build GPU/CPU image from source (always needed — no prebuilt image)
    local build_svc="$MODEL_MODE"
    info "Building $build_svc image (first build downloads ML models, may take a while)..."
    compose_cmd build "$build_svc"
    ok "$build_svc image built"

    # Build or pull backend and frontend images
    if [[ "$BUILD_IMAGES" == "true" ]]; then
        info "Building backend image from source (server, worker, beat)..."
        compose_cmd build server worker beat
        ok "Backend image built"
        info "Building frontend image from source..."
        compose_cmd build web
        ok "Frontend image built"
    else
        info "Pulling latest backend and frontend images..."
        compose_cmd pull server web || warn "Pull failed — using cached images"
    fi

    # Start all services
    compose_cmd up -d
    ok "Containers started"

    # Quick sanity check
    sleep 3
    local exited
    exited=$(compose_cmd ps -a --format '{{.Name}} {{.Status}}' 2>/dev/null \
        | grep -i 'exit' || true)
    if [[ -n "$exited" ]]; then
        warn "Some containers exited immediately:"
        echo "$exited" | while read -r line; do warn " $line"; done
        dump_diagnostics
    fi
}

# =========================================================
# Step 7: Health checks
# =========================================================
step_health() {
    info "Step 7: Health checks"
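
    # The checks below probe host ports that docker-compose.selfhosted.yml is assumed
    # to publish: 8000 (gpu/cpu model service), 11434 (Ollama), 1250 (API), 3000 (web).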

    # Specialized model service (gpu or cpu)
    local model_svc="$MODEL_MODE"

    info "Waiting for $model_svc service (first start downloads ~1GB of models)..."
    local model_ok=false
    for i in $(seq 1 120); do
        if curl -sf http://localhost:8000/docs > /dev/null 2>&1; then
            model_ok=true
            break
        fi
        echo -ne "\r Waiting for $model_svc service... ($i/120)"
        sleep 5
    done
    echo ""
    if [[ "$model_ok" == "true" ]]; then
        ok "$model_svc service healthy (transcription + diarization)"
    else
        warn "$model_svc service not ready yet — it will keep loading in the background"
        warn "Check with: docker compose -f docker-compose.selfhosted.yml logs $model_svc"
    fi

    # Ollama (if applicable)
    if [[ "$USES_OLLAMA" == "true" ]]; then
        info "Waiting for Ollama service..."
        local ollama_ok=false
        for i in $(seq 1 60); do
            if curl -sf http://localhost:11434/api/tags > /dev/null 2>&1; then
                ollama_ok=true
                break
            fi
            echo -ne "\r Waiting for Ollama... ($i/60)"
            sleep 3
        done
        echo ""
        if [[ "$ollama_ok" == "true" ]]; then
            ok "Ollama service healthy"

            # Pull model if not present
            if compose_cmd exec -T "$OLLAMA_SVC" ollama list 2>/dev/null | awk '{print $1}' | grep -qxF "$OLLAMA_MODEL"; then
                ok "Model $OLLAMA_MODEL already pulled"
            else
                info "Pulling model $OLLAMA_MODEL (this may take a while)..."
                compose_cmd exec -T "$OLLAMA_SVC" ollama pull "$OLLAMA_MODEL"
                ok "Model $OLLAMA_MODEL pulled"
            fi
        else
            warn "Ollama not ready yet. Check: docker compose logs $OLLAMA_SVC"
        fi
    fi

    # Server API
    info "Waiting for Server API (first run includes database migrations)..."
    local server_ok=false
    for i in $(seq 1 90); do
        local svc_status
        svc_status=$(compose_cmd ps server --format '{{.Status}}' 2>/dev/null || true)
        if [[ -z "$svc_status" ]] || echo "$svc_status" | grep -qi 'exit'; then
            echo ""
            err "Server container exited unexpectedly"
            dump_diagnostics server
            exit 1
        fi
        if curl -sf http://localhost:1250/health > /dev/null 2>&1; then
            server_ok=true
            break
        fi
        echo -ne "\r Waiting for Server API... ($i/90)"
        sleep 5
    done
    echo ""
    if [[ "$server_ok" == "true" ]]; then
        ok "Server API healthy"
    else
        err "Server API not ready after ~7 minutes"
        dump_diagnostics server
        exit 1
    fi

    # Frontend
    info "Waiting for Frontend..."
    local web_ok=false
    for i in $(seq 1 30); do
        if curl -sf http://localhost:3000 > /dev/null 2>&1; then
            web_ok=true
            break
        fi
        echo -ne "\r Waiting for Frontend... ($i/30)"
        sleep 3
    done
    echo ""
    if [[ "$web_ok" == "true" ]]; then
        ok "Frontend healthy"
    else
        warn "Frontend not responding. Check: docker compose logs web"
    fi

    # Caddy
    if [[ "$USE_CADDY" == "true" ]]; then
        sleep 2
        if curl -sfk "https://localhost" > /dev/null 2>&1; then
            ok "Caddy proxy healthy"
        else
            warn "Caddy proxy not responding. Check: docker compose logs caddy"
        fi
    fi

    # LLM warning for non-Ollama modes
    if [[ "$USES_OLLAMA" == "false" ]]; then
        local llm_url=""
        if env_has_key "$SERVER_ENV" "LLM_URL"; then
            llm_url=$(env_get "$SERVER_ENV" "LLM_URL")
        fi
        if [[ -z "$llm_url" ]]; then
            echo ""
            warn "LLM is not configured. Transcription will work, but:"
            warn " - Summaries will NOT be generated"
            warn " - Topics will NOT be detected"
            warn " - Titles will NOT be auto-generated"
            warn "Configure in server/.env: LLM_URL, LLM_API_KEY, LLM_MODEL"
        fi
    fi
}

# =========================================================
# Main
# =========================================================
main() {
    echo ""
    echo "=========================================="
    echo " Reflector — Self-Hosted Production Setup"
    echo "=========================================="
    echo ""
    echo " Models: $MODEL_MODE"
    echo " LLM: ${OLLAMA_MODE:-external}"
    echo " Garage: $USE_GARAGE"
    echo " Caddy: $USE_CADDY"
    [[ -n "$CUSTOM_DOMAIN" ]] && echo " Domain: $CUSTOM_DOMAIN"
    [[ "$BUILD_IMAGES" == "true" ]] && echo " Build: from source"
    echo ""

    # Detect primary IP
    PRIMARY_IP=""
    if [[ "$OS" == "Linux" ]]; then
        PRIMARY_IP=$(hostname -I 2>/dev/null | awk '{print $1}' || true)
        if [[ "$PRIMARY_IP" == "127."* ]] || [[ -z "$PRIMARY_IP" ]]; then
            PRIMARY_IP=$(ip -4 route get 1 2>/dev/null | sed -n 's/.*src \([0-9.]*\).*/\1/p' || true)
        fi
    fi

    # Touch env files so compose doesn't complain about missing env_file
    mkdir -p "$ROOT_DIR/data"
    touch "$SERVER_ENV" "$WWW_ENV"

    # Ensure garage.toml exists if garage profile is active (compose needs it for volume mount)
    if [[ "$USE_GARAGE" == "true" ]]; then
        local garage_runtime="$ROOT_DIR/data/garage.toml"
        if [[ ! -f "$garage_runtime" ]]; then
            local rpc_secret
            rpc_secret=$(openssl rand -hex 32)
            sed "s|__GARAGE_RPC_SECRET__|${rpc_secret}|" "$ROOT_DIR/scripts/garage.toml" > "$garage_runtime"
        fi
    fi

    step_prerequisites
    echo ""
    step_secrets
    echo ""
    step_server_env
    echo ""
    step_www_env
    echo ""
    step_storage
    echo ""
    step_caddyfile
    echo ""
    step_services
    echo ""
    step_health

    echo ""
    echo "=========================================="
    echo -e " ${GREEN}Reflector is running!${NC}"
    echo "=========================================="
    echo ""
    if [[ "$USE_CADDY" == "true" ]]; then
        if [[ -n "$CUSTOM_DOMAIN" ]]; then
            echo " App: https://$CUSTOM_DOMAIN"
            echo " API: https://$CUSTOM_DOMAIN/v1/"
        elif [[ -n "$PRIMARY_IP" ]]; then
            echo " App: https://$PRIMARY_IP (accept self-signed cert in browser)"
            echo " API: https://$PRIMARY_IP/v1/"
            echo " Local: https://localhost"
        else
            echo " App: https://localhost (accept self-signed cert in browser)"
            echo " API: https://localhost/v1/"
        fi
    else
        echo " No Caddy — point your reverse proxy at:"
        echo " Frontend: web:3000 (or localhost:3000 from host)"
        echo " API: server:1250 (or localhost:1250 from host)"
    fi
    echo ""
    echo " Models: $MODEL_MODE (transcription/diarization/translation)"
    [[ "$USE_GARAGE" == "true" ]] && echo " Storage: Garage (local S3)"
    [[ "$USE_GARAGE" != "true" ]] && echo " Storage: External S3"
    [[ "$USES_OLLAMA" == "true" ]] && echo " LLM: Ollama ($OLLAMA_MODEL) for summarization/topics"
    [[ "$USES_OLLAMA" != "true" ]] && echo " LLM: External (configure in server/.env)"
    echo ""
    echo " To stop: docker compose -f docker-compose.selfhosted.yml down"
    echo " To re-run: ./scripts/setup-selfhosted.sh $*"
    echo ""
}

main "$@"