diff --git a/.bumpversion.cfg b/.bumpversion.cfg
index 37ef7924..151a8ac0 100644
--- a/.bumpversion.cfg
+++ b/.bumpversion.cfg
@@ -1,5 +1,5 @@
 [bumpversion]
-current_version = 0.1.12
+current_version = 0.1.13
 commit = True
 tag = True
 tag_name = v{new_version}
diff --git a/.dockerignore b/.dockerignore
new file mode 100644
index 00000000..1f1ea4be
--- /dev/null
+++ b/.dockerignore
@@ -0,0 +1,55 @@
+# Dependencies
+node_modules/
+__pycache__/
+*.pyc
+*.pyo
+*.pyd
+.Python
+env/
+venv/
+
+# Build outputs
+build/
+*.egg-info/
+.eggs/
+target/
+
+# Keep web/dist for the Docker image
+!web/dist
+
+# Development
+.git/
+.github/
+.vscode/
+.idea/
+*.swp
+*.swo
+*~
+
+# Data and logs
+data/
+*.log
+*.sqlite
+*.db
+
+# OS
+.DS_Store
+Thumbs.db
+
+# Documentation
+docs/
+landing/
+mlx-test/
+
+# Test files
+*.test.ts
+*.test.tsx
+*.spec.ts
+*.spec.tsx
+
+# Keep these out
+.env
+.env.local
+*.pem
+*.key
+credentials.json
diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml
index 9e65f520..d102274c 100644
--- a/.github/workflows/release.yml
+++ b/.github/workflows/release.yml
@@ -6,7 +6,151 @@ on:
     tags:
       - "v*"
 
+env:
+  PROVIDER_VERSION: "1.0.0"
+
 jobs:
+  # ============================================
+  # Build TTS Providers (uploaded to R2, not GitHub)
+  # ============================================
+  build-providers:
+    runs-on: ${{ matrix.platform }}
+    strategy:
+      fail-fast: false
+      matrix:
+        include:
+          # PyTorch CPU provider (Windows)
+          - platform: "windows-latest"
+            provider: "pytorch-cpu"
+            python-version: "3.12"
+          # PyTorch CUDA provider (Windows) - large binary, uploaded to R2
+          - platform: "windows-latest"
+            provider: "pytorch-cuda"
+            python-version: "3.12"
+          # PyTorch CPU provider (Linux)
+          - platform: "ubuntu-22.04"
+            provider: "pytorch-cpu"
+            python-version: "3.12"
+          # PyTorch CUDA provider (Linux) - large binary, uploaded to R2
+          - platform: "ubuntu-22.04"
+            provider: "pytorch-cuda"
+            python-version: "3.12"
+          # PyTorch CPU provider (macOS Apple Silicon)
+          - platform: "macos-latest"
+            provider: "pytorch-cpu"
+            python-version: "3.12"
+          # PyTorch CPU provider (macOS Intel)
+          - platform: "macos-15-intel"
+            provider: "pytorch-cpu"
+            python-version: "3.12"
+
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Install dependencies (ubuntu only)
+        if: matrix.platform == 'ubuntu-22.04'
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y llvm-dev
+
+      - name: Setup Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: ${{ matrix.python-version }}
+          cache: "pip"
+
+      - name: Install CPU-only torch (Linux)
+        if: matrix.provider == 'pytorch-cpu' && matrix.platform == 'ubuntu-22.04'
+        run: |
+          python -m pip install --upgrade pip
+          pip install pyinstaller
+          pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cpu
+          pip install -r providers/pytorch-cpu/requirements.txt
+          pip install -r backend/requirements.txt
+
+      - name: Install Python dependencies (CPU - non-Linux)
+        if: matrix.provider == 'pytorch-cpu' && matrix.platform != 'ubuntu-22.04'
+        run: |
+          python -m pip install --upgrade pip
+          pip install pyinstaller
+          pip install -r providers/pytorch-cpu/requirements.txt
+          pip install -r backend/requirements.txt
+
+      - name: Install Python dependencies (CUDA)
+        if: matrix.provider == 'pytorch-cuda'
+        run: |
+          python -m pip install --upgrade pip
+          pip install pyinstaller
+          pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121
+          pip install -r providers/pytorch-cuda/requirements.txt
+          pip install -r backend/requirements.txt
+
+      - name: Build provider binary
+        shell: bash
+        run: |
+          cd providers/${{ matrix.provider }}
+          python build.py
+
+      - name: Package provider for distribution
+        shell: bash
+        run: |
+          cd providers/${{ matrix.provider }}/dist
+
+          # Add platform suffix for archive name
+          if [ "${{ matrix.platform }}" == "windows-latest" ]; then
+            ARCHIVE_NAME="tts-provider-${{ matrix.provider }}-windows.zip"
+            # On Windows, zip the directory
+            powershell Compress-Archive -Path "tts-provider-${{ matrix.provider }}/*" -DestinationPath "$ARCHIVE_NAME"
+          elif [ "${{ matrix.platform }}" == "macos-latest" ]; then
+            ARCHIVE_NAME="tts-provider-${{ matrix.provider }}-macos-arm64.tar.gz"
+            tar -czf "$ARCHIVE_NAME" tts-provider-${{ matrix.provider }}/
+          elif [ "${{ matrix.platform }}" == "macos-15-intel" ]; then
+            ARCHIVE_NAME="tts-provider-${{ matrix.provider }}-macos-x64.tar.gz"
+            tar -czf "$ARCHIVE_NAME" tts-provider-${{ matrix.provider }}/
+          else
+            ARCHIVE_NAME="tts-provider-${{ matrix.provider }}-linux.tar.gz"
+            tar -czf "$ARCHIVE_NAME" tts-provider-${{ matrix.provider }}/
+          fi
+
+          echo "Created archive: $ARCHIVE_NAME"
+          ls -lh "$ARCHIVE_NAME"
+
+      - name: Upload provider to R2
+        shell: bash
+        env:
+          R2_ACCESS_KEY_ID: ${{ secrets.R2_ACCESS_KEY_ID }}
+          R2_SECRET_ACCESS_KEY: ${{ secrets.R2_SECRET_ACCESS_KEY }}
+          R2_ENDPOINT: ${{ secrets.R2_ENDPOINT }}
+        run: |
+          # Install AWS CLI (compatible with R2)
+          pip install awscli
+
+          # Configure AWS CLI for R2
+          aws configure set aws_access_key_id $R2_ACCESS_KEY_ID
+          aws configure set aws_secret_access_key $R2_SECRET_ACCESS_KEY
+          aws configure set region auto
+
+          # Determine archive name based on platform
+          if [ "${{ matrix.platform }}" == "windows-latest" ]; then
+            ARCHIVE_NAME="tts-provider-${{ matrix.provider }}-windows.zip"
+          elif [ "${{ matrix.platform }}" == "macos-latest" ]; then
+            ARCHIVE_NAME="tts-provider-${{ matrix.provider }}-macos-arm64.tar.gz"
+          elif [ "${{ matrix.platform }}" == "macos-15-intel" ]; then
+            ARCHIVE_NAME="tts-provider-${{ matrix.provider }}-macos-x64.tar.gz"
+          else
+            ARCHIVE_NAME="tts-provider-${{ matrix.provider }}-linux.tar.gz"
+          fi
+
+          # Upload to R2 (bucket: voicebox)
+          aws s3 cp "providers/${{ matrix.provider }}/dist/$ARCHIVE_NAME" \
+            "s3://voicebox/providers/v${{ env.PROVIDER_VERSION }}/$ARCHIVE_NAME" \
+            --endpoint-url "$R2_ENDPOINT"
+
+          echo "Uploaded $ARCHIVE_NAME to R2"
+
+  # ============================================
+  # Build Main App (TTS bundled on macOS/Windows, not bundled on Linux)
+  # ============================================
   release:
     permissions:
       contents: write
@@ -14,18 +158,22 @@ jobs:
       fail-fast: false
       matrix:
         include:
+          # macOS Apple Silicon - MLX bundled (works out of the box)
           - platform: "macos-latest"
             args: "--target aarch64-apple-darwin"
             python-version: "3.12"
             backend: "mlx"
+          # macOS Intel - PyTorch bundled (smaller user base, keep simple)
           - platform: "macos-15-intel"
             args: "--target x86_64-apple-darwin"
             python-version: "3.12"
             backend: "pytorch"
-          # - platform: 'ubuntu-22.04'
-          #   args: ''
-          #   python-version: '3.12'
-          #   backend: 'pytorch'
+          # Linux - No TTS bundled, providers downloaded separately
+          - platform: "ubuntu-22.04"
+            args: ""
+            python-version: "3.12"
+            backend: "none"
+          # Windows - PyTorch CPU bundled (works out of the box)
           - platform: "windows-latest"
             args: ""
             python-version: "3.12"
@@ -40,7 +188,7 @@ jobs:
         if: matrix.platform == 'ubuntu-22.04'
         run: |
           sudo apt-get update
-          sudo apt-get install -y libwebkit2gtk-4.1-dev libappindicator3-dev librsvg2-dev patchelf llvm-dev
+          sudo apt-get install -y libwebkit2gtk-4.1-dev libappindicator3-dev librsvg2-dev patchelf llvm-dev libasound2-dev
 
       - name: Install LLVM (macOS)
         if: matrix.platform == 'macos-latest' || matrix.platform == 'macos-15-intel'
@@ -55,23 +203,27 @@ jobs:
           python-version: ${{ matrix.python-version }}
           cache: "pip"
 
-      - name: Install Python dependencies
+      - name: Install Python dependencies (with TTS)
+        if: matrix.backend != 'none'
         run: |
           python -m pip install --upgrade pip
           pip install pyinstaller
           pip install -r backend/requirements.txt
 
+      - name: Install Python dependencies (without TTS)
+        if: matrix.backend == 'none'
+        run: |
+          python -m pip install --upgrade pip
+          pip install pyinstaller
+          # Install base requirements without PyTorch/Qwen-TTS
+          pip install fastapi uvicorn sqlalchemy librosa soundfile numpy httpx
+          pip install huggingface_hub  # For Whisper downloads
+
       - name: Install MLX dependencies (Apple Silicon only)
         if: matrix.backend == 'mlx'
         run: |
           pip install -r backend/requirements-mlx.txt
 
-      # - name: Install PyTorch with CUDA (Windows only)
-      #   if: matrix.platform == 'windows-latest'
-      #   run: |
-      #     pip install torch --index-url https://download.pytorch.org/whl/cu121 --force-reinstall --no-deps
-      #     pip install torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121
-
       - name: Build Python server (Linux/macOS)
         if: matrix.platform != 'windows-latest'
         run: |
@@ -148,13 +300,84 @@ jobs:
             See the assets below to download and install this version.
 
             ### Installation
-            - **macOS (Apple Silicon)**: Download the `aarch64.dmg` file - uses MLX for fast native inference
+            - **macOS (Apple Silicon)**: Download the `aarch64.dmg` file - uses MLX for fast native inference (works out of the box)
             - **macOS (Intel)**: Download the `x64.dmg` file - uses PyTorch
-            - **Windows**: Download the `.msi` installer
-            - **Linux**: Download the `.AppImage` or `.deb` package
+            - **Windows**: Download the `.msi` installer - PyTorch CPU bundled (works out of the box)
+            - **Linux**: Download the `.AppImage` or `.deb` package - requires downloading a TTS provider on first use
+
+            ### TTS Providers
+            Linux users will be prompted to download a TTS provider on first launch; Windows users can optionally download the CUDA provider:
+            - **Windows**: PyTorch CPU is bundled; PyTorch CUDA (~2.4GB for NVIDIA GPUs) is an optional download
+            - **Linux**: PyTorch CPU (~300MB) or PyTorch CUDA (~2.4GB for NVIDIA GPUs)
 
             The app includes automatic updates - future updates will be installed automatically.
           releaseDraft: true
           prerelease: false
           args: ${{ matrix.args }}
           includeUpdaterJson: true
+
+  # ============================================
+  # Build and Push Docker Images
+  # ============================================
+  docker:
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+      packages: write
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Set up Docker Buildx
+        uses: docker/setup-buildx-action@v3
+
+      - name: Login to GitHub Container Registry
+        uses: docker/login-action@v3
+        with:
+          registry: ghcr.io
+          username: ${{ github.actor }}
+          password: ${{ secrets.GITHUB_TOKEN }}
+
+      - name: Setup Bun
+        uses: oven-sh/setup-bun@v2
+
+      - name: Install dependencies and build web UI
+        run: |
+          bun install
+          cd web
+          bun run build
+
+      - name: Extract version from tag
+        id: version
+        run: |
+          if [[ $GITHUB_REF == refs/tags/v* ]]; then
+            VERSION=${GITHUB_REF#refs/tags/v}
+          else
+            VERSION="dev"
+          fi
+          echo "version=$VERSION" >> $GITHUB_OUTPUT
+
+      - name: Build and push CPU image
+        uses: docker/build-push-action@v5
+        with:
+          context: .
+          file: ./Dockerfile
+          platforms: linux/amd64,linux/arm64
+          push: true
+          tags: |
+            ghcr.io/jamiepine/voicebox:latest
+            ghcr.io/jamiepine/voicebox:${{ steps.version.outputs.version }}
+          cache-from: type=gha
+          cache-to: type=gha,mode=max
+
+      - name: Build and push CUDA image
+        uses: docker/build-push-action@v5
+        with:
+          context: .
+          file: ./Dockerfile.cuda
+          platforms: linux/amd64
+          push: true
+          tags: |
+            ghcr.io/jamiepine/voicebox:latest-cuda
+            ghcr.io/jamiepine/voicebox:${{ steps.version.outputs.version }}-cuda
+          cache-from: type=gha
+          cache-to: type=gha,mode=max
diff --git a/.gitignore b/.gitignore
index 05f7ef0d..4fef6ea4 100644
--- a/.gitignore
+++ b/.gitignore
@@ -15,6 +15,7 @@ dist/
 build/
 *.egg-info/
 *.egg
+*.spec
 target/
 *.app
 *.dmg
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 765da827..45d898e7 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -14,16 +14,19 @@ Thank you for your interest in contributing to Voicebox! This document provides
 ### Prerequisites
 
 - **[Bun](https://bun.sh)** - Fast JavaScript runtime and package manager
+
   ```bash
   curl -fsSL https://bun.sh/install | bash
   ```
 
 - **[Python 3.11+](https://python.org)** - For backend development
+
   ```bash
   python --version  # Should be 3.11 or higher
   ```
 
 - **[Rust](https://rustup.rs)** - For Tauri desktop app (installed automatically by Tauri CLI)
+
   ```bash
   rustc --version  # Check if installed
   ```
@@ -37,41 +40,46 @@ Thank you for your interest in contributing to Voicebox! This document provides
 **Manual setup (required for Windows):**
 
 1. **Fork and clone the repository**
+
    ```bash
    git clone https://github.com/YOUR_USERNAME/voicebox.git
    cd voicebox
    ```
 
 2. **Install JavaScript dependencies**
+
    ```bash
    bun install
    ```
+
    This installs dependencies for:
+
    - `app/` - Shared React frontend
    - `tauri/` - Tauri desktop wrapper
    - `web/` - Web deployment wrapper
 
 3. **Set up Python backend**
+
    ```bash
    cd backend
-   
+
    # Create virtual environment
    python -m venv venv
-   
+
    # Activate virtual environment
    source venv/bin/activate  # On macOS/Linux
    # or
    venv\Scripts\activate  # On Windows
-   
+
    # Install Python dependencies
    pip install -r requirements.txt
-   
+
    # Install MLX dependencies (Apple Silicon only - for faster inference)
    # On Apple Silicon, this enables native Metal acceleration
    if [[ $(uname -m) == "arm64" ]]; then
      pip install -r requirements-mlx.txt
    fi
-   
+
    # Install Qwen3-TTS (required for voice synthesis)
    pip install git+https://github.com/QwenLM/Qwen3-TTS.git
    ```
@@ -81,19 +89,24 @@ Thank you for your interest in contributing to Voicebox! This document provides
    Development requires two terminals: one for the Python backend, one for the Tauri app.
 
    **Terminal 1: Backend server** (start this first)
+
    ```bash
    cd backend
    source venv/bin/activate  # Activate venv if not already active
    bun run dev:server
    # Or manually: uvicorn main:app --reload --port 17493
    ```
+
    Backend will be available at `http://localhost:17493`
 
    **Terminal 2: Desktop app**
+
    ```bash
    bun run dev
    ```
+
    This will:
+
    - Create a placeholder sidecar binary (for Tauri compilation)
    - Start Vite dev server on port 5173
    - Launch Tauri window pointing to localhost:5173
@@ -104,26 +117,133 @@ Thank you for your interest in contributing to Voicebox! This document provides
    > The bundled server binary is only used in production builds.
 
    **Optional: Web app**
+
    ```bash
    bun run dev:web
    ```
+
    Web app will be available at `http://localhost:5174`
 
 ### Model Downloads
 
 Models are automatically downloaded from HuggingFace Hub on first use:
+
 - **Whisper** (transcription): Auto-downloads on first transcription
 - **Qwen3-TTS** (voice cloning): Auto-downloads on first generation (~2-4GB)
 
 First-time usage will be slower due to model downloads, but subsequent runs will use cached models.
 
+### TTS Provider Development
+
+Voicebox uses a modular provider system to support different inference backends. Understanding this architecture is important when working on TTS features.
+
+#### Provider Types
+
+**Bundled Providers** — Included with the app binary:
+
+- `apple-mlx` — Bundled with macOS Apple Silicon builds (`.dmg` for aarch64)
+  - Uses MLX for native Metal acceleration
+  - Configured in `.github/workflows/release.yml` with `backend: "mlx"`
+
+**Hybrid Provider:**
+
+- `pytorch-cpu` — Can be bundled OR downloaded depending on platform
+  - **Bundled** with Windows and macOS Intel builds
+    - macOS Intel: `.dmg` for x64 with `backend: "pytorch"`
+    - Windows: `.exe` installer with PyTorch CPU included
+  - **Downloaded** on first use for Linux builds (~300MB)
+  - Falls back to bundled version if external binary not found
+
+**External-Only Providers:**
+
+- `pytorch-cuda` — NVIDIA GPU-accelerated provider (~2.4GB)
+  - Windows/Linux only (no NVIDIA GPUs on macOS)
+  - Downloaded on demand, not bundled
+  - Optional for users with CUDA-capable GPUs
+
+#### Provider Architecture
+
+```
+backend/providers/
+├── __init__.py         # ProviderManager - lifecycle management
+├── base.py             # TTSProvider protocol
+├── bundled.py          # BundledProvider - wraps built-in backends
+├── local.py            # LocalProvider - wraps external subprocess
+├── installer.py        # Download and install external providers
+└── types.py            # Provider type definitions
+
+providers/
+├── pytorch-cpu/        # External PyTorch CPU provider
+│   ├── main.py         # FastAPI server
+│   ├── build.py        # PyInstaller build script
+│   └── build_and_install.py  # Build and install locally
+└── pytorch-cuda/       # External PyTorch CUDA provider
+    ├── main.py
+    ├── build.py
+    └── build_and_install.py
+```
+
+**How it works:**
+
+1. **Bundled providers** run in-process within the main backend
+2. **External providers** run as separate subprocess servers
+3. **LocalProvider** communicates with external providers via HTTP
+4. **ProviderManager** handles starting/stopping and health checks
+
+#### Building Providers Locally
+
+When developing provider features, you'll need to build and test external providers:
+
+**Build a single provider:**
+
+```bash
+cd providers/pytorch-cpu
+python build_and_install.py
+```
+
+**Build all providers:**
+
+```bash
+bun run build:providers
+```
+
+This script:
+
+- Builds the provider binary with PyInstaller
+- Detects your platform (Windows/macOS/Linux)
+- Copies to the correct location:
+  - macOS: `~/Library/Application Support/voicebox/providers/`
+  - Windows: `%APPDATA%\voicebox\providers\`
+  - Linux: `~/.local/share/voicebox/providers/`
+- Sets executable permissions on Unix
+
+**Testing provider changes:**
+
+1. Make changes to `providers/pytorch-cpu/main.py`
+2. Run `bun run build:providers`
+3. Restart the Voicebox app
+4. Select the provider in Settings → TTS Provider
+
+#### Provider Binary Distribution
+
+For production releases, provider binaries are:
+
+1. Built by GitHub Actions for all platforms
+2. Uploaded to Cloudflare R2 at `downloads.voicebox.sh/providers/v{VERSION}/`
+3. Downloaded on-demand by users based on their platform and GPU
+
+See `.github/workflows/release.yml` for the build matrix.
+
 ### Building
 
 **Build everything (recommended):**
+
 ```bash
 bun run build
 ```
+
 This automatically:
+
 1. Builds the Python server binary (`./scripts/build-server.sh`)
 2. Builds the Tauri desktop app (`cd tauri && bun run tauri build`)
 
@@ -132,13 +252,23 @@ Creates platform-specific installers (`.dmg`, `.msi`, `.AppImage`) in `tauri/src
 **Note:** The build process detects your platform and includes the appropriate backend (MLX for Apple Silicon, PyTorch for others).
 
 **Build server binary only:**
+
 ```bash
 bun run build:server
 # or
 ./scripts/build-server.sh
 ```
+
 Creates platform-specific binary in `tauri/src-tauri/binaries/`
 
+**Build provider binaries (for development):**
+
+```bash
+bun run build:providers
+```
+
+Builds all external provider binaries and installs them to the system provider directory. See [TTS Provider Development](#tts-provider-development) for details.
+
 **Building with local Qwen3-TTS development version:**
 
 If you're actively developing or modifying the Qwen3-TTS library, set the `QWEN_TTS_PATH` environment variable to point to your local clone:
@@ -151,34 +281,41 @@ bun run build:server
 This makes PyInstaller use your local qwen-tts version instead of the pip-installed package. Useful when testing changes to the TTS library before they're published to PyPI or when using an editable install (`pip install -e`).
 
 **Build web app:**
+
 ```bash
 cd web
 bun run build
 ```
+
 Output in `web/dist/`
 
 ### Generate OpenAPI Client
 
 After starting the backend server:
+
 ```bash
 ./scripts/generate-api.sh
 ```
+
 This downloads the OpenAPI schema and generates the TypeScript client in `app/src/lib/api/`
 
 ### Convert Assets to Web Formats
 
 To optimize images and videos for the web, run:
+
 ```bash
 bun run convert:assets
 ```
 
 This script:
+
 - Converts PNG → WebP (better compression, same quality)
 - Converts MOV → WebM (VP9 codec, smaller file size)
 - Processes files in `landing/public/` and `docs/public/`
 - **Deletes original files** after successful conversion
 
 **Requirements:** Install `webp` and `ffmpeg`:
+
 ```bash
 brew install webp ffmpeg
 ```
@@ -225,6 +362,7 @@ git push origin feature/your-feature-name
 ```
 
 Then create a pull request on GitHub with:
+
 - Clear description of changes
 - Screenshots (for UI changes)
 - Reference to related issues
@@ -370,21 +508,23 @@ Currently, testing is primarily manual. When adding tests:
 Releases are managed by maintainers:
 
 1. **Bump version using bumpversion:**
+
    ```bash
    # Install bumpversion (if not already installed)
    pip install bumpversion
-   
+
    # Bump patch version (0.1.0 -> 0.1.1)
    bumpversion patch
-   
+
    # Or bump minor version (0.1.0 -> 0.2.0)
    bumpversion minor
-   
+
    # Or bump major version (0.1.0 -> 1.0.0)
    bumpversion major
    ```
-   
+
    This automatically:
+
    - Updates version numbers in all files (`tauri.conf.json`, `Cargo.toml`, all `package.json` files, `backend/main.py`)
    - Creates a git commit with the version bump
    - Creates a git tag (e.g., `v0.1.1`, `v0.2.0`)
@@ -392,6 +532,7 @@ Releases are managed by maintainers:
 2. **Update CHANGELOG.md** with release notes
 
 3. **Push commits and tags:**
+
    ```bash
    git push
    git push --tags
diff --git a/Dockerfile b/Dockerfile
new file mode 100644
index 00000000..ca243bc5
--- /dev/null
+++ b/Dockerfile
@@ -0,0 +1,43 @@
+# Base Dockerfile for Voicebox (CPU-only)
+# For GPU support, use Dockerfile.cuda
+
+FROM python:3.12-slim
+
+# Prevent interactive prompts during build
+ENV DEBIAN_FRONTEND=noninteractive
+ENV TZ=UTC
+
+WORKDIR /app
+
+# Install system dependencies
+RUN apt-get update && apt-get install -y \
+    ffmpeg \
+    curl \
+    tzdata \
+    && rm -rf /var/lib/apt/lists/*
+
+# Copy backend
+COPY backend/ /app/backend/
+COPY providers/ /app/providers/
+
+# Copy pre-built web UI
+COPY web/dist/ /app/web/dist/
+
+# Install Python dependencies (PyTorch is meant to come from the provider system; NOTE(review): accelerate depends on torch, so pip may still install it - confirm)
+RUN python -m pip install --upgrade pip && \
+    pip install --no-cache-dir \
+    fastapi uvicorn[standard] pydantic sqlalchemy alembic \
+    librosa soundfile numpy python-multipart Pillow \
+    huggingface_hub transformers accelerate
+
+# Create data directory for profiles/generations
+RUN mkdir -p /app/data
+
+# Health check
+HEALTHCHECK --interval=30s --timeout=10s --retries=3 --start-period=40s \
+  CMD curl -f http://localhost:8000/health || exit 1
+
+EXPOSE 8000
+
+# Run server with web UI
+CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000"]
diff --git a/Dockerfile.cuda b/Dockerfile.cuda
new file mode 100644
index 00000000..b7d7ca96
--- /dev/null
+++ b/Dockerfile.cuda
@@ -0,0 +1,58 @@
+# Dockerfile for Voicebox with NVIDIA GPU support (CUDA)
+
+FROM nvidia/cuda:12.1.1-runtime-ubuntu22.04
+
+# Prevent interactive prompts during build
+ENV DEBIAN_FRONTEND=noninteractive
+ENV TZ=UTC
+
+WORKDIR /app
+
+# Install Python 3.12
+RUN apt-get update && apt-get install -y \
+    software-properties-common \
+    && add-apt-repository ppa:deadsnakes/ppa \
+    && apt-get update && apt-get install -y \
+    python3.12 \
+    python3.12-dev \
+    python3.12-venv \
+    ffmpeg \
+    curl \
+    tzdata \
+    && rm -rf /var/lib/apt/lists/*
+
+# Set Python 3.12 as default and bootstrap pip
+RUN update-alternatives --install /usr/bin/python3 python3 /usr/bin/python3.12 1 && \
+    update-alternatives --install /usr/bin/python python /usr/bin/python3.12 1 && \
+    python3.12 -m ensurepip --upgrade && \
+    python3.12 -m pip install --upgrade pip
+
+# Copy backend
+COPY backend/ /app/backend/
+COPY providers/ /app/providers/
+
+# Copy pre-built web UI
+COPY web/dist/ /app/web/dist/
+
+# Install PyTorch with CUDA support first
+RUN pip install --no-cache-dir \
+    torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121
+
+# Install remaining dependencies
+RUN pip install --no-cache-dir \
+    fastapi uvicorn[standard] pydantic sqlalchemy alembic \
+    transformers accelerate huggingface_hub \
+    librosa soundfile numpy python-multipart Pillow \
+    qwen-tts
+
+# Create data directory
+RUN mkdir -p /app/data
+
+# Health check
+HEALTHCHECK --interval=30s --timeout=10s --retries=3 --start-period=40s \
+  CMD curl -f http://localhost:8000/health || exit 1
+
+EXPOSE 8000
+
+# Run server with web UI
+CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000"]
diff --git a/README.md b/README.md
index 575918cf..9d0d39dd 100644
--- a/README.md
+++ b/README.md
@@ -76,16 +76,39 @@ Download a voice model, clone any voice from a few seconds of audio, and compose
 
 ## Download
 
-Voicebox is available now for macOS and Windows.
+### Desktop App
 
-| Platform | Download |
-|----------|----------|
-| macOS (Apple Silicon) | [voicebox_aarch64.app.tar.gz](https://github.com/jamiepine/voicebox/releases/download/v0.1.0/voicebox_aarch64.app.tar.gz) |
-| macOS (Intel) | [voicebox_x64.app.tar.gz](https://github.com/jamiepine/voicebox/releases/download/v0.1.0/voicebox_x64.app.tar.gz) |
-| Windows (MSI) | [voicebox_0.1.0_x64_en-US.msi](https://github.com/jamiepine/voicebox/releases/download/v0.1.0/voicebox_0.1.0_x64_en-US.msi) |
-| Windows (Setup) | [voicebox_0.1.0_x64-setup.exe](https://github.com/jamiepine/voicebox/releases/download/v0.1.0/voicebox_0.1.0_x64-setup.exe) |
+| Platform              | Download                                                                                                                    |
+| --------------------- | --------------------------------------------------------------------------------------------------------------------------- |
+| macOS (Apple Silicon) | [Download latest release](https://github.com/jamiepine/voicebox/releases/latest)   |
+| macOS (Intel)         | [Download latest release](https://github.com/jamiepine/voicebox/releases/latest)           |
+| Windows (MSI)         | [Download latest release](https://github.com/jamiepine/voicebox/releases/latest) |
+| Windows (Setup)       | [Download latest release](https://github.com/jamiepine/voicebox/releases/latest) |
+| Linux (AppImage)      | [Download latest release](https://github.com/jamiepine/voicebox/releases/latest) |
+| Linux (Deb)           | [Download latest release](https://github.com/jamiepine/voicebox/releases/latest) |
 
-> **Linux builds coming soon** — Currently blocked by GitHub runner disk space limitations.
+### Docker
+
+Run Voicebox with the web UI in Docker - perfect for servers and headless deployments:
+
+```bash
+# CPU-only (supports amd64 and arm64)
+docker run -p 8000:8000 -v voicebox-data:/app/data \
+  ghcr.io/jamiepine/voicebox:latest
+
+# NVIDIA GPU (recommended for performance)
+docker run --gpus all -p 8000:8000 -v voicebox-data:/app/data \
+  ghcr.io/jamiepine/voicebox:latest-cuda
+```
+
+Or use Docker Compose:
+```bash
+docker compose up -d
+```
+
+Open http://localhost:8000 to access the web UI.
+
+See [Docker Deployment Guide](docs/overview/docker.mdx) for cloud deployments, GPU setup, and more.
 
 ---
 
@@ -137,9 +160,10 @@ Create multi-voice narratives, podcasts, and conversations with a timeline-based
 
 ### Flexible Deployment
 
-- **Local mode** — Everything runs on your machine
-- **Remote mode** — Connect to a GPU server on your network
-- **One-click server** — Turn any machine into a Voicebox server
+- **Desktop app** — Native apps for macOS, Windows, and Linux
+- **Docker** — Deploy to servers with the web UI included
+- **Remote mode** — Connect desktop app to a remote GPU server
+- **Cloud ready** — Deploy to AWS, GCP, DigitalOcean, or any cloud provider
 
 ---
 
@@ -176,17 +200,17 @@ Full API documentation available at `http://localhost:8000/docs` when running.
 
 ## Tech Stack
 
-| Layer | Technology |
-|-------|------------|
-| Desktop App | Tauri (Rust) |
-| Frontend | React, TypeScript, Tailwind CSS |
-| State | Zustand, React Query |
-| Backend | FastAPI (Python) |
-| Voice Model | Qwen3-TTS (PyTorch or MLX) |
-| Transcription | Whisper (PyTorch or MLX) |
+| Layer            | Technology                                          |
+| ---------------- | --------------------------------------------------- |
+| Desktop App      | Tauri (Rust)                                        |
+| Frontend         | React, TypeScript, Tailwind CSS                     |
+| State            | Zustand, React Query                                |
+| Backend          | FastAPI (Python)                                    |
+| Voice Model      | Qwen3-TTS (PyTorch or MLX)                          |
+| Transcription    | Whisper (PyTorch or MLX)                            |
 | Inference Engine | MLX (Apple Silicon) / PyTorch (Windows/Linux/Intel) |
-| Database | SQLite |
-| Audio | WaveSurfer.js, librosa |
+| Database         | SQLite                                              |
+| Audio            | WaveSurfer.js, librosa                              |
 
 **Why this stack?**
 
@@ -194,6 +218,26 @@ Full API documentation available at `http://localhost:8000/docs` when running.
 - **FastAPI** — Async Python with automatic OpenAPI schema generation
 - **Type-safe end-to-end** — Generated TypeScript client from OpenAPI spec
 
+### TTS Provider Architecture
+
+Voicebox uses a modular provider system to support different inference backends:
+
+- **`apple-mlx`** — Bundled with macOS Apple Silicon builds
+
+  - Uses MLX with native Metal acceleration (4-5x faster)
+  - Works out of the box, no download required
+
+- **`pytorch-cpu`** — Universal CPU provider (bundled or downloaded)
+
+  - Bundled with Windows and macOS Intel builds
+  - Downloaded on first use for Linux (~300MB)
+
+- **`pytorch-cuda`** — Optional NVIDIA GPU-accelerated provider
+  - Windows/Linux only (~2.4GB)
+  - 4-5x faster inference on CUDA-capable GPUs
+
+macOS and Windows builds work out of the box with bundled providers. Linux users download a provider on first launch. The app automatically detects your hardware and recommends the best option. All downloadable providers are distributed via Cloudflare R2 for fast, global delivery.
+
 ---
 
 ## Roadmap
@@ -202,13 +246,13 @@ Voicebox is the beginning of something bigger. Here's what's coming:
 
 ### Coming Soon
 
-| Feature | Description |
-|---------|-------------|
-| **Real-time Synthesis** | Stream audio as it generates, word by word |
-| **Conversation Mode** | Multi-speaker dialogues with automatic turn-taking |
-| **Voice Effects** | Pitch shift, reverb, M3GAN-style effects |
-| **Timeline Editor** | Audio studio with word-level precision editing |
-| **More Models** | XTTS, Bark, and other open-source voice models |
+| Feature                 | Description                                        |
+| ----------------------- | -------------------------------------------------- |
+| **Real-time Synthesis** | Stream audio as it generates, word by word         |
+| **Conversation Mode**   | Multi-speaker dialogues with automatic turn-taking |
+| **Voice Effects**       | Pitch shift, reverb, M3GAN-style effects           |
+| **Timeline Editor**     | Audio studio with word-level precision editing     |
+| **More Models**         | XTTS, Bark, and other open-source voice models     |
 
 ### Future Vision
 
@@ -260,9 +304,10 @@ cd backend && pip install -r requirements.txt && cd ..
 bun run dev
 ```
 
-**Prerequisites:** [Bun](https://bun.sh), [Rust](https://rustup.rs), [Python 3.11+](https://python.org). 
+**Prerequisites:** [Bun](https://bun.sh), [Rust](https://rustup.rs), [Python 3.11+](https://python.org).
+
+**Performance:**
 
-**Performance:** 
 - **Apple Silicon (M1/M2/M3)**: Uses MLX backend with native Metal acceleration for 4-5x faster inference
 - **Windows/Linux/Intel Mac**: Uses PyTorch backend (CUDA GPU recommended, CPU supported but slower)
 
diff --git a/app/package.json b/app/package.json
index 905dea23..b9ef942a 100644
--- a/app/package.json
+++ b/app/package.json
@@ -1,6 +1,6 @@
 {
   "name": "@voicebox/app",
-  "version": "0.1.12",
+  "version": "0.1.13",
   "private": true,
   "type": "module",
   "scripts": {
@@ -17,6 +17,10 @@
     "@dnd-kit/sortable": "^10.0.0",
     "@dnd-kit/utilities": "^3.2.2",
     "@hookform/resolvers": "^3.9.0",
+    "@hugeicons/core-free-icons": "^3.1.1",
+    "@hugeicons/react": "^1.1.4",
+    "@iconify-json/svg-spinners": "^1.2.4",
+    "@iconify/react": "^6.0.2",
     "@radix-ui/react-alert-dialog": "^1.1.1",
     "@radix-ui/react-avatar": "^1.1.0",
     "@radix-ui/react-dialog": "^1.1.1",
@@ -24,6 +28,7 @@
     "@radix-ui/react-label": "^2.1.0",
     "@radix-ui/react-popover": "^1.1.1",
     "@radix-ui/react-progress": "^1.1.0",
+    "@radix-ui/react-radio-group": "^1.2.0",
     "@radix-ui/react-scroll-area": "^1.1.0",
     "@radix-ui/react-select": "^2.1.1",
     "@radix-ui/react-separator": "^1.1.0",
@@ -43,7 +48,6 @@
     "clsx": "^2.1.1",
     "date-fns": "^3.6.0",
     "framer-motion": "^12.29.0",
-    "lucide-react": "^0.454.0",
     "motion": "^12.29.0",
     "react": "^18.3.0",
     "react-dom": "^18.3.0",
diff --git a/app/src/App.tsx b/app/src/App.tsx
index fbe29118..e54bc9dd 100644
--- a/app/src/App.tsx
+++ b/app/src/App.tsx
@@ -40,7 +40,7 @@ function App() {
   const serverStartingRef = useRef(false);
 
   // Automatically check for app updates on startup and show toast notifications
-  useAutoUpdater({ checkOnMount: true, showToast: true });
+  useAutoUpdater(true);
 
   // Sync stored setting to Rust on startup
   useEffect(() => {
@@ -82,8 +82,7 @@ function App() {
       console.log('Dev mode: Skipping auto-start of server (run it separately)');
       setServerReady(true); // Mark as ready so UI doesn't show loading screen
       // Mark that server was not started by app (so we don't try to stop it on close)
-      // @ts-expect-error - adding property to window
-      window.__voiceboxServerStartedByApp = false;
+      (window as any).__voiceboxServerStartedByApp = false;
       return;
     }
 
@@ -103,14 +102,12 @@ function App() {
         useServerStore.getState().setServerUrl(serverUrl);
         setServerReady(true);
         // Mark that we started the server (so we know to stop it on close)
-        // @ts-expect-error - adding property to window
-        window.__voiceboxServerStartedByApp = true;
+        (window as any).__voiceboxServerStartedByApp = true;
       })
       .catch((error) => {
         console.error('Failed to auto-start server:', error);
         serverStartingRef.current = false;
-        // @ts-expect-error - adding property to window
-        window.__voiceboxServerStartedByApp = false;
+        (window as any).__voiceboxServerStartedByApp = false;
       });
 
     // Cleanup: stop server on actual unmount (not StrictMode remount)
diff --git a/app/src/components/AudioPlayer/AudioPlayer.tsx b/app/src/components/AudioPlayer/AudioPlayer.tsx
index 48dd9e78..6656c9d3 100644
--- a/app/src/components/AudioPlayer/AudioPlayer.tsx
+++ b/app/src/components/AudioPlayer/AudioPlayer.tsx
@@ -1,5 +1,6 @@
 import { useQuery } from '@tanstack/react-query';
-import { Pause, Play, Repeat, Volume2, VolumeX, X } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { PauseIcon, PlayIcon, RepeatIcon, VolumeHighIcon, VolumeMuteIcon, Cancel01Icon } from '@hugeicons/core-free-icons';
 import { useEffect, useMemo, useRef, useState } from 'react';
 import WaveSurfer from 'wavesurfer.js';
 import { Button } from '@/components/ui/button';
@@ -459,7 +460,7 @@ export function AudioPlayer() {
     // Use double requestAnimationFrame to ensure DOM is fully rendered
     let rafId1: number;
     let rafId2: number;
-    let timeoutId: number | null = null;
+    let timeoutId: ReturnType<typeof setTimeout> | null = null;
 
     rafId1 = requestAnimationFrame(() => {
       rafId2 = requestAnimationFrame(() => {
@@ -832,7 +833,7 @@ export function AudioPlayer() {
             className="shrink-0"
             title={duration === 0 && !isLoading ? 'Audio not loaded' : ''}
           >
-            {isPlaying ? <Pause className="h-5 w-5" /> : <Play className="h-5 w-5" />}
+            {isPlaying ? <HugeiconsIcon icon={PauseIcon} size={20} className="h-5 w-5" /> : <HugeiconsIcon icon={PlayIcon} size={20} className="h-5 w-5" />}
           </Button>
 
           {/* Waveform */}
@@ -873,7 +874,7 @@ export function AudioPlayer() {
             className={isLooping ? 'text-primary' : ''}
             title="Toggle loop"
           >
-            <Repeat className="h-4 w-4" />
+            <HugeiconsIcon icon={RepeatIcon} size={16} className="h-4 w-4" />
           </Button>
 
           {/* Volume Control */}
@@ -884,7 +885,7 @@ export function AudioPlayer() {
               onClick={() => setVolume(volume > 0 ? 0 : 1)}
               className="h-8 w-8"
             >
-              {volume > 0 ? <Volume2 className="h-4 w-4" /> : <VolumeX className="h-4 w-4" />}
+              {volume > 0 ? <HugeiconsIcon icon={VolumeHighIcon} size={16} className="h-4 w-4" /> : <HugeiconsIcon icon={VolumeMuteIcon} size={16} className="h-4 w-4" />}
             </Button>
             <Slider
               value={[volume * 100]}
@@ -903,7 +904,7 @@ export function AudioPlayer() {
             className="shrink-0"
             title="Close player"
           >
-            <X className="h-5 w-5" />
+            <HugeiconsIcon icon={Cancel01Icon} size={20} className="h-5 w-5" />
           </Button>
         </div>
       </div>
diff --git a/app/src/components/AudioTab/AudioTab.tsx b/app/src/components/AudioTab/AudioTab.tsx
index f76e99d7..150e7660 100644
--- a/app/src/components/AudioTab/AudioTab.tsx
+++ b/app/src/components/AudioTab/AudioTab.tsx
@@ -1,5 +1,6 @@
 import { useMutation, useQuery, useQueryClient } from '@tanstack/react-query';
-import { Check, CheckCircle2, Edit, Plus, Speaker, Trash2 } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { CheckmarkCircle01Icon, CheckmarkCircle02Icon, Edit01Icon, Add01Icon, SpeakerIcon, Delete01Icon } from '@hugeicons/core-free-icons';
 import { useState } from 'react';
 import { Badge } from '@/components/ui/badge';
 import { Button } from '@/components/ui/button';
@@ -135,7 +136,7 @@ export function AudioTab() {
       <div className="flex items-center justify-between mb-6 shrink-0">
         <h2 className="text-2xl font-bold">Audio Channels</h2>
         <Button onClick={() => setCreateDialogOpen(true)}>
-          <Plus className="h-4 w-4 mr-2" />
+          <HugeiconsIcon icon={Add01Icon} size={16} className="h-4 w-4 mr-2" />
           New Channel
         </Button>
       </div>
@@ -150,13 +151,13 @@ export function AudioTab() {
         >
           {allChannels.length === 0 ? (
             <div className="flex flex-col items-center justify-center py-12 border-2 border-dashed border-muted rounded-md">
-              <Speaker className="h-12 w-12 text-muted-foreground mb-4" />
+              <HugeiconsIcon icon={SpeakerIcon} size={48} className="h-12 w-12 text-muted-foreground mb-4" />
               <p className="text-muted-foreground mb-4">
                 No audio channels yet. Create your first channel to route voices to specific
                 devices.
               </p>
               <Button onClick={() => setCreateDialogOpen(true)}>
-                <Plus className="h-4 w-4 mr-2" />
+                <HugeiconsIcon icon={Add01Icon} size={16} className="h-4 w-4 mr-2" />
                 Create Channel
               </Button>
             </div>
@@ -178,7 +179,7 @@ export function AudioTab() {
                       <div className="flex-1 min-w-0">
                         <div className="flex items-center gap-2 mb-3">
                           <div className="h-8 w-8 rounded-lg bg-muted flex items-center justify-center shrink-0">
-                            <Speaker className="h-4 w-4 text-muted-foreground" />
+                            <HugeiconsIcon icon={SpeakerIcon} size={16} className="h-4 w-4 text-muted-foreground" />
                           </div>
                           <div className="flex items-center gap-2 min-w-0">
                             <h3 className="font-semibold text-base truncate">{channel.name}</h3>
@@ -235,7 +236,7 @@ export function AudioTab() {
                               setEditingChannel(channel.id);
                             }}
                           >
-                            <Edit className="h-4 w-4" />
+                            <HugeiconsIcon icon={Edit01Icon} size={16} className="h-4 w-4" />
                           </Button>
                           <Button
                             variant="ghost"
@@ -248,7 +249,7 @@ export function AudioTab() {
                               }
                             }}
                           >
-                            <Trash2 className="h-4 w-4" />
+                            <HugeiconsIcon icon={Delete01Icon} size={16} className="h-4 w-4" />
                           </Button>
                         </div>
                       )}
@@ -325,10 +326,10 @@ export function AudioTab() {
                           isConnected ? 'bg-accent border-accent' : 'border-muted-foreground/30',
                         )}
                       >
-                        {isConnected && <Check className="h-3 w-3 text-accent-foreground" />}
+                        {isConnected && <HugeiconsIcon icon={CheckmarkCircle01Icon} size={12} className="h-3 w-3 text-accent-foreground" />}
                       </div>
                     ) : device.is_default ? (
-                      <CheckCircle2 className="h-4 w-4 text-primary shrink-0" />
+                      <HugeiconsIcon icon={CheckmarkCircle02Icon} size={16} className="h-4 w-4 text-primary shrink-0" />
                     ) : null}
                     <span className={cn('truncate flex-1', device.is_default && 'font-medium')}>
                       {device.name}
@@ -339,7 +340,7 @@ export function AudioTab() {
             </div>
           ) : (
             <div className="flex flex-col items-center justify-center py-12 border-2 border-dashed border-muted rounded-md">
-              <CheckCircle2 className="h-12 w-12 text-muted-foreground mb-4" />
+              <HugeiconsIcon icon={CheckmarkCircle02Icon} size={48} className="h-12 w-12 text-muted-foreground mb-4" />
               <p className="text-muted-foreground text-center">
                 {platform.metadata.isTauri ? 'No audio devices found' : 'Audio device selection requires Tauri'}
               </p>
@@ -494,7 +495,7 @@ function CreateChannelDialog({ open, onOpenChange, devices, onCreate }: CreateCh
                           setSelectedDevices(selectedDevices.filter((id) => id !== deviceId))
                         }
                       >
-                        <Trash2 className="h-3 w-3" />
+                        <HugeiconsIcon icon={Delete01Icon} size={12} className="h-3 w-3" />
                       </Button>
                     </div>
                   );
@@ -602,7 +603,7 @@ function EditChannelDialog({
                           setSelectedDevices(selectedDevices.filter((id) => id !== deviceId))
                         }
                       >
-                        <Trash2 className="h-3 w-3" />
+                        <HugeiconsIcon icon={Delete01Icon} size={12} className="h-3 w-3" />
                       </Button>
                     </div>
                   );
@@ -648,7 +649,7 @@ function EditChannelDialog({
                           setSelectedVoices(selectedVoices.filter((id) => id !== profileId))
                         }
                       >
-                        <Trash2 className="h-3 w-3" />
+                        <HugeiconsIcon icon={Delete01Icon} size={12} className="h-3 w-3" />
                       </Button>
                     </div>
                   );
diff --git a/app/src/components/Generation/FloatingGenerateBox.tsx b/app/src/components/Generation/FloatingGenerateBox.tsx
index a8d556a6..d8d493bd 100644
--- a/app/src/components/Generation/FloatingGenerateBox.tsx
+++ b/app/src/components/Generation/FloatingGenerateBox.tsx
@@ -1,6 +1,8 @@
+import { SparklesIcon, TextSquareIcon } from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Icon } from '@iconify/react';
 import { useMatchRoute } from '@tanstack/react-router';
 import { AnimatePresence, motion } from 'framer-motion';
-import { Loader2, SlidersHorizontal, Sparkles } from 'lucide-react';
 import { useEffect, useRef, useState } from 'react';
 import { Button } from '@/components/ui/button';
 import { Form, FormControl, FormField, FormItem, FormMessage } from '@/components/ui/form';
@@ -298,13 +300,13 @@ export function FloatingGenerateBox({
                   <Button
                     type="submit"
                     disabled={isPending || !selectedProfileId}
-                    className="h-10 w-10 rounded-full bg-accent hover:bg-accent/90 hover:scale-105 text-accent-foreground shadow-lg hover:shadow-accent/50 transition-all duration-200"
+                    className="h-10 w-10 rounded-full bg-accent hover:bg-accent/90 hover:scale-105 text-accent-foreground shadow-lg transition-all duration-200"
                     size="icon"
                   >
                     {isPending ? (
-                      <Loader2 className="h-4 w-4 animate-spin" />
+                      <Icon icon="svg-spinners:ring-resize" className="h-4 w-4 animate-spin" />
                     ) : (
-                      <Sparkles className="h-4 w-4" />
+                      <HugeiconsIcon icon={SparklesIcon} size={16} className="h-4 w-4" />
                     )}
                   </Button>
                   <span className="pointer-events-none absolute bottom-full left-1/2 -translate-x-1/2 mb-2 whitespace-nowrap rounded-md bg-popover px-3 py-1.5 text-xs text-popover-foreground border border-border opacity-0 transition-opacity group-hover:opacity-100 z-[9999]">
@@ -337,7 +339,7 @@ export function FloatingGenerateBox({
                               : 'bg-card border border-border hover:bg-background/50',
                           )}
                         >
-                          <SlidersHorizontal className="h-4 w-4" />
+                          <HugeiconsIcon icon={TextSquareIcon} size={16} className="h-4 w-4" />
                         </Button>
                         <span className="pointer-events-none absolute bottom-full left-1/2 -translate-x-1/2 mb-2 whitespace-nowrap rounded-md bg-popover px-3 py-1.5 text-xs text-popover-foreground border border-border opacity-0 transition-opacity group-hover:opacity-100 z-[9999]">
                           Fine tune instructions
diff --git a/app/src/components/Generation/GenerationForm.tsx b/app/src/components/Generation/GenerationForm.tsx
index 31b100f8..d652a1d7 100644
--- a/app/src/components/Generation/GenerationForm.tsx
+++ b/app/src/components/Generation/GenerationForm.tsx
@@ -1,4 +1,6 @@
-import { Loader2, Mic } from 'lucide-react';
+import { Mic01Icon } from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Icon } from '@iconify/react';
 import { Button } from '@/components/ui/button';
 import { Card, CardContent, CardHeader, CardTitle } from '@/components/ui/card';
 import {
@@ -46,7 +48,11 @@ export function GenerationForm() {
               <FormLabel>Voice Profile</FormLabel>
               {selectedProfile ? (
                 <div className="mt-2 p-3 border rounded-md bg-muted/50 flex items-center gap-2">
-                  <Mic className="h-4 w-4 text-muted-foreground" />
+                  <HugeiconsIcon
+                    icon={Mic01Icon}
+                    size={16}
+                    className="h-4 w-4 text-muted-foreground"
+                  />
                   <span className="font-medium">{selectedProfile.name}</span>
                   <span className="text-sm text-muted-foreground">{selectedProfile.language}</span>
                 </div>
@@ -170,14 +176,10 @@ export function GenerationForm() {
               />
             </div>
 
-            <Button
-              type="submit"
-              className="w-full"
-              disabled={isPending || !selectedProfileId}
-            >
+            <Button type="submit" className="w-full" disabled={isPending || !selectedProfileId}>
               {isPending ? (
                 <>
-                  <Loader2 className="mr-2 h-4 w-4 animate-spin" />
+                  <Icon icon="svg-spinners:ring-resize" className="mr-2 h-4 w-4 animate-spin" />
                   Generating...
                 </>
               ) : (
diff --git a/app/src/components/History/HistoryTable.tsx b/app/src/components/History/HistoryTable.tsx
index e572f69e..cc670e57 100644
--- a/app/src/components/History/HistoryTable.tsx
+++ b/app/src/components/History/HistoryTable.tsx
@@ -1,12 +1,13 @@
 import {
-  AudioWaveform,
-  Download,
-  FileArchive,
-  Loader2,
-  MoreHorizontal,
-  Play,
-  Trash2,
-} from 'lucide-react';
+  Archive01Icon,
+  Delete01Icon,
+  Download01Icon,
+  MoreHorizontalIcon,
+  PlayIcon,
+  WaveIcon,
+} from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Icon } from '@iconify/react';
 import { useEffect, useRef, useState } from 'react';
 import { Button } from '@/components/ui/button';
 import {
@@ -54,7 +55,9 @@ export function HistoryTable() {
   const [importDialogOpen, setImportDialogOpen] = useState(false);
   const [selectedFile, setSelectedFile] = useState<File | null>(null);
   const [deleteDialogOpen, setDeleteDialogOpen] = useState(false);
-  const [generationToDelete, setGenerationToDelete] = useState<{ id: string; name: string } | null>(null);
+  const [generationToDelete, setGenerationToDelete] = useState<{ id: string; name: string } | null>(
+    null,
+  );
   const limit = 20;
   const { toast } = useToast();
 
@@ -222,7 +225,10 @@ export function HistoryTable() {
   if (isLoading && page === 0) {
     return (
       <div className="flex items-center justify-center h-full">
-        <Loader2 className="h-8 w-8 animate-spin text-muted-foreground" />
+        <Icon
+          icon="svg-spinners:ring-resize"
+          className="h-8 w-8 animate-spin text-muted-foreground"
+        />
       </div>
     );
   }
@@ -268,7 +274,11 @@ export function HistoryTable() {
                 >
                   {/* Waveform icon */}
                   <div className="flex items-center shrink-0">
-                    <AudioWaveform className="h-5 w-5 text-muted-foreground" />
+                    <HugeiconsIcon
+                      icon={WaveIcon}
+                      size={20}
+                      className="h-5 w-5 text-muted-foreground"
+                    />
                   </div>
 
                   {/* Left side - Meta information */}
@@ -310,36 +320,35 @@ export function HistoryTable() {
                           className="h-8 w-8"
                           aria-label="Actions"
                         >
-                          <MoreHorizontal className="h-4 w-4" />
+                          <HugeiconsIcon icon={MoreHorizontalIcon} size={16} className="h-4 w-4" />
                         </Button>
                       </DropdownMenuTrigger>
                       <DropdownMenuContent align="end">
                         <DropdownMenuItem
                           onClick={() => handlePlay(gen.id, gen.text, gen.profile_id)}
                         >
-                          <Play className="mr-2 h-4 w-4" />
+                          <HugeiconsIcon icon={PlayIcon} size={16} className="mr-2 h-4 w-4" />
                           Play
                         </DropdownMenuItem>
                         <DropdownMenuItem
                           onClick={() => handleDownloadAudio(gen.id, gen.text)}
                           disabled={exportGenerationAudio.isPending}
                         >
-                          <Download className="mr-2 h-4 w-4" />
+                          <HugeiconsIcon icon={Download01Icon} size={16} className="mr-2 h-4 w-4" />
                           Export Audio
                         </DropdownMenuItem>
                         <DropdownMenuItem
                           onClick={() => handleExportPackage(gen.id, gen.text)}
                           disabled={exportGeneration.isPending}
                         >
-                          <FileArchive className="mr-2 h-4 w-4" />
+                          <HugeiconsIcon icon={Archive01Icon} size={16} className="mr-2 h-4 w-4" />
                           Export Package
                         </DropdownMenuItem>
                         <DropdownMenuItem
                           onClick={() => handleDeleteClick(gen.id, gen.profile_name)}
                           disabled={deleteGeneration.isPending}
-                          className="text-destructive focus:text-destructive"
                         >
-                          <Trash2 className="mr-2 h-4 w-4" />
+                          <HugeiconsIcon icon={Delete01Icon} size={16} className="mr-2 h-4 w-4" />
                           Delete
                         </DropdownMenuItem>
                       </DropdownMenuContent>
@@ -352,7 +361,12 @@ export function HistoryTable() {
             {/* Load more trigger element */}
             {hasMore && (
               <div ref={loadMoreRef} className="flex items-center justify-center py-4">
-                {isFetching && <Loader2 className="h-6 w-6 animate-spin text-muted-foreground" />}
+                {isFetching && (
+                  <Icon
+                    icon="svg-spinners:ring-resize"
+                    className="h-6 w-6 animate-spin text-muted-foreground"
+                  />
+                )}
               </div>
             )}
 
@@ -371,7 +385,8 @@ export function HistoryTable() {
           <DialogHeader>
             <DialogTitle>Delete Generation</DialogTitle>
             <DialogDescription>
-              Are you sure you want to delete this generation from "{generationToDelete?.name}"? This action cannot be undone.
+              Are you sure you want to delete this generation from "{generationToDelete?.name}"?
+              This action cannot be undone.
             </DialogDescription>
           </DialogHeader>
           <DialogFooter>
diff --git a/app/src/components/MainEditor/MainEditor.tsx b/app/src/components/MainEditor/MainEditor.tsx
index 9d597b1e..17125893 100644
--- a/app/src/components/MainEditor/MainEditor.tsx
+++ b/app/src/components/MainEditor/MainEditor.tsx
@@ -1,4 +1,5 @@
-import { Sparkles, Upload } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { SparklesIcon, Upload01Icon } from '@hugeicons/core-free-icons';
 import { useRef, useState } from 'react';
 import { FloatingGenerateBox } from '@/components/Generation/FloatingGenerateBox';
 import { HistoryTable } from '@/components/History/HistoryTable';
@@ -89,7 +90,7 @@ export function MainEditor() {
             <h2 className="text-2xl font-bold">Voicebox</h2>
             <div className="flex gap-2">
               <Button variant="outline" onClick={handleImportClick}>
-                <Upload className="mr-2 h-4 w-4" />
+                <HugeiconsIcon icon={Upload01Icon} size={16} className="mr-2 h-4 w-4" />
                 Import Voice
               </Button>
               <input
@@ -100,7 +101,7 @@ export function MainEditor() {
                 className="hidden"
               />
               <Button onClick={() => setDialogOpen(true)}>
-                <Sparkles className="mr-2 h-4 w-4" />
+                <HugeiconsIcon icon={SparklesIcon} size={16} className="mr-2 h-4 w-4" />
                 Create Voice
               </Button>
             </div>
diff --git a/app/src/components/ServerSettings/DataFolders.tsx b/app/src/components/ServerSettings/DataFolders.tsx
new file mode 100644
index 00000000..9338da09
--- /dev/null
+++ b/app/src/components/ServerSettings/DataFolders.tsx
@@ -0,0 +1,137 @@
+import { AlertCircleIcon, Folder01Icon, FolderOpenIcon } from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Button } from '@/components/ui/button';
+import { Card, CardContent, CardDescription, CardHeader, CardTitle } from '@/components/ui/card';
+import { Input } from '@/components/ui/input';
+import { useSystemFolders } from '@/lib/hooks/useSystemFolders';
+import { usePlatform } from '@/platform/PlatformContext';
+
+/** Props for a single row in the data-folders card. */
+interface FolderRowProps {
+  /** Short title shown above the path. */
+  label: string;
+  /** One-line explanation of what the folder holds. */
+  description: string;
+  /** Folder path to display; `undefined` while loading or when unavailable. */
+  path: string | undefined;
+  /** When true, the path field shows a loading placeholder. */
+  isLoading: boolean;
+  /** Whether the "Open" button may be offered at all. */
+  canOpen: boolean;
+  /** Invoked when the "Open" button is clicked. */
+  onOpen: () => void;
+}
+
+/**
+ * Renders one folder entry: label, description, an optional "Open" button,
+ * and a read-only input holding the path so it can be selected and copied.
+ */
+function FolderRow({ label, description, path, isLoading, canOpen, onOpen }: FolderRowProps) {
+  return (
+    <div className="space-y-1.5">
+      <div className="flex items-center justify-between">
+        <div>
+          <div className="text-sm font-medium">{label}</div>
+          <div className="text-xs text-muted-foreground">{description}</div>
+        </div>
+        {/* Only rendered with a non-empty path, so `disabled` need not re-check it. */}
+        {canOpen && path && (
+          <Button
+            variant="outline"
+            size="sm"
+            onClick={onOpen}
+            disabled={isLoading}
+            className="shrink-0"
+          >
+            <HugeiconsIcon icon={FolderOpenIcon} size={16} className="h-4 w-4 mr-2" />
+            Open
+          </Button>
+        )}
+      </div>
+      <Input
+        aria-label={`${label} folder path`}
+        value={isLoading ? 'Loading...' : path || 'Not available'}
+        readOnly
+        className="font-mono text-xs text-muted-foreground select-all cursor-text"
+      />
+    </div>
+  );
+}
+
+/**
+ * Settings card listing the app data, models, and providers folders reported
+ * by `useSystemFolders`. "Open" buttons are offered only when
+ * `platform.metadata.isTauri` is true.
+ */
+export function DataFolders() {
+  const { data: folders, isLoading, error } = useSystemFolders();
+  const platform = usePlatform();
+  const isTauri = platform.metadata.isTauri;
+
+  /** Asks the platform layer to open `path`; logs instead of throwing on failure. */
+  const handleOpenFolder = async (path: string | undefined) => {
+    if (!path) return;
+    try {
+      const success = await platform.filesystem.openFolder(path);
+      if (!success && isTauri) {
+        console.error('Failed to open folder:', path);
+      }
+    } catch (err: unknown) {
+      // The click handler discards this promise, so a rejection would
+      // otherwise surface as an unhandled promise rejection.
+      console.error('Failed to open folder:', path, err);
+    }
+  };
+
+  return (
+    <Card>
+      <CardHeader>
+        <CardTitle className="flex items-center gap-2">
+          <HugeiconsIcon icon={Folder01Icon} size={20} className="h-5 w-5" />
+          Data Folders
+        </CardTitle>
+        <CardDescription>
+          {isTauri
+            ? 'Click "Open" to view folders in your file explorer, or copy the paths below.'
+            : 'These are the server-side folder paths where your data is stored.'}
+        </CardDescription>
+      </CardHeader>
+      <CardContent className="space-y-4">
+        {error ? (
+          <div className="flex items-center gap-2 text-sm text-destructive">
+            {/* Hugeicons glyph is bundled; no network lookup needed to render it. */}
+            <HugeiconsIcon icon={AlertCircleIcon} size={16} className="h-4 w-4" />
+            <span>Failed to load folder paths: {error.message}</span>
+          </div>
+        ) : (
+          <>
+            <FolderRow
+              label="App Data"
+              description="Voices, generations, and app database"
+              path={folders?.data_dir}
+              isLoading={isLoading}
+              canOpen={isTauri}
+              onOpen={() => handleOpenFolder(folders?.data_dir)}
+            />
+            <FolderRow
+              label="Models"
+              description="Downloaded AI models from HuggingFace Hub"
+              path={folders?.models_dir}
+              isLoading={isLoading}
+              canOpen={isTauri}
+              onOpen={() => handleOpenFolder(folders?.models_dir)}
+            />
+            <FolderRow
+              label="Providers"
+              description="External TTS provider binaries (PyTorch CPU/CUDA)"
+              path={folders?.providers_dir}
+              isLoading={isLoading}
+              canOpen={isTauri}
+              onOpen={() => handleOpenFolder(folders?.providers_dir)}
+            />
+          </>
+        )}
+      </CardContent>
+    </Card>
+  );
+}
diff --git a/app/src/components/ServerSettings/ModelManagement.tsx b/app/src/components/ServerSettings/ModelManagement.tsx
index 4a5fd439..b1c7c123 100644
--- a/app/src/components/ServerSettings/ModelManagement.tsx
+++ b/app/src/components/ServerSettings/ModelManagement.tsx
@@ -1,5 +1,7 @@
+import { Delete01Icon, Download01Icon } from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Icon } from '@iconify/react';
 import { useMutation, useQuery, useQueryClient } from '@tanstack/react-query';
-import { Download, Loader2, Trash2 } from 'lucide-react';
 import { useCallback, useState } from 'react';
 import {
   AlertDialog,
@@ -67,11 +69,11 @@ export function ModelManagement() {
 
   const handleDownload = async (modelName: string) => {
     console.log('[Download] Button clicked for:', modelName, 'at', new Date().toISOString());
-    
+
     // Find display name
     const model = modelStatus?.models.find((m) => m.model_name === modelName);
     const displayName = model?.display_name || modelName;
-    
+
     try {
       // IMPORTANT: Call the API FIRST before setting state
       // Setting state enables the SSE EventSource in useModelDownloadToast,
@@ -79,11 +81,11 @@ export function ModelManagement() {
       console.log('[Download] Calling download API for:', modelName);
       const result = await apiClient.triggerModelDownload(modelName);
       console.log('[Download] Download API responded:', result);
-      
+
       // NOW set state to enable SSE tracking (after download has started on backend)
       setDownloadingModel(modelName);
       setDownloadingDisplayName(displayName);
-      
+
       // Download initiated successfully - state will be cleared when SSE reports completion
       // or by the polling interval detecting the model is downloaded
       queryClient.invalidateQueries({ queryKey: ['modelStatus'] });
@@ -117,7 +119,7 @@ export function ModelManagement() {
       // Invalidate AND explicitly refetch to ensure UI updates
       // Using refetchType: 'all' ensures we refetch even if the query is stale
       console.log('[Delete] Invalidating modelStatus query');
-      await queryClient.invalidateQueries({ 
+      await queryClient.invalidateQueries({
         queryKey: ['modelStatus'],
         refetchType: 'all',
       });
@@ -153,7 +155,10 @@ export function ModelManagement() {
       <CardContent className="space-y-4">
         {isLoading ? (
           <div className="flex items-center justify-center py-8">
-            <Loader2 className="h-6 w-6 animate-spin text-muted-foreground" />
+            <Icon
+              icon="svg-spinners:ring-resize"
+              className="h-6 w-6 animate-spin text-muted-foreground"
+            />
           </div>
         ) : modelStatus ? (
           <div className="space-y-4">
@@ -212,7 +217,6 @@ export function ModelManagement() {
                   ))}
               </div>
             </div>
-
           </div>
         ) : null}
       </CardContent>
@@ -246,7 +250,7 @@ export function ModelManagement() {
             >
               {deleteMutation.isPending ? (
                 <>
-                  <Loader2 className="h-4 w-4 mr-2 animate-spin" />
+                  <Icon icon="svg-spinners:ring-resize" className="h-4 w-4 mr-2 animate-spin" />
                   Deleting...
                 </>
               ) : (
@@ -265,20 +269,20 @@ interface ModelItemProps {
     model_name: string;
     display_name: string;
     downloaded: boolean;
-    downloading?: boolean;  // From server - true if download in progress
+    downloading?: boolean; // From server - true if download in progress
     size_mb?: number;
     loaded: boolean;
   };
   onDownload: () => void;
   onDelete: () => void;
-  isDownloading: boolean;  // Local state - true if user just clicked download
+  isDownloading: boolean; // Local state - true if user just clicked download
   formatSize: (sizeMb?: number) => string;
 }
 
 function ModelItem({ model, onDownload, onDelete, isDownloading, formatSize }: ModelItemProps) {
   // Use server's downloading state OR local state (for immediate feedback before server updates)
   const showDownloading = model.downloading || isDownloading;
-  
+
   return (
     <div className="flex items-center justify-between p-3 border rounded-lg">
       <div className="flex-1">
@@ -315,17 +319,17 @@ function ModelItem({ model, onDownload, onDelete, isDownloading, formatSize }: M
               disabled={model.loaded}
               title={model.loaded ? 'Unload model before deleting' : 'Delete model'}
             >
-              <Trash2 className="h-4 w-4" />
+              <HugeiconsIcon icon={Delete01Icon} size={16} className="h-4 w-4" />
             </Button>
           </div>
         ) : showDownloading ? (
           <Button size="sm" variant="outline" disabled>
-            <Loader2 className="h-4 w-4 mr-2 animate-spin" />
+            <Icon icon="svg-spinners:ring-resize" className="h-4 w-4 mr-2 animate-spin" />
             Downloading...
           </Button>
         ) : (
           <Button size="sm" onClick={onDownload} variant="outline">
-            <Download className="h-4 w-4 mr-2" />
+            <HugeiconsIcon icon={Download01Icon} size={16} className="h-4 w-4 mr-2" />
             Download
           </Button>
         )}
diff --git a/app/src/components/ServerSettings/ModelProgress.tsx b/app/src/components/ServerSettings/ModelProgress.tsx
index 76aa99f1..efd35427 100644
--- a/app/src/components/ServerSettings/ModelProgress.tsx
+++ b/app/src/components/ServerSettings/ModelProgress.tsx
@@ -1,4 +1,6 @@
-import { Loader2, XCircle } from 'lucide-react';
+import { CancelCircleIcon } from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Icon } from '@iconify/react';
 import { useEffect, useState } from 'react';
 import { Card, CardContent, CardHeader, CardTitle } from '@/components/ui/card';
 import { Progress } from '@/components/ui/progress';
@@ -12,7 +14,11 @@ interface ModelProgressProps {
   isDownloading?: boolean;
 }
 
-export function ModelProgress({ modelName, displayName, isDownloading = false }: ModelProgressProps) {
+export function ModelProgress({
+  modelName,
+  displayName,
+  isDownloading = false,
+}: ModelProgressProps) {
   const [progress, setProgress] = useState<ModelProgressType | null>(null);
   const serverUrl = useServerStore((state) => state.serverUrl);
 
@@ -74,10 +80,12 @@ export function ModelProgress({ modelName, displayName, isDownloading = false }:
   const getStatusIcon = () => {
     switch (progress.status) {
       case 'error':
-        return <XCircle className="h-4 w-4 text-destructive" />;
+        return (
+          <HugeiconsIcon icon={CancelCircleIcon} size={16} className="h-4 w-4 text-destructive" />
+        );
       case 'downloading':
       case 'extracting':
-        return <Loader2 className="h-4 w-4 animate-spin" />;
+        return <Icon icon="svg-spinners:ring-resize" className="h-4 w-4 animate-spin" />;
       default:
         return null;
     }
diff --git a/app/src/components/ServerSettings/ProviderSettings.tsx b/app/src/components/ServerSettings/ProviderSettings.tsx
new file mode 100644
index 00000000..7cd68270
--- /dev/null
+++ b/app/src/components/ServerSettings/ProviderSettings.tsx
@@ -0,0 +1,400 @@
+import { Delete01Icon, Download01Icon } from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Icon } from '@iconify/react';
+import { useMutation, useQuery, useQueryClient } from '@tanstack/react-query';
+import { useCallback, useState } from 'react';
+import {
+  AlertDialog,
+  AlertDialogAction,
+  AlertDialogCancel,
+  AlertDialogContent,
+  AlertDialogDescription,
+  AlertDialogFooter,
+  AlertDialogHeader,
+  AlertDialogTitle,
+} from '@/components/ui/alert-dialog';
+import { Button } from '@/components/ui/button';
+import { Card, CardContent, CardDescription, CardHeader, CardTitle } from '@/components/ui/card';
+import { Label } from '@/components/ui/label';
+import { RadioGroup, RadioGroupItem } from '@/components/ui/radio-group';
+import { useToast } from '@/components/ui/use-toast';
+import { apiClient } from '@/lib/api/client';
+import { useModelDownloadToast } from '@/lib/hooks/useModelDownloadToast';
+
+/** Case-insensitive substring test against navigator.platform, read fresh on every call. */
+const platformHas = (needle: string) => navigator.platform.toLowerCase().includes(needle);
+const isMacOS = () => platformHas('mac');
+const isWindows = () => platformHas('win');
+/** Display name of the host OS: macOS is tested first, then Windows; anything else is shown as Linux. */
+const getPlatformName = () =>
+  isMacOS() ? 'macOS' : isWindows() ? 'Windows' : 'Linux';
+
+type ProviderType = // ids used as the RadioGroup value; 'auto' and 'bundled-pytorch' have no radio item in this component
+  | 'auto'
+  | 'apple-mlx'
+  | 'bundled-pytorch'
+  | 'pytorch-cpu'
+  | 'pytorch-cuda'
+  | 'remote'
+  | 'openai';
+
+/**
+ * Settings card for choosing, downloading, starting and uninstalling TTS providers.
+ * Polls the installed-provider list and the active provider every 5 seconds; selecting a
+ * radio item starts that provider, and uninstalling is confirmed through an alert dialog.
+ */
+export function ProviderSettings() {
+  const { toast } = useToast();
+  const queryClient = useQueryClient();
+  const [downloadingProvider, setDownloadingProvider] = useState<string | null>(null);
+
+  const { data: providersData, isLoading } = useQuery({
+    queryKey: ['providers'],
+    queryFn: () => apiClient.listProviders(),
+    refetchInterval: 5000,
+  });
+
+  const { data: activeProvider } = useQuery({
+    queryKey: ['activeProvider'],
+    queryFn: () => apiClient.getActiveProvider(),
+    refetchInterval: 5000,
+  });
+
+  // Callbacks for download completion
+  const handleDownloadComplete = useCallback(() => {
+    setDownloadingProvider(null);
+    queryClient.invalidateQueries({ queryKey: ['providers'] });
+  }, [queryClient]);
+
+  const handleDownloadError = useCallback(() => {
+    setDownloadingProvider(null);
+  }, []);
+
+  // Use progress toast hook for the downloading provider
+  useModelDownloadToast({
+    modelName: downloadingProvider || '',
+    displayName: downloadingProvider || '',
+    enabled: !!downloadingProvider,
+    onComplete: handleDownloadComplete,
+    onError: handleDownloadError,
+  });
+
+  const [deleteDialogOpen, setDeleteDialogOpen] = useState(false);
+  const [providerToDelete, setProviderToDelete] = useState<string | null>(null);
+
+  const downloadMutation = useMutation({
+    mutationFn: (providerType: string) => apiClient.downloadProvider(providerType),
+    onSuccess: (_, providerType) => {
+      setDownloadingProvider(providerType);
+      queryClient.invalidateQueries({ queryKey: ['providers'] });
+    },
+    onError: (error: Error) => {
+      toast({
+        title: 'Download failed',
+        description: error.message,
+        variant: 'destructive',
+      });
+    },
+  });
+
+  const startMutation = useMutation({
+    mutationFn: (providerType: string) => apiClient.startProvider(providerType),
+    onSuccess: () => {
+      queryClient.invalidateQueries({ queryKey: ['activeProvider'] });
+      toast({
+        title: 'Provider started',
+        description: 'The provider has been started successfully',
+      });
+    },
+    onError: (error: Error) => {
+      toast({
+        title: 'Failed to start provider',
+        description: error.message,
+        variant: 'destructive',
+      });
+    },
+  });
+
+  const deleteMutation = useMutation({
+    mutationFn: (providerType: string) => apiClient.deleteProvider(providerType),
+    onSuccess: () => {
+      queryClient.invalidateQueries({ queryKey: ['providers'] });
+      toast({
+        title: 'Provider deleted',
+        description: 'The provider has been deleted successfully',
+      });
+    },
+    onError: (error: Error) => {
+      toast({
+        title: 'Failed to delete provider',
+        description: error.message,
+        variant: 'destructive',
+      });
+    },
+  });
+
+  // Busy from the click (request still in flight) until the download callbacks clear the state.
+  const isDownloadBusy = (providerType: string) =>
+    downloadingProvider === providerType ||
+    (downloadMutation.isPending && downloadMutation.variables === providerType);
+
+  const handleDownload = (providerType: string) => {
+    downloadMutation.mutate(providerType);
+  };
+
+  const handleStart = (providerType: string) => {
+    startMutation.mutate(providerType);
+  };
+
+  const handleDelete = (providerType: string) => {
+    setProviderToDelete(providerType);
+    setDeleteDialogOpen(true);
+  };
+
+  const confirmDelete = () => {
+    if (providerToDelete) {
+      deleteMutation.mutate(providerToDelete);
+      setDeleteDialogOpen(false);
+      setProviderToDelete(null);
+    }
+  };
+
+  if (isLoading) {
+    return (
+      <Card>
+        <CardHeader>
+          <CardTitle>TTS Provider</CardTitle>
+          <CardDescription>Choose how Voicebox generates speech</CardDescription>
+        </CardHeader>
+        <CardContent>
+          <div className="flex items-center justify-center py-8">
+            <Icon icon="svg-spinners:ring-resize" className="h-6 w-6 animate-spin" />
+          </div>
+        </CardContent>
+      </Card>
+    );
+  }
+
+  const installedProviders = providersData?.installed || [];
+
+  // Determine current active provider
+  const currentProvider = activeProvider?.provider;
+  // Stays undefined until the active-provider query has returned data.
+  const selectedProvider = currentProvider as ProviderType;
+
+  const isStarting = startMutation.isPending;
+
+  return (
+    <>
+      <Card>
+        <CardHeader>
+          <CardTitle>TTS Provider</CardTitle>
+          <CardDescription>Choose how Voicebox generates speech.</CardDescription>
+        </CardHeader>
+        <CardContent className="relative">
+          {isStarting && (
+            <div className="absolute inset-0 bg-background/80 backdrop-blur-sm flex items-center justify-center z-10 rounded-lg">
+              <div className="flex items-center gap-2 text-muted-foreground">
+                <Icon icon="svg-spinners:ring-resize" className="h-5 w-5" />
+                <span>Starting provider...</span>
+              </div>
+            </div>
+          )}
+          <RadioGroup
+            value={selectedProvider}
+            onValueChange={(value) => handleStart(value)}
+            disabled={isStarting}
+          >
+            {/* PyTorch CUDA */}
+            <div className="flex items-center justify-between py-2">
+              <div className={`flex items-center space-x-3 flex-1 ${isMacOS() || !installedProviders.includes('pytorch-cuda') ? 'opacity-50' : ''}`}>
+                <RadioGroupItem value="pytorch-cuda" id="cuda" disabled={isMacOS() || isStarting || !installedProviders.includes('pytorch-cuda')} />
+                <Label
+                  htmlFor="cuda"
+                  className={`flex-1 ${isMacOS() || isStarting || !installedProviders.includes('pytorch-cuda') ? 'cursor-not-allowed' : 'cursor-pointer'}`}
+                >
+                  <div className="font-medium">PyTorch CUDA</div>
+                  <div className="text-sm text-muted-foreground">
+                    NVIDIA GPU-accelerated provider
+                  </div>
+                </Label>
+              </div>
+              <div className="flex items-center gap-2">
+                {isMacOS() && (
+                  <>
+                    <span className="text-xs text-muted-foreground">2.4GB</span>
+                    <Button size="sm" variant="secondary" disabled>
+                      Not Available on macOS
+                    </Button>
+                  </>
+                )}
+                {!isMacOS() && !installedProviders.includes('pytorch-cuda') && (
+                  <>
+                    <span className="text-xs text-muted-foreground">2.4GB</span>
+                    <Button
+                      onClick={() => handleDownload('pytorch-cuda')}
+                      size="sm"
+                      variant="outline"
+                      disabled={isDownloadBusy('pytorch-cuda') || isStarting}
+                      className="shrink-0"
+                    >
+                      {isDownloadBusy('pytorch-cuda') ? (
+                        <Icon icon="svg-spinners:ring-resize" className="h-4 w-4 animate-spin" />
+                      ) : (
+                        <>
+                          <HugeiconsIcon icon={Download01Icon} size={16} className="h-4 w-4 mr-2" />
+                          Download
+                        </>
+                      )}
+                    </Button>
+                  </>
+                )}
+                {installedProviders.includes('pytorch-cuda') && (
+                  <Button
+                    onClick={() => handleDelete('pytorch-cuda')}
+                    size="sm"
+                    variant="outline"
+                    disabled={isStarting}
+                    className="shrink-0"
+                  >
+                    <HugeiconsIcon icon={Delete01Icon} size={16} className="h-4 w-4 mr-2" />
+                    Uninstall
+                  </Button>
+                )}
+              </div>
+            </div>
+
+            {/* PyTorch CPU */}
+            <div className="flex items-center justify-between py-2">
+              <div className={`flex items-center space-x-3 flex-1 ${!installedProviders.includes('pytorch-cpu') ? 'opacity-50' : ''}`}>
+                <RadioGroupItem value="pytorch-cpu" id="cpu" disabled={isStarting || !installedProviders.includes('pytorch-cpu')} />
+                <Label
+                  htmlFor="cpu"
+                  className={`flex-1 ${isStarting || !installedProviders.includes('pytorch-cpu') ? 'cursor-not-allowed' : 'cursor-pointer'}`}
+                >
+                  <div className="font-medium">PyTorch CPU</div>
+                  <div className="text-sm text-muted-foreground">
+                    Works on any system, slower inference
+                  </div>
+                </Label>
+              </div>
+              <div className="flex items-center gap-2">
+                {!installedProviders.includes('pytorch-cpu') && (
+                  <>
+                    <span className="text-xs text-muted-foreground">242MB</span>
+                    <Button
+                      onClick={() => handleDownload('pytorch-cpu')}
+                      size="sm"
+                      variant="outline"
+                      disabled={isDownloadBusy('pytorch-cpu') || isStarting}
+                      className="shrink-0"
+                    >
+                      {isDownloadBusy('pytorch-cpu') ? (
+                        <Icon icon="svg-spinners:ring-resize" className="h-4 w-4 animate-spin" />
+                      ) : (
+                        <>
+                          <HugeiconsIcon icon={Download01Icon} size={16} className="h-4 w-4 mr-2" />
+                          Download
+                        </>
+                      )}
+                    </Button>
+                  </>
+                )}
+                {installedProviders.includes('pytorch-cpu') && (
+                  <Button
+                    onClick={() => handleDelete('pytorch-cpu')}
+                    size="sm"
+                    variant="outline"
+                    disabled={isStarting}
+                    className="shrink-0"
+                  >
+                    <HugeiconsIcon icon={Delete01Icon} size={16} className="h-4 w-4 mr-2" />
+                    Uninstall
+                  </Button>
+                )}
+              </div>
+            </div>
+
+            {/* MLX bundled (macOS Apple Silicon only) */}
+            <div className="flex items-center justify-between py-2">
+              <div className={`flex items-center space-x-3 flex-1 ${!isMacOS() ? 'opacity-50' : ''}`}>
+                <RadioGroupItem value="apple-mlx" id="mlx" disabled={isStarting || !isMacOS()} />
+                <Label
+                  htmlFor="mlx"
+                  className={`flex-1 ${isStarting || !isMacOS() ? 'cursor-not-allowed' : 'cursor-pointer'}`}
+                >
+                  <div className="font-medium">Apple MLX</div>
+                  <div className="text-sm text-muted-foreground">
+                    {isMacOS()
+                      ? 'Bundled with this version, optimized for Apple Silicon'
+                      : 'Only available on Apple Silicon'}
+                  </div>
+                </Label>
+              </div>
+              {!isMacOS() && (
+                <Button size="sm" variant="secondary" disabled>
+                  Not Available on {getPlatformName()}
+                </Button>
+              )}
+            </div>
+
+            {/* Remote */}
+            <div className="flex items-center justify-between py-2">
+              <div className="flex items-center space-x-3 flex-1 opacity-50">
+                <RadioGroupItem value="remote" id="remote" disabled />
+                <Label htmlFor="remote" className="flex-1 cursor-not-allowed">
+                  <div className="font-medium">Remote Server</div>
+                  <div className="text-sm text-muted-foreground">
+                    Connect to your own TTS server
+                  </div>
+                </Label>
+              </div>
+              <Button size="sm" variant="secondary" disabled>
+                Coming Soon
+              </Button>
+            </div>
+
+            {/* OpenAI */}
+            <div className="flex items-center justify-between py-2">
+              <div className="flex items-center space-x-3 flex-1 opacity-50">
+                <RadioGroupItem value="openai" id="openai" disabled />
+                <Label htmlFor="openai" className="flex-1 cursor-not-allowed">
+                  <div className="font-medium">OpenAI API</div>
+                  <div className="text-sm text-muted-foreground">Use OpenAI's TTS API</div>
+                </Label>
+              </div>
+              <Button size="sm" variant="secondary" disabled>
+                Coming Soon
+              </Button>
+            </div>
+          </RadioGroup>
+          <p className="text-xs text-muted-foreground mt-5">
+            Note: PyTorch and MLX use different versions of the same model. When switching between
+            them, you will need to redownload the model.
+          </p>
+        </CardContent>
+      </Card>
+
+      <AlertDialog open={deleteDialogOpen} onOpenChange={setDeleteDialogOpen}>
+        <AlertDialogContent>
+          <AlertDialogHeader>
+            <AlertDialogTitle>Delete Provider</AlertDialogTitle>
+            <AlertDialogDescription>
+              Are you sure you want to delete {providerToDelete}? This will remove the provider
+              binary from your system. You can download it again later if needed.
+            </AlertDialogDescription>
+          </AlertDialogHeader>
+          <AlertDialogFooter>
+            <AlertDialogCancel>Cancel</AlertDialogCancel>
+            <AlertDialogAction
+              onClick={confirmDelete}
+              className="bg-destructive text-destructive-foreground"
+            >
+              Delete
+            </AlertDialogAction>
+          </AlertDialogFooter>
+        </AlertDialogContent>
+      </AlertDialog>
+    </>
+  );
+}
diff --git a/app/src/components/ServerSettings/ServerStatus.tsx b/app/src/components/ServerSettings/ServerStatus.tsx
index 02a94ec2..8437552e 100644
--- a/app/src/components/ServerSettings/ServerStatus.tsx
+++ b/app/src/components/ServerSettings/ServerStatus.tsx
@@ -1,4 +1,6 @@
-import { Loader2, XCircle } from 'lucide-react';
+import { CancelCircleIcon } from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Icon } from '@iconify/react';
 import { Badge } from '@/components/ui/badge';
 import { Card, CardContent, CardHeader, CardTitle } from '@/components/ui/card';
 import { useServerHealth } from '@/lib/hooks/useServer';
@@ -32,12 +34,12 @@ export function ServerStatus() {
 
         {isLoading ? (
           <div className="flex items-center gap-2">
-            <Loader2 className="h-4 w-4 animate-spin" />
+            <Icon icon="svg-spinners:ring-resize" className="h-4 w-4 animate-spin" />
             <span className="text-sm">Checking connection...</span>
           </div>
         ) : error ? (
           <div className="flex items-center gap-2">
-            <XCircle className="h-4 w-4 text-destructive" />
+            <HugeiconsIcon icon={CancelCircleIcon} size={16} className="h-4 w-4 text-destructive" />
             <span className="text-sm text-destructive">Connection failed: {error.message}</span>
           </div>
         ) : health ? (
diff --git a/app/src/components/ServerSettings/UpdateStatus.tsx b/app/src/components/ServerSettings/UpdateStatus.tsx
index a3d832aa..5cab320e 100644
--- a/app/src/components/ServerSettings/UpdateStatus.tsx
+++ b/app/src/components/ServerSettings/UpdateStatus.tsx
@@ -1,4 +1,5 @@
-import { AlertCircle, Download, RefreshCw } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { AlertCircleIcon, Download01Icon, Refresh01Icon } from '@hugeicons/core-free-icons';
 import { useEffect, useState } from 'react';
 import { Badge } from '@/components/ui/badge';
 import { Button } from '@/components/ui/button';
@@ -36,21 +37,21 @@ export function UpdateStatus() {
             variant="outline"
             size="sm"
           >
-            <RefreshCw className={`h-4 w-4 mr-2 ${status.checking ? 'animate-spin' : ''}`} />
+            <HugeiconsIcon icon={Refresh01Icon} size={16} className={`h-4 w-4 mr-2 ${status.checking ? 'animate-spin' : ''}`} />
             Check for Updates
           </Button>
         </div>
 
         {status.checking && (
           <div className="flex items-center gap-2 text-sm text-muted-foreground">
-            <RefreshCw className="h-4 w-4 animate-spin" />
+            <HugeiconsIcon icon={Refresh01Icon} size={16} className="h-4 w-4 animate-spin" />
             Checking for updates...
           </div>
         )}
 
         {status.error && (
           <div className="flex items-center gap-2 text-sm text-destructive">
-            <AlertCircle className="h-4 w-4" />
+            <HugeiconsIcon icon={AlertCircleIcon} size={16} className="h-4 w-4" />
             {status.error}
           </div>
         )}
@@ -65,7 +66,7 @@ export function UpdateStatus() {
               <Badge>New</Badge>
             </div>
             <Button onClick={downloadAndInstall} className="w-full" size="sm">
-              <Download className="h-4 w-4 mr-2" />
+              <HugeiconsIcon icon={Download01Icon} size={16} className="h-4 w-4 mr-2" />
               Download Update
             </Button>
           </div>
@@ -75,7 +76,7 @@ export function UpdateStatus() {
           <div className="space-y-2">
             <div className="flex items-center justify-between text-sm">
               <div className="flex items-center gap-2">
-                <Download className="h-4 w-4" />
+                <HugeiconsIcon icon={Download01Icon} size={16} className="h-4 w-4" />
                 Downloading update...
               </div>
               {status.downloadProgress !== undefined && (
@@ -109,7 +110,7 @@ export function UpdateStatus() {
               your convenience.
             </div>
             <Button onClick={restartAndInstall} className="w-full" size="sm">
-              <RefreshCw className="h-4 w-4 mr-2" />
+              <HugeiconsIcon icon={Refresh01Icon} size={16} className="h-4 w-4 mr-2" />
               Restart Now
             </Button>
           </div>
diff --git a/app/src/components/ServerTab/ServerTab.tsx b/app/src/components/ServerTab/ServerTab.tsx
index abf91ac2..69fc7117 100644
--- a/app/src/components/ServerTab/ServerTab.tsx
+++ b/app/src/components/ServerTab/ServerTab.tsx
@@ -1,4 +1,6 @@
 import { ConnectionForm } from '@/components/ServerSettings/ConnectionForm';
+import { DataFolders } from '@/components/ServerSettings/DataFolders';
+import { ProviderSettings } from '@/components/ServerSettings/ProviderSettings';
 import { ServerStatus } from '@/components/ServerSettings/ServerStatus';
 import { UpdateStatus } from '@/components/ServerSettings/UpdateStatus';
 import { usePlatform } from '@/platform/PlatformContext';
@@ -11,6 +13,8 @@ export function ServerTab() {
         <ConnectionForm />
         <ServerStatus />
       </div>
+      <ProviderSettings />
+      <DataFolders />
       {platform.metadata.isTauri && <UpdateStatus />}
       <div className="py-8 text-center text-sm text-muted-foreground">
         Created by{' '}
diff --git a/app/src/components/Sidebar.tsx b/app/src/components/Sidebar.tsx
index a849344f..39314788 100644
--- a/app/src/components/Sidebar.tsx
+++ b/app/src/components/Sidebar.tsx
@@ -1,5 +1,14 @@
+import {
+  Book01Icon,
+  Mic01Icon,
+  PackageIcon,
+  ServerStack01Icon,
+  SpeakerIcon,
+  VolumeHighIcon,
+} from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Icon } from '@iconify/react';
 import { Link, useMatchRoute } from '@tanstack/react-router';
-import { Box, BookOpen, Loader2, Mic, Server, Speaker, Volume2 } from 'lucide-react';
 import voiceboxLogo from '@/assets/voicebox-logo.png';
 import { cn } from '@/lib/utils/cn';
 import { useGenerationStore } from '@/stores/generationStore';
@@ -10,12 +19,12 @@ interface SidebarProps {
 }
 
 const tabs = [
-  { id: 'main', path: '/', icon: Volume2, label: 'Generate' },
-  { id: 'stories', path: '/stories', icon: BookOpen, label: 'Stories' },
-  { id: 'voices', path: '/voices', icon: Mic, label: 'Voices' },
-  { id: 'audio', path: '/audio', icon: Speaker, label: 'Audio' },
-  { id: 'models', path: '/models', icon: Box, label: 'Models' },
-  { id: 'server', path: '/server', icon: Server, label: 'Server' },
+  { id: 'main', path: '/', icon: VolumeHighIcon, label: 'Generate' }, // each icon is handed to <HugeiconsIcon icon={...}> when the tab link is rendered
+  { id: 'stories', path: '/stories', icon: Book01Icon, label: 'Stories' },
+  { id: 'voices', path: '/voices', icon: Mic01Icon, label: 'Voices' },
+  { id: 'audio', path: '/audio', icon: SpeakerIcon, label: 'Audio' },
+  { id: 'models', path: '/models', icon: PackageIcon, label: 'Models' },
+  { id: 'server', path: '/server', icon: ServerStack01Icon, label: 'Server' },
 ];
 
 export function Sidebar({ isMacOS }: SidebarProps) {
@@ -42,9 +51,7 @@ export function Sidebar({ isMacOS }: SidebarProps) {
           const Icon = tab.icon;
           // For index route, use exact match; for others, use default matching
           const isActive =
-            tab.path === '/'
-              ? matchRoute({ to: '/', exact: true })
-              : matchRoute({ to: tab.path });
+            tab.path === '/' ? matchRoute({ to: '/' }) : matchRoute({ to: tab.path });
 
           return (
             <Link
@@ -58,7 +65,7 @@ export function Sidebar({ isMacOS }: SidebarProps) {
               title={tab.label}
               aria-label={tab.label}
             >
-              <Icon className="h-5 w-5" />
+              <HugeiconsIcon icon={Icon} size={20} className="h-5 w-5" />
             </Link>
           );
         })}
@@ -75,7 +82,7 @@ export function Sidebar({ isMacOS }: SidebarProps) {
             isPlayerVisible ? 'mb-[120px]' : 'mb-0',
           )}
         >
-          <Loader2 className="h-6 w-6 text-accent animate-spin" />
+          <Icon icon="svg-spinners:ring-resize" className="h-6 w-6 text-accent animate-spin" />
         </div>
       )}
     </div>
diff --git a/app/src/components/StoriesTab/StoryChatItem.tsx b/app/src/components/StoriesTab/StoryChatItem.tsx
index 19fa2249..ac16352a 100644
--- a/app/src/components/StoriesTab/StoryChatItem.tsx
+++ b/app/src/components/StoriesTab/StoryChatItem.tsx
@@ -1,7 +1,7 @@
 import { useSortable } from '@dnd-kit/sortable';
 import { CSS } from '@dnd-kit/utilities';
-import { GripVertical, Mic, MoreHorizontal, Play, Trash2 } from 'lucide-react';
-import { useState } from 'react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { DragDropVerticalIcon, MoreHorizontalIcon, PlayIcon, Delete01Icon } from '@hugeicons/core-free-icons';
 import { Button } from '@/components/ui/button';
 import {
   DropdownMenu,
@@ -10,10 +10,10 @@ import {
   DropdownMenuTrigger,
 } from '@/components/ui/dropdown-menu';
 import { Textarea } from '@/components/ui/textarea';
+import { ProfileAvatar } from '@/components/VoiceProfiles/ProfileAvatar';
 import type { StoryItemDetail } from '@/lib/api/types';
 import { cn } from '@/lib/utils/cn';
 import { useStoryStore } from '@/stores/storyStore';
-import { useServerStore } from '@/stores/serverStore';
 
 interface StoryChatItemProps {
   item: StoryItemDetail;
@@ -35,10 +35,6 @@ export function StoryChatItem({
   isDragging,
 }: StoryChatItemProps) {
   const seek = useStoryStore((state) => state.seek);
-  const serverUrl = useServerStore((state) => state.serverUrl);
-  const [avatarError, setAvatarError] = useState(false);
-
-  const avatarUrl = `${serverUrl}/profiles/${item.profile_id}/avatar`;
 
   // Check if this item is currently playing based on timecode
   const itemStartMs = item.start_time_ms;
@@ -74,27 +70,18 @@ export function StoryChatItem({
           className="shrink-0 cursor-grab active:cursor-grabbing touch-none text-muted-foreground hover:text-foreground transition-colors"
           {...dragHandleProps}
         >
-          <GripVertical className="h-5 w-5" />
+          <HugeiconsIcon icon={DragDropVerticalIcon} size={20} className="h-5 w-5" />
         </button>
       )}
 
       {/* Voice Avatar */}
       <div className="shrink-0">
-        <div className="h-10 w-10 rounded-full bg-muted flex items-center justify-center overflow-hidden">
-          {!avatarError ? (
-            <img
-              src={avatarUrl}
-              alt={`${item.profile_name} avatar`}
-              className={cn(
-                'h-full w-full object-cover transition-all duration-200',
-                !isCurrentlyPlaying && 'grayscale'
-              )}
-              onError={() => setAvatarError(true)}
-            />
-          ) : (
-            <Mic className="h-5 w-5 text-muted-foreground" />
-          )}
-        </div>
+        <ProfileAvatar
+          profileId={item.profile_id}
+          size="lg"
+          grayscale={!isCurrentlyPlaying}
+          alt={`${item.profile_name} avatar`}
+        />
       </div>
 
       {/* Content */}
@@ -119,16 +106,16 @@ export function StoryChatItem({
         <DropdownMenu>
           <DropdownMenuTrigger asChild>
             <Button variant="ghost" size="icon" className="h-8 w-8" aria-label="Actions">
-              <MoreHorizontal className="h-4 w-4" />
+              <HugeiconsIcon icon={MoreHorizontalIcon} size={16} className="h-4 w-4" />
             </Button>
           </DropdownMenuTrigger>
           <DropdownMenuContent align="end">
             <DropdownMenuItem onClick={handlePlay}>
-              <Play className="mr-2 h-4 w-4" />
+              <HugeiconsIcon icon={PlayIcon} size={16} className="mr-2 h-4 w-4" />
               Play from here
             </DropdownMenuItem>
             <DropdownMenuItem onClick={onRemove} className="text-destructive focus:text-destructive">
-              <Trash2 className="mr-2 h-4 w-4" />
+              <HugeiconsIcon icon={Delete01Icon} size={16} className="mr-2 h-4 w-4" />
               Remove from Story
             </DropdownMenuItem>
           </DropdownMenuContent>
diff --git a/app/src/components/StoriesTab/StoryContent.tsx b/app/src/components/StoriesTab/StoryContent.tsx
index 483e6657..518c42a0 100644
--- a/app/src/components/StoriesTab/StoryContent.tsx
+++ b/app/src/components/StoriesTab/StoryContent.tsx
@@ -13,7 +13,8 @@ import {
   sortableKeyboardCoordinates,
   verticalListSortingStrategy,
 } from '@dnd-kit/sortable';
-import { Download, Plus } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Download01Icon, Add01Icon } from '@hugeicons/core-free-icons';
 import { useEffect, useMemo, useRef, useState } from 'react';
 import { Button } from '@/components/ui/button';
 import { Input } from '@/components/ui/input';
@@ -271,7 +272,7 @@ export function StoryContent() {
           <Popover open={isAddOpen} onOpenChange={setIsAddOpen}>
             <PopoverTrigger asChild>
               <Button variant="outline" size="sm">
-                <Plus className="mr-2 h-4 w-4" />
+                <HugeiconsIcon icon={Add01Icon} size={16} className="mr-2 h-4 w-4" />
                 Add
               </Button>
             </PopoverTrigger>
@@ -316,7 +317,7 @@ export function StoryContent() {
               onClick={handleExportAudio}
               disabled={exportAudio.isPending}
             >
-              <Download className="mr-2 h-4 w-4" />
+              <HugeiconsIcon icon={Download01Icon} size={16} className="mr-2 h-4 w-4" />
               Export Audio
             </Button>
           )}
diff --git a/app/src/components/StoriesTab/StoryList.tsx b/app/src/components/StoriesTab/StoryList.tsx
index ebbd6616..dd78d245 100644
--- a/app/src/components/StoriesTab/StoryList.tsx
+++ b/app/src/components/StoriesTab/StoryList.tsx
@@ -1,5 +1,6 @@
-import { Plus, BookOpen, MoreHorizontal, Pencil, Trash2 } from 'lucide-react';
-import { useState } from 'react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Add01Icon, Book01Icon, MoreHorizontalIcon, PencilIcon, Delete01Icon } from '@hugeicons/core-free-icons';
+import { useState, useMemo } from 'react';
 import {
   AlertDialog,
   AlertDialogAction,
@@ -29,7 +30,7 @@ import { Input } from '@/components/ui/input';
 import { Label } from '@/components/ui/label';
 import { Textarea } from '@/components/ui/textarea';
 import { useToast } from '@/components/ui/use-toast';
-import { useStories, useCreateStory, useUpdateStory, useDeleteStory } from '@/lib/hooks/useStories';
+import { useStories, useCreateStory, useUpdateStory, useDeleteStory, useStory } from '@/lib/hooks/useStories';
 import { cn } from '@/lib/utils/cn';
 import { formatDate } from '@/lib/utils/format';
 import { useStoryStore } from '@/stores/storyStore';
@@ -38,6 +39,8 @@ export function StoryList() {
   const { data: stories, isLoading } = useStories();
   const selectedStoryId = useStoryStore((state) => state.selectedStoryId);
   const setSelectedStoryId = useStoryStore((state) => state.setSelectedStoryId);
+  const trackEditorHeight = useStoryStore((state) => state.trackEditorHeight);
+  const { data: currentStory } = useStory(selectedStoryId);
   const createStory = useCreateStory();
   const updateStory = useUpdateStory();
   const deleteStory = useDeleteStory();
@@ -54,6 +57,16 @@ export function StoryList() {
   const [newStoryDescription, setNewStoryDescription] = useState('');
   const { toast } = useToast();
 
+  // Calculate bottom padding to account for FloatingGenerateBox and StoryTrackEditor
+  const hasTrackEditor = currentStory && currentStory.items.length > 0;
+  const bottomPadding = useMemo(() => {
+    // FloatingGenerateBox height (~100px) + gap (24px)
+    const generateBoxHeight = 124;
+    // Track editor height when visible
+    const editorHeight = hasTrackEditor ? trackEditorHeight + 24 : 0;
+    return generateBoxHeight + editorHeight;
+  }, [hasTrackEditor, trackEditorHeight]);
+
   const handleCreateStory = () => {
     if (!newStoryName.trim()) {
       toast({
@@ -177,16 +190,19 @@ export function StoryList() {
       <div className="flex items-center justify-between mb-4 px-1">
         <h2 className="text-2xl font-bold">Stories</h2>
         <Button onClick={() => setCreateDialogOpen(true)} size="sm">
-          <Plus className="mr-2 h-4 w-4" />
+          <HugeiconsIcon icon={Add01Icon} size={16} className="mr-2 h-4 w-4" />
           New Story
         </Button>
       </div>
 
       {/* Story List */}
-      <div className="flex-1 min-h-0 overflow-y-auto space-y-2">
+      <div 
+        className="flex-1 min-h-0 overflow-y-auto space-y-2"
+        style={{ paddingBottom: `${bottomPadding}px` }}
+      >
         {storyList.length === 0 ? (
           <div className="text-center py-12 px-5 border-2 border-dashed border-muted rounded-2xl text-muted-foreground">
-            <BookOpen className="h-12 w-12 mx-auto mb-4 opacity-50" />
+            <HugeiconsIcon icon={Book01Icon} size={48} className="h-12 w-12 mx-auto mb-4 opacity-50" />
             <p className="text-sm">No stories yet</p>
             <p className="text-xs mt-2">Create your first story to get started</p>
           </div>
@@ -227,19 +243,19 @@ export function StoryList() {
                       className="h-8 w-8 opacity-0 group-hover:opacity-100 transition-opacity"
                       onClick={(e) => e.stopPropagation()}
                     >
-                      <MoreHorizontal className="h-4 w-4" />
+                      <HugeiconsIcon icon={MoreHorizontalIcon} size={16} className="h-4 w-4" />
                     </Button>
                   </DropdownMenuTrigger>
                   <DropdownMenuContent align="end">
                     <DropdownMenuItem onClick={() => handleEditClick(story)}>
-                      <Pencil className="mr-2 h-4 w-4" />
+                      <HugeiconsIcon icon={PencilIcon} size={16} className="mr-2 h-4 w-4" />
                       Edit
                     </DropdownMenuItem>
                     <DropdownMenuItem
                       onClick={() => handleDeleteClick(story.id)}
                       className="text-destructive focus:text-destructive"
                     >
-                      <Trash2 className="mr-2 h-4 w-4" />
+                      <HugeiconsIcon icon={Delete01Icon} size={16} className="mr-2 h-4 w-4" />
                       Delete
                     </DropdownMenuItem>
                   </DropdownMenuContent>
diff --git a/app/src/components/StoriesTab/StoryTrackEditor.tsx b/app/src/components/StoriesTab/StoryTrackEditor.tsx
index 74dbde25..95a10296 100644
--- a/app/src/components/StoriesTab/StoryTrackEditor.tsx
+++ b/app/src/components/StoriesTab/StoryTrackEditor.tsx
@@ -1,14 +1,15 @@
+import { HugeiconsIcon } from '@hugeicons/react';
 import {
-  Copy,
-  GripHorizontal,
-  Minus,
-  Pause,
-  Play,
-  Plus,
-  Scissors,
-  Square,
-  Trash2,
-} from 'lucide-react';
+  Copy01Icon,
+  DragDropHorizontalIcon,
+  RemoveIcon,
+  PauseIcon,
+  PlayIcon,
+  Add01Icon,
+  Scissor01Icon,
+  SquareIcon,
+  Delete01Icon,
+} from '@hugeicons/core-free-icons';
 import { useCallback, useEffect, useMemo, useRef, useState } from 'react';
 import WaveSurfer from 'wavesurfer.js';
 import { Button } from '@/components/ui/button';
@@ -723,7 +724,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) {
           onMouseDown={handleResizeStart}
           aria-label="Resize track editor"
         >
-          <GripHorizontal className="h-3 w-3 text-muted-foreground/50 group-hover:text-muted-foreground" />
+          <HugeiconsIcon icon={DragDropHorizontalIcon} size={12} className="h-3 w-3 text-muted-foreground/50 group-hover:text-muted-foreground" />
         </button>
 
         {/* Toolbar */}
@@ -737,7 +738,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) {
               onClick={handlePlayPause}
               title="Play/Pause (Space)"
             >
-              {isCurrentlyPlaying ? <Pause className="h-4 w-4" /> : <Play className="h-4 w-4" />}
+              {isCurrentlyPlaying ? <HugeiconsIcon icon={PauseIcon} size={16} className="h-4 w-4" /> : <HugeiconsIcon icon={PlayIcon} size={16} className="h-4 w-4" />}
             </Button>
             <Button
               variant="ghost"
@@ -746,7 +747,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) {
               onClick={handleStop}
               disabled={!isCurrentlyPlaying}
             >
-              <Square className="h-3 w-3" />
+              <HugeiconsIcon icon={SquareIcon} size={12} className="h-3 w-3" />
             </Button>
             <span className="text-xs text-muted-foreground tabular-nums ml-2">
               {formatTime(currentTimeMs)} / {formatTime(totalDurationMs)}
@@ -763,7 +764,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) {
                 onClick={handleSplit}
                 title="Split at playhead (S)"
               >
-                <Scissors className="h-4 w-4" />
+                <HugeiconsIcon icon={Scissor01Icon} size={16} className="h-4 w-4" />
               </Button>
               <Button
                 variant="ghost"
@@ -772,7 +773,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) {
                 onClick={handleDuplicate}
                 title="Duplicate (Cmd/Ctrl+D)"
               >
-                <Copy className="h-4 w-4" />
+                <HugeiconsIcon icon={Copy01Icon} size={16} className="h-4 w-4" />
               </Button>
               <Button
                 variant="ghost"
@@ -781,7 +782,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) {
                 onClick={handleDelete}
                 title="Delete (Delete/Backspace)"
               >
-                <Trash2 className="h-4 w-4" />
+                <HugeiconsIcon icon={Delete01Icon} size={16} className="h-4 w-4" />
               </Button>
             </div>
           )}
@@ -790,10 +791,10 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) {
           <div className="flex items-center gap-2">
             <span className="text-xs text-muted-foreground">Zoom:</span>
             <Button variant="ghost" size="icon" className="h-6 w-6" onClick={handleZoomOut}>
-              <Minus className="h-3 w-3" />
+              <HugeiconsIcon icon={RemoveIcon} size={12} className="h-3 w-3" />
             </Button>
             <Button variant="ghost" size="icon" className="h-6 w-6" onClick={handleZoomIn}>
-              <Plus className="h-3 w-3" />
+              <HugeiconsIcon icon={Add01Icon} size={12} className="h-3 w-3" />
             </Button>
           </div>
         </div>
@@ -837,7 +838,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) {
               type="button"
               className="h-6 border-b bg-muted/20 sticky top-0 z-10 cursor-pointer text-left"
               style={{ width: `${timelineWidth}px` }}
-              onClick={handleTimelineClick}
+              onClick={(e) => handleTimelineClick(e as unknown as React.MouseEvent<HTMLDivElement>)}
               aria-label="Seek timeline"
             >
               {timeMarkers.map((ms) => (
@@ -878,7 +879,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) {
               <button
                 type="button"
                 className="absolute inset-0 z-0 cursor-pointer"
-                onClick={handleTimelineClick}
+                onClick={(e) => handleTimelineClick(e as unknown as React.MouseEvent<HTMLDivElement>)}
                 aria-label="Seek timeline"
               />
 
diff --git a/app/src/components/VoiceProfiles/AudioSampleRecording.tsx b/app/src/components/VoiceProfiles/AudioSampleRecording.tsx
index 4f2db4e3..4364b351 100644
--- a/app/src/components/VoiceProfiles/AudioSampleRecording.tsx
+++ b/app/src/components/VoiceProfiles/AudioSampleRecording.tsx
@@ -1,4 +1,5 @@
-import { Mic, Pause, Play, Square } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Mic01Icon, PauseIcon, PlayIcon, SquareIcon } from '@hugeicons/core-free-icons';
 import { memo, useEffect, useState } from 'react';
 import { Visualizer } from 'react-sound-visualizer';
 import { Button } from '@/components/ui/button';
@@ -95,7 +96,7 @@ export function AudioSampleRecording({
                 size="lg"
                 className="relative z-10 flex items-center gap-2"
               >
-                <Mic className="h-5 w-5" />
+                <HugeiconsIcon icon={Mic01Icon} size={20} className="h-5 w-5" />
                 Start Recording
               </Button>
               <p className="relative z-10 text-sm text-muted-foreground text-center">
@@ -122,7 +123,7 @@ export function AudioSampleRecording({
                 onClick={onStop}
                 className="relative z-10 flex items-center gap-2 bg-accent text-accent-foreground hover:bg-accent/90"
               >
-                <Square className="h-4 w-4" />
+                <HugeiconsIcon icon={SquareIcon} size={16} className="h-4 w-4" />
                 Stop Recording
               </Button>
               <p className="relative z-10 text-sm text-muted-foreground text-center">
@@ -134,13 +135,13 @@ export function AudioSampleRecording({
           {file && !isRecording && (
             <div className="flex flex-col items-center justify-center gap-4 p-4 border-2 border-primary rounded-lg bg-primary/5 min-h-[180px]">
               <div className="flex items-center gap-2">
-                <Mic className="h-5 w-5 text-primary" />
+                <HugeiconsIcon icon={Mic01Icon} size={20} className="h-5 w-5 text-primary" />
                 <span className="font-medium">Recording complete</span>
               </div>
               <p className="text-sm text-muted-foreground text-center">File: {file.name}</p>
               <div className="flex gap-2">
                 <Button type="button" size="icon" variant="outline" onClick={onPlayPause}>
-                  {isPlaying ? <Pause className="h-4 w-4" /> : <Play className="h-4 w-4" />}
+                  {isPlaying ? <HugeiconsIcon icon={PauseIcon} size={16} className="h-4 w-4" /> : <HugeiconsIcon icon={PlayIcon} size={16} className="h-4 w-4" />}
                 </Button>
                 <Button
                   type="button"
@@ -149,7 +150,7 @@ export function AudioSampleRecording({
                   disabled={isTranscribing}
                   className="flex items-center gap-2"
                 >
-                  <Mic className="h-4 w-4" />
+                  <HugeiconsIcon icon={Mic01Icon} size={16} className="h-4 w-4" />
                   {isTranscribing ? 'Transcribing...' : 'Transcribe'}
                 </Button>
                 <Button
diff --git a/app/src/components/VoiceProfiles/AudioSampleSystem.tsx b/app/src/components/VoiceProfiles/AudioSampleSystem.tsx
index 0cc892b2..d120e1a1 100644
--- a/app/src/components/VoiceProfiles/AudioSampleSystem.tsx
+++ b/app/src/components/VoiceProfiles/AudioSampleSystem.tsx
@@ -1,4 +1,5 @@
-import { Mic, Monitor, Pause, Play, Square } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Mic01Icon, DeskIcon, PauseIcon, PlayIcon, SquareIcon } from '@hugeicons/core-free-icons';
 import { Button } from '@/components/ui/button';
 import { FormControl, FormItem, FormMessage } from '@/components/ui/form';
 import { formatAudioDuration } from '@/lib/utils/audio';
@@ -35,7 +36,7 @@ export function AudioSampleSystem({
           {!isRecording && !file && (
             <div className="flex flex-col items-center justify-center gap-4 p-4 border-2 border-dashed rounded-lg min-h-[180px]">
               <Button type="button" onClick={onStart} size="lg" className="flex items-center gap-2">
-                <Monitor className="h-5 w-5" />
+                <HugeiconsIcon icon={DeskIcon} size={20} className="h-5 w-5" />
                 Start Capture
               </Button>
               <p className="text-sm text-muted-foreground text-center">
@@ -60,7 +61,7 @@ export function AudioSampleSystem({
                 variant="destructive"
                 className="flex items-center gap-2"
               >
-                <Square className="h-4 w-4" />
+                <HugeiconsIcon icon={SquareIcon} size={16} className="h-4 w-4" />
                 Stop Capture
               </Button>
               <p className="text-sm text-muted-foreground text-center">
@@ -72,13 +73,13 @@ export function AudioSampleSystem({
           {file && !isRecording && (
             <div className="flex flex-col items-center justify-center gap-4 p-4 border-2 border-primary rounded-lg bg-primary/5 min-h-[180px]">
               <div className="flex items-center gap-2">
-                <Monitor className="h-5 w-5 text-primary" />
+                <HugeiconsIcon icon={DeskIcon} size={20} className="h-5 w-5 text-primary" />
                 <span className="font-medium">Capture complete</span>
               </div>
               <p className="text-sm text-muted-foreground text-center">File: {file.name}</p>
               <div className="flex gap-2">
                 <Button type="button" size="icon" variant="outline" onClick={onPlayPause}>
-                  {isPlaying ? <Pause className="h-4 w-4" /> : <Play className="h-4 w-4" />}
+                  {isPlaying ? <HugeiconsIcon icon={PauseIcon} size={16} className="h-4 w-4" /> : <HugeiconsIcon icon={PlayIcon} size={16} className="h-4 w-4" />}
                 </Button>
                 <Button
                   type="button"
@@ -87,7 +88,7 @@ export function AudioSampleSystem({
                   disabled={isTranscribing}
                   className="flex items-center gap-2"
                 >
-                  <Mic className="h-4 w-4" />
+                  <HugeiconsIcon icon={Mic01Icon} size={16} className="h-4 w-4" />
                   {isTranscribing ? 'Transcribing...' : 'Transcribe'}
                 </Button>
                 <Button
diff --git a/app/src/components/VoiceProfiles/AudioSampleUpload.tsx b/app/src/components/VoiceProfiles/AudioSampleUpload.tsx
index c66ded14..9a954121 100644
--- a/app/src/components/VoiceProfiles/AudioSampleUpload.tsx
+++ b/app/src/components/VoiceProfiles/AudioSampleUpload.tsx
@@ -1,4 +1,5 @@
-import { Mic, Pause, Play, Upload } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Mic01Icon, PauseIcon, PlayIcon, Upload01Icon } from '@hugeicons/core-free-icons';
 import { useRef, useState } from 'react';
 import { Button } from '@/components/ui/button';
 import { FormControl, FormItem, FormMessage } from '@/components/ui/form';
@@ -89,7 +90,7 @@ export function AudioSampleUpload({
                   onClick={() => fileInputRef.current?.click()}
                   className="flex items-center gap-2"
                 >
-                  <Upload className="h-5 w-5" />
+                  <HugeiconsIcon icon={Upload01Icon} size={20} className="h-5 w-5" />
                   Choose File
                 </Button>
                 <p className="text-sm text-muted-foreground text-center">
@@ -99,7 +100,7 @@ export function AudioSampleUpload({
             ) : (
               <>
                 <div className="flex items-center gap-2">
-                  <Upload className="h-5 w-5 text-primary" />
+                  <HugeiconsIcon icon={Upload01Icon} size={20} className="h-5 w-5 text-primary" />
                   <span className="font-medium">File uploaded</span>
                 </div>
                 <p className="text-sm text-muted-foreground text-center">File: {file.name}</p>
@@ -111,7 +112,7 @@ export function AudioSampleUpload({
                     onClick={onPlayPause}
                     disabled={isValidating}
                   >
-                    {isPlaying ? <Pause className="h-4 w-4" /> : <Play className="h-4 w-4" />}
+                    {isPlaying ? <HugeiconsIcon icon={PauseIcon} size={16} className="h-4 w-4" /> : <HugeiconsIcon icon={PlayIcon} size={16} className="h-4 w-4" />}
                   </Button>
                   <Button
                     type="button"
@@ -120,7 +121,7 @@ export function AudioSampleUpload({
                     disabled={isTranscribing || isValidating || isDisabled}
                     className="flex items-center gap-2"
                   >
-                    <Mic className="h-4 w-4" />
+                    <HugeiconsIcon icon={Mic01Icon} size={16} className="h-4 w-4" />
                     {isTranscribing ? 'Transcribing...' : 'Transcribe'}
                   </Button>
                   <Button
diff --git a/app/src/components/VoiceProfiles/ProfileAvatar.tsx b/app/src/components/VoiceProfiles/ProfileAvatar.tsx
new file mode 100644
index 00000000..0743fb3f
--- /dev/null
+++ b/app/src/components/VoiceProfiles/ProfileAvatar.tsx
@@ -0,0 +1,100 @@
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Mic01Icon } from '@hugeicons/core-free-icons';
+import { useState } from 'react';
+import { cn } from '@/lib/utils/cn';
+import { useServerStore } from '@/stores/serverStore';
+
+/** Props accepted by {@link ProfileAvatar}. */
+interface ProfileAvatarProps {
+  /** Profile whose avatar is requested from `{serverUrl}/profiles/{profileId}/avatar`. */
+  profileId: string;
+  /**
+   * Pass `null` or `''` to skip the image request and render the fallback
+   * icon; leave `undefined` to always attempt the request.
+   */
+  avatarPath?: string | null;
+  /** Size preset for the container and the fallback icon. Defaults to `'md'`. */
+  size?: 'sm' | 'md' | 'lg' | 'xl';
+  /** Applies the `grayscale` class to the image when true. Defaults to `false`. */
+  grayscale?: boolean;
+  /** Extra classes merged onto the outer container. */
+  className?: string;
+  /** Alt text for the avatar image. Defaults to `'Profile avatar'`. */
+  alt?: string;
+}
+
+// Container dimensions for each size preset.
+const sizeClasses = {
+  sm: 'h-6 w-6',
+  md: 'h-8 w-8',
+  lg: 'h-10 w-10',
+  xl: 'h-24 w-24',
+};
+
+// Value passed to the fallback icon's `size` prop for each size preset.
+const iconSizes = {
+  sm: 14,
+  md: 16,
+  lg: 20,
+  xl: 40,
+};
+
+// Classes applied to the fallback icon for each size preset.
+const iconClassNames = {
+  sm: 'h-3.5 w-3.5',
+  md: 'h-4 w-4',
+  lg: 'h-5 w-5',
+  xl: 'h-10 w-10',
+};
+
+/**
+ * Round avatar for a voice profile. Renders the profile's avatar image, or a
+ * microphone icon when no image should be requested or the image failed to load.
+ */
+export function ProfileAvatar({
+  profileId,
+  avatarPath,
+  size = 'md',
+  grayscale = false,
+  className,
+  alt = 'Profile avatar',
+}: ProfileAvatarProps) {
+  // Remember WHICH url failed instead of a plain boolean: when profileId or
+  // serverUrl changes on a mounted instance, the new url no longer matches and
+  // gets a fresh load attempt rather than staying stuck on the fallback icon.
+  const [failedUrl, setFailedUrl] = useState<string | null>(null);
+  const serverUrl = useServerStore((state) => state.serverUrl);
+
+  // If avatarPath is explicitly null or empty string, don't try to load avatar
+  // Otherwise, always try to load (avatarPath might not be available in all contexts)
+  const avatarUrl =
+    avatarPath === null || avatarPath === '' ? null : `${serverUrl}/profiles/${profileId}/avatar`;
+
+  return (
+    <div
+      className={cn(
+        sizeClasses[size],
+        'rounded-full bg-muted flex items-center justify-center shrink-0 overflow-hidden',
+        className,
+      )}
+    >
+      {avatarUrl && avatarUrl !== failedUrl ? (
+        <img
+          src={avatarUrl}
+          alt={alt}
+          className={cn(
+            'h-full w-full object-cover transition-all duration-200',
+            grayscale && 'grayscale',
+          )}
+          onError={() => setFailedUrl(avatarUrl)}
+        />
+      ) : (
+        <HugeiconsIcon
+          icon={Mic01Icon}
+          size={iconSizes[size]}
+          className={cn(iconClassNames[size], 'text-muted-foreground')}
+        />
+      )}
+    </div>
+  );
+}
diff --git a/app/src/components/VoiceProfiles/ProfileCard.tsx b/app/src/components/VoiceProfiles/ProfileCard.tsx
index e879294f..40742f40 100644
--- a/app/src/components/VoiceProfiles/ProfileCard.tsx
+++ b/app/src/components/VoiceProfiles/ProfileCard.tsx
@@ -1,4 +1,5 @@
-import { Download, Edit, Mic, Trash2 } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Download01Icon, Edit01Icon, Delete01Icon } from '@hugeicons/core-free-icons';
 import { useState } from 'react';
 import { Badge } from '@/components/ui/badge';
 import { Button } from '@/components/ui/button';
@@ -12,10 +13,10 @@ import {
   DialogHeader,
   DialogTitle,
 } from '@/components/ui/dialog';
+import { ProfileAvatar } from '@/components/VoiceProfiles/ProfileAvatar';
 import type { VoiceProfileResponse } from '@/lib/api/types';
 import { useDeleteProfile, useExportProfile } from '@/lib/hooks/useProfiles';
 import { cn } from '@/lib/utils/cn';
-import { useServerStore } from '@/stores/serverStore';
 import { useUIStore } from '@/stores/uiStore';
 
 interface ProfileCardProps {
@@ -24,19 +25,15 @@ interface ProfileCardProps {
 
 export function ProfileCard({ profile }: ProfileCardProps) {
   const [deleteDialogOpen, setDeleteDialogOpen] = useState(false);
-  const [avatarError, setAvatarError] = useState(false);
   const deleteProfile = useDeleteProfile();
   const exportProfile = useExportProfile();
   const setEditingProfileId = useUIStore((state) => state.setEditingProfileId);
   const setProfileDialogOpen = useUIStore((state) => state.setProfileDialogOpen);
   const selectedProfileId = useUIStore((state) => state.selectedProfileId);
   const setSelectedProfileId = useUIStore((state) => state.setSelectedProfileId);
-  const serverUrl = useServerStore((state) => state.serverUrl);
 
   const isSelected = selectedProfileId === profile.id;
 
-  const avatarUrl = profile.avatar_path ? `${serverUrl}/profiles/${profile.id}/avatar` : null;
-
   const handleSelect = () => {
     setSelectedProfileId(isSelected ? null : profile.id);
   };
@@ -72,21 +69,13 @@ export function ProfileCard({ profile }: ProfileCardProps) {
       >
         <CardHeader className="p-3 pb-2">
           <CardTitle className="flex items-center gap-1.5 text-base font-medium">
-            <div className="h-6 w-6 rounded-full bg-muted flex items-center justify-center shrink-0 overflow-hidden">
-              {avatarUrl && !avatarError ? (
-                <img
-                  src={avatarUrl}
-                  alt={`${profile.name} avatar`}
-                  className={cn(
-                    'h-full w-full object-cover transition-all duration-200',
-                    !isSelected && 'grayscale',
-                  )}
-                  onError={() => setAvatarError(true)}
-                />
-              ) : (
-                <Mic className="h-3.5 w-3.5 text-muted-foreground" />
-              )}
-            </div>
+            <ProfileAvatar
+              profileId={profile.id}
+              avatarPath={profile.avatar_path}
+              size="sm"
+              grayscale={!isSelected}
+              alt={`${profile.name} avatar`}
+            />
             <span className="break-words">{profile.name}</span>
           </CardTitle>
         </CardHeader>
@@ -101,13 +90,13 @@ export function ProfileCard({ profile }: ProfileCardProps) {
           </div>
           <div className="flex gap-0.5 justify-end items-end mt-auto">
             <CircleButton
-              icon={Download}
+              icon={(props) => <HugeiconsIcon icon={Download01Icon} size={14} {...props} />}
               onClick={handleExport}
               disabled={exportProfile.isPending}
               aria-label="Export profile"
             />
             <CircleButton
-              icon={Edit}
+              icon={(props) => <HugeiconsIcon icon={Edit01Icon} size={14} {...props} />}
               onClick={(e) => {
                 e.stopPropagation();
                 handleEdit();
@@ -115,7 +104,7 @@ export function ProfileCard({ profile }: ProfileCardProps) {
               aria-label="Edit profile"
             />
             <CircleButton
-              icon={Trash2}
+              icon={(props) => <HugeiconsIcon icon={Delete01Icon} size={14} {...props} />}
               onClick={handleDeleteClick}
               disabled={deleteProfile.isPending}
               aria-label="Delete profile"
diff --git a/app/src/components/VoiceProfiles/ProfileForm.tsx b/app/src/components/VoiceProfiles/ProfileForm.tsx
index f4fc5711..3fcd987e 100644
--- a/app/src/components/VoiceProfiles/ProfileForm.tsx
+++ b/app/src/components/VoiceProfiles/ProfileForm.tsx
@@ -1,5 +1,6 @@
 import { zodResolver } from '@hookform/resolvers/zod';
-import { Edit2, Mic, Monitor, Upload, X } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Edit02Icon, Mic01Icon, DeskIcon, Upload01Icon, Cancel01Icon } from '@hugeicons/core-free-icons';
 import { useEffect, useRef, useState } from 'react';
 import { useForm } from 'react-hook-form';
 import * as z from 'zod';
@@ -635,7 +636,7 @@ export function ProfileForm() {
                     setSampleMode('record');
                   }}
                 >
-                  <X className="h-3 w-3 mr-1" />
+                  <HugeiconsIcon icon={Cancel01Icon} size={12} className="h-3 w-3 mr-1" />
                   Discard
                 </Button>
               </div>
@@ -668,16 +669,16 @@ export function ProfileForm() {
                           className={`grid w-full ${platform.metadata.isTauri && isSystemAudioSupported ? 'grid-cols-3' : 'grid-cols-2'}`}
                         >
                           <TabsTrigger value="upload" className="flex items-center gap-2">
-                            <Upload className="h-4 w-4 shrink-0" />
+                            <HugeiconsIcon icon={Upload01Icon} size={16} className="h-4 w-4 shrink-0" />
                             Upload
                           </TabsTrigger>
                           <TabsTrigger value="record" className="flex items-center gap-2">
-                            <Mic className="h-4 w-4 shrink-0" />
+                            <HugeiconsIcon icon={Mic01Icon} size={16} className="h-4 w-4 shrink-0" />
                             Record
                           </TabsTrigger>
                           {platform.metadata.isTauri && isSystemAudioSupported && (
                             <TabsTrigger value="system" className="flex items-center gap-2">
-                              <Monitor className="h-4 w-4 shrink-0" />
+                              <HugeiconsIcon icon={DeskIcon} size={16} className="h-4 w-4 shrink-0" />
                               System Audio
                             </TabsTrigger>
                           )}
@@ -798,7 +799,7 @@ export function ProfileForm() {
                                     className="h-full w-full object-cover"
                                   />
                                 ) : (
-                                  <Mic className="h-10 w-10 text-muted-foreground" />
+                                  <HugeiconsIcon icon={Mic01Icon} size={40} className="h-10 w-10 text-muted-foreground" />
                                 )}
                               </div>
                               <button
@@ -806,7 +807,7 @@ export function ProfileForm() {
                                 onClick={() => avatarInputRef.current?.click()}
                                 className="absolute inset-0 rounded-full bg-accent/60 opacity-0 group-hover:opacity-100 transition-opacity flex items-center justify-center cursor-pointer"
                               >
-                                <Edit2 className="h-6 w-6 text-accent-foreground" />
+                                <HugeiconsIcon icon={Edit02Icon} size={24} className="h-6 w-6 text-accent-foreground" />
                               </button>
                               {(avatarPreview || editingProfile?.avatar_path) && (
                                 <button
@@ -815,7 +816,7 @@ export function ProfileForm() {
                                   disabled={deleteAvatar.isPending}
                                   className="absolute bottom-0 right-0 h-6 w-6 rounded-full bg-background/60 backdrop-blur-sm text-muted-foreground flex items-center justify-center hover:bg-background/80 hover:text-foreground transition-colors shadow-sm border border-border/50"
                                 >
-                                  <X className="h-3.5 w-3.5" />
+                                  <HugeiconsIcon icon={Cancel01Icon} size={14} className="h-3.5 w-3.5" />
                                 </button>
                               )}
                             </div>
diff --git a/app/src/components/VoiceProfiles/ProfileList.tsx b/app/src/components/VoiceProfiles/ProfileList.tsx
index 8dcb06a4..4e57bfdb 100644
--- a/app/src/components/VoiceProfiles/ProfileList.tsx
+++ b/app/src/components/VoiceProfiles/ProfileList.tsx
@@ -1,4 +1,5 @@
-import { Mic, Sparkles } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Mic01Icon, SparklesIcon } from '@hugeicons/core-free-icons';
 import { Button } from '@/components/ui/button';
 import { Card, CardContent } from '@/components/ui/card';
 import { useProfiles } from '@/lib/hooks/useProfiles';
@@ -30,12 +31,12 @@ export function ProfileList() {
         {allProfiles.length === 0 ? (
           <Card>
             <CardContent className="flex flex-col items-center justify-center py-12">
-              <Mic className="h-12 w-12 text-muted-foreground mb-4" />
+              <HugeiconsIcon icon={Mic01Icon} size={48} className="h-12 w-12 text-muted-foreground mb-4" />
               <p className="text-muted-foreground mb-4">
                 No voice profiles yet. Create your first profile to get started.
               </p>
               <Button onClick={() => setDialogOpen(true)}>
-                <Sparkles className="mr-2 h-4 w-4" />
+                <HugeiconsIcon icon={SparklesIcon} size={16} className="mr-2 h-4 w-4" />
                 Create Voice
               </Button>
             </CardContent>
diff --git a/app/src/components/VoiceProfiles/SampleList.tsx b/app/src/components/VoiceProfiles/SampleList.tsx
index 19aa1ca8..17664afd 100644
--- a/app/src/components/VoiceProfiles/SampleList.tsx
+++ b/app/src/components/VoiceProfiles/SampleList.tsx
@@ -1,4 +1,5 @@
-import { Check, Edit, Pause, Play, Plus, Trash2, Volume2, X } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { CheckmarkCircle01Icon, Edit01Icon, PauseIcon, PlayIcon, Add01Icon, Delete01Icon, VolumeHighIcon, Cancel01Icon } from '@hugeicons/core-free-icons';
 import { useEffect, useRef, useState } from 'react';
 import { Button } from '@/components/ui/button';
 import { CircleButton } from '@/components/ui/circle-button';
@@ -103,7 +104,7 @@ function MiniSamplePlayer({ audioUrl }: MiniSamplePlayerProps) {
           onClick={handlePlayPause}
           disabled={isLoading}
         >
-          {isPlaying ? <Pause className="h-3.5 w-3.5" /> : <Play className="h-3.5 w-3.5 ml-0.5" />}
+          {isPlaying ? <HugeiconsIcon icon={PauseIcon} size={14} className="h-3.5 w-3.5" /> : <HugeiconsIcon icon={PlayIcon} size={14} className="h-3.5 w-3.5 ml-0.5" />}
         </Button>
 
         <div className="flex-1 min-w-0 flex items-center gap-2">
@@ -129,7 +130,7 @@ function MiniSamplePlayer({ audioUrl }: MiniSamplePlayerProps) {
           onClick={handleStop}
           title="Stop"
         >
-          <X className="h-3.5 w-3.5" />
+          <HugeiconsIcon icon={Cancel01Icon} size={14} className="h-3.5 w-3.5" />
         </Button>
       </div>
     </div>
@@ -209,7 +210,7 @@ export function SampleList({ profileId }: SampleListProps) {
     <div className="space-y-4 pt-4">
       {samples && samples.length === 0 ? (
         <div className="flex flex-col items-center justify-center py-8 text-center border border-dashed rounded-lg">
-          <Volume2 className="h-8 w-8 text-muted-foreground/50 mb-2" />
+          <HugeiconsIcon icon={VolumeHighIcon} size={32} className="h-8 w-8 text-muted-foreground/50 mb-2" />
           <p className="text-sm text-muted-foreground">No samples yet</p>
           <p className="text-xs text-muted-foreground/70 mt-1">
             Add your first audio sample to get started
@@ -232,7 +233,7 @@ export function SampleList({ profileId }: SampleListProps) {
                   /* Edit Mode */
                   <div className="p-4 space-y-3">
                     <div className="flex items-center gap-2 text-xs text-muted-foreground mb-2">
-                      <Edit className="h-3 w-3" />
+                      <HugeiconsIcon icon={Edit01Icon} size={12} className="h-3 w-3" />
                       <span>Editing transcription</span>
                     </div>
                     <Textarea
@@ -250,7 +251,7 @@ export function SampleList({ profileId }: SampleListProps) {
                         onClick={handleCancelEdit}
                         disabled={updateSample.isPending}
                       >
-                        <X className="h-4 w-4 mr-1" />
+                        <HugeiconsIcon icon={Cancel01Icon} size={16} className="h-4 w-4 mr-1" />
                         Cancel
                       </Button>
                       <Button
@@ -259,7 +260,7 @@ export function SampleList({ profileId }: SampleListProps) {
                         onClick={() => handleSaveEdit(sample.id)}
                         disabled={updateSample.isPending}
                       >
-                        <Check className="h-4 w-4 mr-1" />
+                        <HugeiconsIcon icon={CheckmarkCircle01Icon} size={16} className="h-4 w-4 mr-1" />
                         {updateSample.isPending ? 'Saving...' : 'Save'}
                       </Button>
                     </div>
@@ -278,12 +279,12 @@ export function SampleList({ profileId }: SampleListProps) {
                       {/* Action Buttons */}
                       <div className="shrink-0 flex items-center gap-0.5 opacity-0 group-hover:opacity-100 transition-opacity">
                         <CircleButton
-                          icon={Edit}
+                          icon={(props) => <HugeiconsIcon icon={Edit01Icon} size={14} {...props} />}
                           title="Edit transcription"
                           onClick={() => handleStartEdit(sample.id, sample.reference_text)}
                         />
                         <CircleButton
-                          icon={Trash2}
+                          icon={(props) => <HugeiconsIcon icon={Delete01Icon} size={14} {...props} />}
                           title="Delete sample"
                           onClick={() => handleDeleteClick(sample.id)}
                           disabled={deleteSample.isPending}
@@ -312,7 +313,7 @@ export function SampleList({ profileId }: SampleListProps) {
         className="w-full"
         onClick={() => setUploadOpen(true)}
       >
-        <Plus className="mr-2 h-4 w-4" />
+        <HugeiconsIcon icon={Add01Icon} size={16} className="mr-2 h-4 w-4" />
         Add Sample
       </Button>
 
diff --git a/app/src/components/VoiceProfiles/SampleUpload.tsx b/app/src/components/VoiceProfiles/SampleUpload.tsx
index 3c53b7d6..a57a27c0 100644
--- a/app/src/components/VoiceProfiles/SampleUpload.tsx
+++ b/app/src/components/VoiceProfiles/SampleUpload.tsx
@@ -1,5 +1,6 @@
 import { zodResolver } from '@hookform/resolvers/zod';
-import { Mic, Monitor, Upload } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Mic01Icon, DeskIcon, Upload01Icon } from '@hugeicons/core-free-icons';
 import { useEffect, useState } from 'react';
 import { useForm } from 'react-hook-form';
 import * as z from 'zod';
@@ -236,16 +237,16 @@ export function SampleUpload({ profileId, open, onOpenChange }: SampleUploadProp
                 className={`grid w-full ${platform.metadata.isTauri && isSystemAudioSupported ? 'grid-cols-3' : 'grid-cols-2'}`}
               >
                 <TabsTrigger value="upload" className="flex items-center gap-2">
-                  <Upload className="h-4 w-4 shrink-0" />
+                  <HugeiconsIcon icon={Upload01Icon} size={16} className="h-4 w-4 shrink-0" />
                   Upload
                 </TabsTrigger>
                 <TabsTrigger value="record" className="flex items-center gap-2">
-                  <Mic className="h-4 w-4 shrink-0" />
+                  <HugeiconsIcon icon={Mic01Icon} size={16} className="h-4 w-4 shrink-0" />
                   Record
                 </TabsTrigger>
                 {platform.metadata.isTauri && isSystemAudioSupported && (
                   <TabsTrigger value="system" className="flex items-center gap-2">
-                    <Monitor className="h-4 w-4 shrink-0" />
+                    <HugeiconsIcon icon={DeskIcon} size={16} className="h-4 w-4 shrink-0" />
                     System Audio
                   </TabsTrigger>
                 )}
diff --git a/app/src/components/VoicesTab/VoicesTab.tsx b/app/src/components/VoicesTab/VoicesTab.tsx
index 12fedef5..f1b34fa3 100644
--- a/app/src/components/VoicesTab/VoicesTab.tsx
+++ b/app/src/components/VoicesTab/VoicesTab.tsx
@@ -1,5 +1,6 @@
 import { useQuery, useQueryClient } from '@tanstack/react-query';
-import { Edit, MoreHorizontal, Plus, Trash2, Mic } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Edit01Icon, MoreHorizontalIcon, Add01Icon, Delete01Icon } from '@hugeicons/core-free-icons';
 import { useMemo, useRef } from 'react';
 import { Button } from '@/components/ui/button';
 import {
@@ -18,6 +19,7 @@ import {
   TableRow,
 } from '@/components/ui/table';
 import { ProfileForm } from '@/components/VoiceProfiles/ProfileForm';
+import { ProfileAvatar } from '@/components/VoiceProfiles/ProfileAvatar';
 import { apiClient } from '@/lib/api/client';
 import type { VoiceProfileResponse } from '@/lib/api/types';
 import { BOTTOM_SAFE_AREA_PADDING } from '@/lib/constants/ui';
@@ -112,7 +114,7 @@ export function VoicesTab() {
         <div className="flex items-center justify-between mb-6">
           <h1 className="text-2xl font-bold">Voices</h1>
           <Button onClick={() => setDialogOpen(true)}>
-            <Plus className="h-4 w-4 mr-2" />
+            <HugeiconsIcon icon={Add01Icon} size={16} className="h-4 w-4 mr-2" />
             New Voice
           </Button>
         </div>
@@ -184,9 +186,12 @@ function VoiceRow({
     <TableRow className="cursor-pointer" onClick={onEdit}>
       <TableCell>
         <div className="flex items-center gap-2">
-          <div className="h-8 w-8 rounded-lg bg-muted flex items-center justify-center shrink-0">
-            <Mic className="h-4 w-4 text-muted-foreground" />
-          </div>
+          <ProfileAvatar
+            profileId={profile.id}
+            avatarPath={profile.avatar_path}
+            size="md"
+            alt={`${profile.name} avatar`}
+          />
           <div>
             <div className="font-medium">{profile.name}</div>
             {profile.description && (
@@ -214,16 +219,16 @@ function VoiceRow({
         <DropdownMenu>
           <DropdownMenuTrigger asChild>
             <Button variant="ghost" size="icon">
-              <MoreHorizontal className="h-4 w-4" />
+              <HugeiconsIcon icon={MoreHorizontalIcon} size={16} className="h-4 w-4" />
             </Button>
           </DropdownMenuTrigger>
           <DropdownMenuContent>
             <DropdownMenuItem onClick={onEdit}>
-              <Edit className="h-4 w-4 mr-2" />
+              <HugeiconsIcon icon={Edit01Icon} size={16} className="h-4 w-4 mr-2" />
               Edit
             </DropdownMenuItem>
             <DropdownMenuItem onClick={onDelete} className="text-destructive">
-              <Trash2 className="h-4 w-4 mr-2" />
+              <HugeiconsIcon icon={Delete01Icon} size={16} className="h-4 w-4 mr-2" />
               Delete
             </DropdownMenuItem>
           </DropdownMenuContent>
diff --git a/app/src/components/ui/checkbox.tsx b/app/src/components/ui/checkbox.tsx
index f423fef0..303fe26d 100644
--- a/app/src/components/ui/checkbox.tsx
+++ b/app/src/components/ui/checkbox.tsx
@@ -1,5 +1,6 @@
 import * as React from 'react';
-import { Check } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { CheckmarkCircle01Icon } from '@hugeicons/core-free-icons';
 import { cn } from '@/lib/utils/cn';
 
 export interface CheckboxProps {
@@ -34,7 +35,7 @@ const Checkbox = React.forwardRef<HTMLButtonElement, CheckboxProps>(
         )}
         {...props}
       >
-        {checked && <Check className="h-3 w-3 text-accent-foreground" />}
+        {checked && <HugeiconsIcon icon={CheckmarkCircle01Icon} size={12} className="h-3 w-3 text-accent-foreground" />}
       </button>
     );
   },
diff --git a/app/src/components/ui/dialog.tsx b/app/src/components/ui/dialog.tsx
index 5fe10944..14a38c3a 100644
--- a/app/src/components/ui/dialog.tsx
+++ b/app/src/components/ui/dialog.tsx
@@ -1,5 +1,6 @@
 import * as DialogPrimitive from '@radix-ui/react-dialog';
-import { X } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Cancel01Icon } from '@hugeicons/core-free-icons';
 import * as React from 'react';
 import { cn } from '@/lib/utils/cn';
 
@@ -42,7 +43,7 @@ const DialogContent = React.forwardRef<
     >
       {children}
       <DialogPrimitive.Close className="absolute right-4 top-4 rounded-sm opacity-70 ring-offset-background transition-opacity hover:opacity-100 focus:outline-none focus:ring-2 focus:ring-ring focus:ring-offset-2 disabled:pointer-events-none data-[state=open]:bg-accent data-[state=open]:text-muted-foreground">
-        <X className="h-4 w-4" />
+        <HugeiconsIcon icon={Cancel01Icon} size={16} className="h-4 w-4" />
         <span className="sr-only">Close</span>
       </DialogPrimitive.Close>
     </DialogPrimitive.Content>
diff --git a/app/src/components/ui/dropdown-menu.tsx b/app/src/components/ui/dropdown-menu.tsx
index d59c291c..7a878f99 100644
--- a/app/src/components/ui/dropdown-menu.tsx
+++ b/app/src/components/ui/dropdown-menu.tsx
@@ -1,6 +1,7 @@
-import * as React from 'react';
+import { MoreHorizontalIcon } from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
 import * as DropdownMenuPrimitive from '@radix-ui/react-dropdown-menu';
-import { MoreHorizontal } from 'lucide-react';
+import * as React from 'react';
 import { cn } from '@/lib/utils/cn';
 
 const DropdownMenu = DropdownMenuPrimitive.Root;
@@ -26,7 +27,7 @@ const DropdownMenuSubTrigger = React.forwardRef<
     {...props}
   >
     {children}
-    <MoreHorizontal className="ml-auto h-4 w-4" />
+    <HugeiconsIcon icon={MoreHorizontalIcon} size={16} className="ml-auto h-4 w-4" />
   </DropdownMenuPrimitive.SubTrigger>
 ));
 DropdownMenuSubTrigger.displayName = DropdownMenuPrimitive.SubTrigger.displayName;
@@ -73,7 +74,7 @@ const DropdownMenuItem = React.forwardRef<
   <DropdownMenuPrimitive.Item
     ref={ref}
     className={cn(
-      'relative flex cursor-default select-none items-center rounded-sm px-2 py-1.5 text-sm outline-none transition-colors focus:bg-accent focus:text-accent-foreground data-[disabled]:pointer-events-none data-[disabled]:opacity-50',
+      'relative flex cursor-default select-none items-center rounded-sm px-2 py-1.5 text-sm outline-none focus:bg-accent focus:text-accent-foreground data-[disabled]:pointer-events-none data-[disabled]:opacity-50',
       inset && 'pl-8',
       className,
     )}
@@ -97,7 +98,7 @@ const DropdownMenuCheckboxItem = React.forwardRef<
   >
     <span className="absolute left-2 flex h-3.5 w-3.5 items-center justify-center">
       <DropdownMenuPrimitive.ItemIndicator>
-        <MoreHorizontal className="h-4 w-4" />
+        <HugeiconsIcon icon={MoreHorizontalIcon} size={16} className="h-4 w-4" />
       </DropdownMenuPrimitive.ItemIndicator>
     </span>
     {children}
@@ -119,7 +120,7 @@ const DropdownMenuRadioItem = React.forwardRef<
   >
     <span className="absolute left-2 flex h-3.5 w-3.5 items-center justify-center">
       <DropdownMenuPrimitive.ItemIndicator>
-        <MoreHorizontal className="h-2 w-2 fill-current" />
+        <HugeiconsIcon icon={MoreHorizontalIcon} size={8} className="h-2 w-2 fill-current" />
       </DropdownMenuPrimitive.ItemIndicator>
     </span>
     {children}
@@ -154,7 +155,9 @@ const DropdownMenuSeparator = React.forwardRef<
 DropdownMenuSeparator.displayName = DropdownMenuPrimitive.Separator.displayName;
 
 const DropdownMenuShortcut = ({ className, ...props }: React.HTMLAttributes<HTMLSpanElement>) => {
-  return <span className={cn('ml-auto text-xs tracking-widest opacity-60', className)} {...props} />;
+  return (
+    <span className={cn('ml-auto text-xs tracking-widest opacity-60', className)} {...props} />
+  );
 };
 DropdownMenuShortcut.displayName = 'DropdownMenuShortcut';
 
diff --git a/app/src/components/ui/multi-select.tsx b/app/src/components/ui/multi-select.tsx
index 0f3ffb5e..d807c23b 100644
--- a/app/src/components/ui/multi-select.tsx
+++ b/app/src/components/ui/multi-select.tsx
@@ -1,5 +1,6 @@
 import * as React from 'react';
-import { ChevronDown, Check } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { ArrowDown01Icon, CheckmarkCircle01Icon } from '@hugeicons/core-free-icons';
 import { cn } from '@/lib/utils/cn';
 import {
   DropdownMenu,
@@ -36,7 +37,7 @@ const MultiSelectCheckboxItem = React.forwardRef<
   >
     <span className="absolute left-2 flex h-3.5 w-3.5 items-center justify-center">
       <DropdownMenuPrimitive.ItemIndicator>
-        <Check className="h-4 w-4" />
+        <HugeiconsIcon icon={CheckmarkCircle01Icon} size={16} className="h-4 w-4" />
       </DropdownMenuPrimitive.ItemIndicator>
     </span>
     {children}
@@ -78,7 +79,7 @@ export function MultiSelect({
           )}
         >
           <span className="line-clamp-1">{displayText}</span>
-          <ChevronDown className="h-4 w-4 opacity-50" />
+          <HugeiconsIcon icon={ArrowDown01Icon} size={16} className="h-4 w-4 opacity-50" />
         </button>
       </DropdownMenuTrigger>
       <DropdownMenuContent
diff --git a/app/src/components/ui/radio-group.tsx b/app/src/components/ui/radio-group.tsx
new file mode 100644
index 00000000..a04aa433
--- /dev/null
+++ b/app/src/components/ui/radio-group.tsx
@@ -0,0 +1,43 @@
+'use client';
+
+import { CircleIcon } from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
+import * as RadioGroupPrimitive from '@radix-ui/react-radio-group';
+import * as React from 'react';
+
+import { cn } from '@/lib/utils/cn';
+/** Radix radio-group root; defaults to `grid gap-2` classes and forwards `ref` and other props. */
+const RadioGroup = React.forwardRef<
+  React.ElementRef<typeof RadioGroupPrimitive.Root>,
+  React.ComponentPropsWithoutRef<typeof RadioGroupPrimitive.Root>
+>(({ className, ...props }, ref) => {
+  return <RadioGroupPrimitive.Root className={cn('grid gap-2', className)} {...props} ref={ref} />;
+});
+RadioGroup.displayName = RadioGroupPrimitive.Root.displayName;
+/** Radix radio item (`h-4 w-4`, `rounded-full`); its indicator renders `CircleIcon` at size 10. */
+const RadioGroupItem = React.forwardRef<
+  React.ElementRef<typeof RadioGroupPrimitive.Item>,
+  React.ComponentPropsWithoutRef<typeof RadioGroupPrimitive.Item>
+>(({ className, ...props }, ref) => {
+  return (
+    <RadioGroupPrimitive.Item
+      ref={ref}
+      className={cn(
+        'aspect-square h-4 w-4 rounded-full border border-accent text-accent ring-offset-background focus:outline-none focus-visible:ring-2 focus-visible:ring-ring focus-visible:ring-offset-2 disabled:cursor-not-allowed disabled:opacity-50',
+        className,
+      )}
+      {...props}
+    >
+      <RadioGroupPrimitive.Indicator className="flex items-center justify-center">
+        <HugeiconsIcon
+          icon={CircleIcon}
+          size={10}
+          className="h-2.5 w-2.5 fill-current text-current"
+        />
+      </RadioGroupPrimitive.Indicator>
+    </RadioGroupPrimitive.Item>
+  );
+});
+RadioGroupItem.displayName = RadioGroupPrimitive.Item.displayName;
+
+export { RadioGroup, RadioGroupItem };
diff --git a/app/src/components/ui/select.tsx b/app/src/components/ui/select.tsx
index 4a1949fc..2f88e528 100644
--- a/app/src/components/ui/select.tsx
+++ b/app/src/components/ui/select.tsx
@@ -1,5 +1,6 @@
 import * as SelectPrimitive from '@radix-ui/react-select';
-import { Check, ChevronDown, ChevronUp } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { CheckmarkCircle01Icon, ArrowDown01Icon, ArrowUp01Icon } from '@hugeicons/core-free-icons';
 import * as React from 'react';
 import { cn } from '@/lib/utils/cn';
 
@@ -23,7 +24,7 @@ const SelectTrigger = React.forwardRef<
   >
     {children}
     <SelectPrimitive.Icon asChild>
-      <ChevronDown className="h-4 w-4 opacity-50" />
+      <HugeiconsIcon icon={ArrowDown01Icon} size={16} className="h-4 w-4 opacity-50" />
     </SelectPrimitive.Icon>
   </SelectPrimitive.Trigger>
 ));
@@ -38,7 +39,7 @@ const SelectScrollUpButton = React.forwardRef<
     className={cn('flex cursor-default items-center justify-center py-1', className)}
     {...props}
   >
-    <ChevronUp className="h-4 w-4" />
+    <HugeiconsIcon icon={ArrowUp01Icon} size={16} className="h-4 w-4" />
   </SelectPrimitive.ScrollUpButton>
 ));
 SelectScrollUpButton.displayName = SelectPrimitive.ScrollUpButton.displayName;
@@ -52,7 +53,7 @@ const SelectScrollDownButton = React.forwardRef<
     className={cn('flex cursor-default items-center justify-center py-1', className)}
     {...props}
   >
-    <ChevronDown className="h-4 w-4" />
+    <HugeiconsIcon icon={ArrowDown01Icon} size={16} className="h-4 w-4" />
   </SelectPrimitive.ScrollDownButton>
 ));
 SelectScrollDownButton.displayName = SelectPrimitive.ScrollDownButton.displayName;
@@ -115,7 +116,7 @@ const SelectItem = React.forwardRef<
   >
     <span className="absolute left-2 flex h-3.5 w-3.5 items-center justify-center">
       <SelectPrimitive.ItemIndicator>
-        <Check className="h-4 w-4" />
+        <HugeiconsIcon icon={CheckmarkCircle01Icon} size={16} className="h-4 w-4" />
       </SelectPrimitive.ItemIndicator>
     </span>
 
diff --git a/app/src/components/ui/toast.tsx b/app/src/components/ui/toast.tsx
index 35150afd..48a8743d 100644
--- a/app/src/components/ui/toast.tsx
+++ b/app/src/components/ui/toast.tsx
@@ -1,6 +1,7 @@
 import * as ToastPrimitives from '@radix-ui/react-toast';
 import { cva, type VariantProps } from 'class-variance-authority';
-import { X } from 'lucide-react';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Cancel01Icon } from '@hugeicons/core-free-icons';
 import * as React from 'react';
 import { cn } from '@/lib/utils/cn';
 
@@ -79,7 +80,7 @@ const ToastClose = React.forwardRef<
     toast-close=""
     {...props}
   >
-    <X className="h-4 w-4" />
+    <HugeiconsIcon icon={Cancel01Icon} size={16} className="h-4 w-4" />
   </ToastPrimitives.Close>
 ));
 ToastClose.displayName = ToastPrimitives.Close.displayName;
diff --git a/app/src/hooks/useAutoUpdater.ts b/app/src/hooks/useAutoUpdater.ts
deleted file mode 100644
index 7a9f169a..00000000
--- a/app/src/hooks/useAutoUpdater.ts
+++ /dev/null
@@ -1,52 +0,0 @@
-import { useCallback, useEffect, useRef, useState } from 'react';
-import { usePlatform } from '@/platform/PlatformContext';
-import type { UpdateStatus } from '@/platform/types';
-
-// Re-export UpdateStatus for backwards compatibility
-export type { UpdateStatus };
-
-export function useAutoUpdater(checkOnMount = false) {
-  const platform = usePlatform();
-  const [status, setStatus] = useState<UpdateStatus>(platform.updater.getStatus());
-  const hasCheckedRef = useRef(false);
-
-  // Subscribe to updater status changes
-  useEffect(() => {
-    const unsubscribe = platform.updater.subscribe((newStatus) => {
-      setStatus(newStatus);
-    });
-    return unsubscribe;
-    // Empty dependency array - platform is stable from context
-    // eslint-disable-next-line react-hooks/exhaustive-deps
-  }, [platform.updater.subscribe]);
-
-  const checkForUpdates = useCallback(async () => {
-    await platform.updater.checkForUpdates();
-    // eslint-disable-next-line react-hooks/exhaustive-deps
-  }, [platform.updater.checkForUpdates]);
-
-  const downloadAndInstall = useCallback(async () => {
-    await platform.updater.downloadAndInstall();
-    // eslint-disable-next-line react-hooks/exhaustive-deps
-  }, [platform.updater.downloadAndInstall]);
-
-  const restartAndInstall = useCallback(async () => {
-    await platform.updater.restartAndInstall();
-    // eslint-disable-next-line react-hooks/exhaustive-deps
-  }, [platform.updater.restartAndInstall]);
-
-  useEffect(() => {
-    if (checkOnMount && platform.metadata.isTauri && !hasCheckedRef.current) {
-      hasCheckedRef.current = true;
-      checkForUpdates();
-    }
-    // eslint-disable-next-line react-hooks/exhaustive-deps
-  }, [platform.metadata.isTauricheckOnMountcheckForUpdates]);
-
-  return {
-    status,
-    checkForUpdates,
-    downloadAndInstall,
-    restartAndInstall,
-  };
-}
diff --git a/app/src/hooks/useAutoUpdater.tsx b/app/src/hooks/useAutoUpdater.tsx
index 8a6351f6..a7e1e949 100644
--- a/app/src/hooks/useAutoUpdater.tsx
+++ b/app/src/hooks/useAutoUpdater.tsx
@@ -1,4 +1,5 @@
-import { Download, RefreshCw } from 'lucide-react';
+import { Download01Icon, Refresh01Icon } from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
 import { useCallback, useEffect, useRef, useState } from 'react';
 import { Progress } from '@/components/ui/progress';
 import { ToastAction } from '@/components/ui/toast';
@@ -73,7 +74,7 @@ export function useAutoUpdater(options: boolean | UseAutoUpdaterOptions = false)
     }
-    // Empty dependency array - only run once on mount
+    // Re-runs whenever isTauri, checkOnMount, or checkForUpdates changes
     // eslint-disable-next-line react-hooks/exhaustive-deps
-  }, [platform.metadata.isTauricheckOnMountcheckForUpdates]);
+  }, [platform.metadata.isTauri, checkOnMount, checkForUpdates]);
 
   // Show toast when update is available
   useEffect(() => {
@@ -132,7 +133,7 @@ export function useAutoUpdater(options: boolean | UseAutoUpdaterOptions = false)
     toastUpdateRef.current({
       title: (
         <div className="flex items-center gap-2">
-          <Download className="h-4 w-4 animate-pulse" />
+          <HugeiconsIcon icon={Download01Icon} size={16} className="h-4 w-4 animate-pulse" />
           <span>Downloading Update</span>
         </div>
       ),
@@ -174,7 +175,7 @@ export function useAutoUpdater(options: boolean | UseAutoUpdaterOptions = false)
       duration: Infinity,
       action: (
         <ToastAction altText="Restart now" onClick={handleRestartNow}>
-          <RefreshCw className="h-3 w-3 mr-1" />
+          <HugeiconsIcon icon={Refresh01Icon} size={12} className="h-3 w-3 mr-1" />
           Restart Now
         </ToastAction>
       ),
diff --git a/app/src/lib/api/client.ts b/app/src/lib/api/client.ts
index c5b079b2..da64d4ff 100644
--- a/app/src/lib/api/client.ts
+++ b/app/src/lib/api/client.ts
@@ -1,29 +1,30 @@
-import { useServerStore } from '@/stores/serverStore';
 import type { LanguageCode } from '@/lib/constants/languages';
+import { useServerStore } from '@/stores/serverStore';
 import type {
-  VoiceProfileCreate,
-  VoiceProfileResponse,
-  ProfileSampleResponse,
+  ActiveTasksResponse,
+  FolderPathsResponse,
   GenerationRequest,
   GenerationResponse,
-  HistoryQuery,
+  HealthResponse,
   HistoryListResponse,
+  HistoryQuery,
   HistoryResponse,
-  TranscriptionResponse,
-  HealthResponse,
-  ModelStatusListResponse,
   ModelDownloadRequest,
-  ActiveTasksResponse,
+  ModelStatusListResponse,
+  ProfileSampleResponse,
   StoryCreate,
-  StoryResponse,
   StoryDetailResponse,
+  StoryItemBatchUpdate,
   StoryItemCreate,
   StoryItemDetail,
-  StoryItemBatchUpdate,
-  StoryItemReorder,
   StoryItemMove,
-  StoryItemTrim,
+  StoryItemReorder,
   StoryItemSplit,
+  StoryItemTrim,
+  StoryResponse,
+  TranscriptionResponse,
+  VoiceProfileCreate,
+  VoiceProfileResponse,
 } from './types';
 
 class ApiClient {
@@ -57,6 +58,11 @@ class ApiClient {
     return this.request<HealthResponse>('/health');
   }
 
+  // System: requests `/system/folders` and returns the response typed as FolderPathsResponse
+  async getSystemFolders(): Promise<FolderPathsResponse> {
+    return this.request<FolderPathsResponse>('/system/folders');
+  }
+
   // Profiles
   async createProfile(data: VoiceProfileCreate): Promise<VoiceProfileResponse> {
     return this.request<VoiceProfileResponse>('/profiles', {
@@ -199,6 +205,77 @@ class ApiClient {
     });
   }
 
+  // Providers: requests `/providers`; resolves to provider entries plus the `installed` list
+  async listProviders(): Promise<{
+    providers: Array<{
+      type: string;
+      name: string;
+      installed: boolean;
+      size_mb: number | null;
+    }>;
+    installed: string[];
+  }> {
+    return this.request('/providers');
+  }
+  // Requests `/providers/active`; resolves to the provider name with `health` and `status` objects
+  async getActiveProvider(): Promise<{
+    provider: string;
+    health: {
+      status: string;
+      provider: string;
+      version: string | null;
+      model: string | null;
+      device: string | null;
+    };
+    status: {
+      model_loaded: boolean;
+      model_size: string | null;
+      available_sizes: string[];
+      gpu_available: boolean | null;
+      vram_used_mb: number | null;
+    };
+  }> {
+    return this.request('/providers/active');
+  }
+  // Requests `/providers/start` with method POST and a JSON `{ provider_type }` body
+  async startProvider(providerType: string): Promise<{
+    message: string;
+    provider: {
+      status: string;
+      provider: string;
+      version: string | null;
+      model: string | null;
+      device: string | null;
+    };
+  }> {
+    return this.request('/providers/start', {
+      method: 'POST',
+      body: JSON.stringify({ provider_type: providerType }),
+    });
+  }
+  // Requests `/providers/stop` with method POST and no body; resolves to `{ message }`
+  async stopProvider(): Promise<{ message: string }> {
+    return this.request('/providers/stop', {
+      method: 'POST',
+    });
+  }
+  // Requests `/providers/download` with method POST and a JSON `{ provider_type }` body
+  async downloadProvider(providerType: string): Promise<{
+    message: string;
+    provider_type: string;
+  }> {
+    return this.request('/providers/download', {
+      method: 'POST',
+      body: JSON.stringify({ provider_type: providerType }),
+    });
+  }
+  // Requests `/providers/<providerType>` with method DELETE; the type is put into the path as-is
+  async deleteProvider(providerType: string): Promise<{ message: string }> {
+    return this.request(`/providers/${providerType}`, {
+      method: 'DELETE',
+    });
+  }
+
   // History
   async listHistory(query?: HistoryQuery): Promise<HistoryListResponse> {
     const params = new URLSearchParams();
@@ -251,7 +328,15 @@ class ApiClient {
     return response.blob();
   }
 
-  async importGeneration(file: File): Promise<{ id: string; profile_id: string; profile_name: string; text: string; message: string }> {
+  async importGeneration(
+    file: File,
+  ): Promise<{
+    id: string;
+    profile_id: string;
+    profile_name: string;
+    text: string;
+    message: string;
+  }> {
     const url = `${this.getBaseUrl()}/history/import`;
     const formData = new FormData();
     formData.append('file', file);
@@ -310,7 +395,12 @@ class ApiClient {
   }
 
   async triggerModelDownload(modelName: string): Promise<{ message: string }> {
-    console.log('[API] triggerModelDownload called for:', modelName, 'at', new Date().toISOString());
+    console.log(
+      '[API] triggerModelDownload called for:',
+      modelName,
+      'at',
+      new Date().toISOString(),
+    );
     const result = await this.request<{ message: string }>('/models/download', {
       method: 'POST',
       body: JSON.stringify({ model_name: modelName } as ModelDownloadRequest),
@@ -343,10 +433,7 @@ class ApiClient {
     return this.request('/channels');
   }
 
-  async createChannel(data: {
-    name: string;
-    device_ids: string[];
-  }): Promise<{
+  async createChannel(data: { name: string; device_ids: string[] }): Promise<{
     id: string;
     name: string;
     is_default: boolean;
@@ -388,10 +475,7 @@ class ApiClient {
     return this.request(`/channels/${channelId}/voices`);
   }
 
-  async setChannelVoices(
-    channelId: string,
-    profileIds: string[],
-  ): Promise<{ message: string }> {
+  async setChannelVoices(channelId: string, profileIds: string[]): Promise<{ message: string }> {
     return this.request(`/channels/${channelId}/voices`, {
       method: 'PUT',
       body: JSON.stringify({ profile_ids: profileIds }),
@@ -402,10 +486,7 @@ class ApiClient {
     return this.request(`/profiles/${profileId}/channels`);
   }
 
-  async setProfileChannels(
-    profileId: string,
-    channelIds: string[],
-  ): Promise<{ message: string }> {
+  async setProfileChannels(profileId: string, channelIds: string[]): Promise<{ message: string }> {
     return this.request(`/profiles/${profileId}/channels`, {
       method: 'PUT',
       body: JSON.stringify({ channel_ids: channelIds }),
@@ -468,21 +549,33 @@ class ApiClient {
     });
   }
 
-  async moveStoryItem(storyId: string, itemId: string, data: StoryItemMove): Promise<StoryItemDetail> {
+  async moveStoryItem(
+    storyId: string,
+    itemId: string,
+    data: StoryItemMove,
+  ): Promise<StoryItemDetail> {
     return this.request<StoryItemDetail>(`/stories/${storyId}/items/${itemId}/move`, {
       method: 'PUT',
       body: JSON.stringify(data),
     });
   }
 
-  async trimStoryItem(storyId: string, itemId: string, data: StoryItemTrim): Promise<StoryItemDetail> {
+  async trimStoryItem(
+    storyId: string,
+    itemId: string,
+    data: StoryItemTrim,
+  ): Promise<StoryItemDetail> {
     return this.request<StoryItemDetail>(`/stories/${storyId}/items/${itemId}/trim`, {
       method: 'PUT',
       body: JSON.stringify(data),
     });
   }
 
-  async splitStoryItem(storyId: string, itemId: string, data: StoryItemSplit): Promise<StoryItemDetail[]> {
+  async splitStoryItem(
+    storyId: string,
+    itemId: string,
+    data: StoryItemSplit,
+  ): Promise<StoryItemDetail[]> {
     return this.request<StoryItemDetail[]>(`/stories/${storyId}/items/${itemId}/split`, {
       method: 'POST',
       body: JSON.stringify(data),
diff --git a/app/src/lib/api/types.ts b/app/src/lib/api/types.ts
index 131c1be5..717496ea 100644
--- a/app/src/lib/api/types.ts
+++ b/app/src/lib/api/types.ts
@@ -34,6 +34,7 @@ export interface GenerationRequest {
   language: LanguageCode;
   seed?: number;
   model_size?: '1.7B' | '0.6B';
+  instruct?: string;
 }
 
 export interface GenerationResponse {
@@ -127,6 +128,12 @@ export interface ActiveTasksResponse {
   generations: ActiveGenerationTask[];
 }
 
+export interface FolderPathsResponse {
+  data_dir: string; // Absolute path of the application data directory
+  models_dir: string; // Absolute path of the Hugging Face hub cache directory
+  providers_dir: string; // Absolute path of the directory used for providers
+}
+
 export interface StoryCreate {
   name: string;
   description?: string;
diff --git a/app/src/lib/hooks/useGenerationForm.ts b/app/src/lib/hooks/useGenerationForm.ts
index c6fdba50..70955824 100644
--- a/app/src/lib/hooks/useGenerationForm.ts
+++ b/app/src/lib/hooks/useGenerationForm.ts
@@ -91,11 +91,6 @@ export function useGenerationForm(options: UseGenerationFormOptions = {}) {
         instruct: data.instruct || undefined,
       });
 
-      toast({
-        title: 'Generation complete!',
-        description: `Audio generated (${result.duration.toFixed(2)}s)`,
-      });
-
       const audioUrl = apiClient.getAudioUrl(result.id);
       setAudioWithAutoPlay(audioUrl, result.id, selectedProfileId, data.text.substring(0, 50));
 
diff --git a/app/src/lib/hooks/useModelDownloadToast.tsx b/app/src/lib/hooks/useModelDownloadToast.tsx
index 2df221e1..10fb7bdc 100644
--- a/app/src/lib/hooks/useModelDownloadToast.tsx
+++ b/app/src/lib/hooks/useModelDownloadToast.tsx
@@ -1,4 +1,6 @@
-import { CheckCircle2, Loader2, XCircle } from 'lucide-react';
+import { CancelCircleIcon, CheckmarkCircle02Icon } from '@hugeicons/core-free-icons';
+import { HugeiconsIcon } from '@hugeicons/react';
+import { Icon } from '@iconify/react';
 import { useCallback, useEffect, useRef } from 'react';
 import { Progress } from '@/components/ui/progress';
 import { useToast } from '@/components/ui/use-toast';
@@ -59,7 +61,7 @@ export function useModelDownloadToast({
       title: displayName,
       description: (
         <div className="flex items-center gap-2">
-          <Loader2 className="h-4 w-4 animate-spin" />
+          <Icon icon="svg-spinners:ring-resize" className="h-4 w-4 animate-spin" />
           <span>Connecting to download...</span>
         </div>
       ),
@@ -96,19 +98,35 @@ export function useModelDownloadToast({
 
           switch (progress.status) {
             case 'complete':
-              statusIcon = <CheckCircle2 className="h-4 w-4 text-green-500" />;
+              statusIcon = (
+                <HugeiconsIcon
+                  icon={CheckmarkCircle02Icon}
+                  size={16}
+                  className="h-4 w-4 text-green-500"
+                />
+              );
               statusText = 'Download complete';
               break;
             case 'error':
-              statusIcon = <XCircle className="h-4 w-4 text-destructive" />;
+              statusIcon = (
+                <HugeiconsIcon
+                  icon={CancelCircleIcon}
+                  size={16}
+                  className="h-4 w-4 text-destructive"
+                />
+              );
               statusText = `Error: ${progress.error || 'Unknown error'}`;
               break;
             case 'downloading':
-              statusIcon = <Loader2 className="h-4 w-4 animate-spin" />;
+              statusIcon = (
+                <Icon icon="svg-spinners:ring-resize" className="h-4 w-4 animate-spin" />
+              );
               statusText = progress.filename || 'Downloading...';
               break;
             case 'extracting':
-              statusIcon = <Loader2 className="h-4 w-4 animate-spin" />;
+              statusIcon = (
+                <Icon icon="svg-spinners:ring-resize" className="h-4 w-4 animate-spin" />
+              );
               statusText = 'Extracting...';
               break;
           }
@@ -154,7 +172,11 @@ export function useModelDownloadToast({
               toastUpdateRef.current({
                 title: (
                   <div className="flex items-center gap-2">
-                    <CheckCircle2 className="h-4 w-4 text-green-500" />
+                    <HugeiconsIcon
+                      icon={CheckmarkCircle02Icon}
+                      size={16}
+                      className="h-4 w-4 text-green-500"
+                    />
                     <span>{displayName}</span>
                   </div>
                 ),
diff --git a/app/src/lib/hooks/useSystemFolders.ts b/app/src/lib/hooks/useSystemFolders.ts
new file mode 100644
index 00000000..47e92540
--- /dev/null
+++ b/app/src/lib/hooks/useSystemFolders.ts
@@ -0,0 +1,14 @@
+import { useQuery } from '@tanstack/react-query';
+import { apiClient } from '@/lib/api/client';
+import { useServerStore } from '@/stores/serverStore';
+
+export function useSystemFolders() {
+  const serverUrl = useServerStore((state) => state.serverUrl);
+  // serverUrl is part of the query key, so results are cached separately per server URL.
+  return useQuery({
+    queryKey: ['system', 'folders', serverUrl],
+    queryFn: () => apiClient.getSystemFolders(),
+    staleTime: 60000, // Cache for 1 minute - folder paths don't change often
+    retry: 1, // Retry a failed request once before surfacing the error
+  });
+}
diff --git a/app/src/platform/types.ts b/app/src/platform/types.ts
index 5ea4d609..6d724fd8 100644
--- a/app/src/platform/types.ts
+++ b/app/src/platform/types.ts
@@ -10,6 +10,13 @@ export interface FileFilter {
 
 export interface PlatformFilesystem {
   saveFile(filename: string, blob: Blob, filters?: FileFilter[]): Promise<void>;
+  /**
+   * Open a folder in the native file explorer.
+   * On web, this is a no-op since browsers cannot open folders.
+   * @param path - The absolute path to the folder to open
+   * @returns true if the folder was opened, false if not supported
+   */
+  openFolder(path: string): Promise<boolean>;
 }
 
 export interface UpdateStatus {
diff --git a/backend/__init__.py b/backend/__init__.py
index e75772bd..36b3fee7 100644
--- a/backend/__init__.py
+++ b/backend/__init__.py
@@ -1,3 +1,3 @@
 # Backend package
 
-__version__ = "0.1.12"
+__version__ = "0.1.13"
diff --git a/backend/backends/__init__.py b/backend/backends/__init__.py
index f7c47ba9..5f0c9b7e 100644
--- a/backend/backends/__init__.py
+++ b/backend/backends/__init__.py
@@ -118,22 +118,37 @@ def is_loaded(self) -> bool:
 def get_tts_backend() -> TTSBackend:
     """
     Get or create TTS backend instance based on platform.
-    
+
     Returns:
         TTS backend instance (MLX or PyTorch)
+
+    Raises:
+        ImportError: If required dependencies (mlx or torch) are not available
     """
     global _tts_backend
-    
+
     if _tts_backend is None:
         backend_type = get_backend_type()
-        
+
         if backend_type == "mlx":
-            from .mlx_backend import MLXTTSBackend
-            _tts_backend = MLXTTSBackend()
+            try:
+                from .mlx_backend import MLXTTSBackend
+                _tts_backend = MLXTTSBackend()
+            except ImportError as e:
+                raise ImportError(
+                    f"MLX backend dependencies not available. "
+                    f"Please install mlx and mlx_audio or download a provider. Error: {e}"
+                )
         else:
-            from .pytorch_backend import PyTorchTTSBackend
-            _tts_backend = PyTorchTTSBackend()
-    
+            try:
+                from .pytorch_backend import PyTorchTTSBackend
+                _tts_backend = PyTorchTTSBackend()
+            except ImportError as e:
+                raise ImportError(
+                    f"PyTorch backend dependencies not available. "
+                    f"Please download a TTS provider (pytorch-cpu or pytorch-cuda) from the Downloads page. Error: {e}"
+                )
+
     return _tts_backend
 
 
diff --git a/backend/build_binary.py b/backend/build_binary.py
index a2973cd4..df96f5dc 100644
--- a/backend/build_binary.py
+++ b/backend/build_binary.py
@@ -30,7 +30,7 @@ def build_server():
         args.extend(['--paths', str(qwen_tts_path)])
         print(f"Using local qwen_tts source from: {qwen_tts_path}")
 
-    # Add common hidden imports
+    # Add common hidden imports (always included)
     args.extend([
         '--hidden-import', 'backend',
         '--hidden-import', 'backend.main',
@@ -42,38 +42,42 @@ def build_server():
         '--hidden-import', 'backend.tts',
         '--hidden-import', 'backend.transcribe',
         '--hidden-import', 'backend.platform_detect',
-        '--hidden-import', 'backend.backends',
-        '--hidden-import', 'backend.backends.pytorch_backend',
+        '--hidden-import', 'backend.providers',
+        '--hidden-import', 'backend.providers.base',
+        '--hidden-import', 'backend.providers.bundled',
+        '--hidden-import', 'backend.providers.types',
         '--hidden-import', 'backend.utils.audio',
         '--hidden-import', 'backend.utils.cache',
         '--hidden-import', 'backend.utils.progress',
         '--hidden-import', 'backend.utils.hf_progress',
         '--hidden-import', 'backend.utils.validation',
-        '--hidden-import', 'torch',
-        '--hidden-import', 'transformers',
+        '--hidden-import', 'numpy',
+        '--hidden-import', 'numpy.core',
+        '--hidden-import', 'numpy.core._multiarray_umath',
+        '--hidden-import', 'scipy',
+        '--hidden-import', 'scipy.signal',
         '--hidden-import', 'fastapi',
         '--hidden-import', 'uvicorn',
         '--hidden-import', 'sqlalchemy',
         '--hidden-import', 'librosa',
         '--hidden-import', 'soundfile',
-        '--hidden-import', 'qwen_tts',
-        '--hidden-import', 'qwen_tts.inference',
-        '--hidden-import', 'qwen_tts.inference.qwen3_tts_model',
-        '--hidden-import', 'qwen_tts.inference.qwen3_tts_tokenizer',
-        '--hidden-import', 'qwen_tts.core',
-        '--hidden-import', 'qwen_tts.cli',
-        '--copy-metadata', 'qwen-tts',
-        '--collect-submodules', 'qwen_tts',
-        '--collect-data', 'qwen_tts',
         # Fix for pkg_resources and jaraco namespace packages
         '--hidden-import', 'pkg_resources.extern',
         '--collect-submodules', 'jaraco',
+        # Asyncio and threading support for PyInstaller
+        '--hidden-import', 'asyncio',
+        '--hidden-import', 'asyncio.subprocess',
+        '--hidden-import', 'concurrent.futures',
+        '--hidden-import', 'concurrent.futures.thread',
     ])
 
-    # Add MLX-specific imports if building on Apple Silicon
+    # Platform-specific TTS backend handling
+    system = platform.system()
+
     if is_apple_silicon():
-        print("Building for Apple Silicon - including MLX dependencies")
+        print("Building for Apple Silicon - including MLX dependencies (bundled)")
         args.extend([
+            '--hidden-import', 'backend.backends',
             '--hidden-import', 'backend.backends.mlx_backend',
             '--hidden-import', 'mlx',
             '--hidden-import', 'mlx.core',
@@ -87,8 +91,31 @@ def build_server():
             '--collect-data', 'mlx',
             '--collect-data', 'mlx_audio',
         ])
+    elif system == "Windows" or (system == "Darwin" and not is_apple_silicon()):
+        # Windows and Intel macOS: Bundle PyTorch CPU provider
+        print(f"Building for {system} - including PyTorch CPU provider (bundled)")
+        args.extend([
+            '--hidden-import', 'backend.backends',
+            '--hidden-import', 'backend.backends.pytorch_backend',
+            '--hidden-import', 'torch',
+            '--hidden-import', 'transformers',
+            '--hidden-import', 'qwen_tts',
+            '--hidden-import', 'qwen_tts.inference',
+            '--hidden-import', 'qwen_tts.inference.qwen3_tts_model',
+            '--hidden-import', 'qwen_tts.inference.qwen3_tts_tokenizer',
+            '--hidden-import', 'qwen_tts.core',
+            '--hidden-import', 'qwen_tts.cli',
+            '--copy-metadata', 'qwen-tts',
+            '--collect-submodules', 'qwen_tts',
+            '--collect-data', 'qwen_tts',
+        ])
     else:
-        print("Building for non-Apple Silicon platform - PyTorch only")
+        # Linux: No bundled provider - users download providers separately
+        print("Building for Linux - no bundled provider (users download separately)")
+        args.extend([
+            '--hidden-import', 'backend.backends',
+            '--hidden-import', 'backend.backends.pytorch_backend',
+        ])
 
     args.extend([
         '--noconfirm',
diff --git a/backend/main.py b/backend/main.py
index 59fb9e18..c74ae460 100644
--- a/backend/main.py
+++ b/backend/main.py
@@ -14,7 +14,6 @@
 import asyncio
 import uvicorn
 import argparse
-import torch
 import tempfile
 import io
 from pathlib import Path
@@ -23,12 +22,22 @@
 import signal
 import os
 
+# Optional torch import - not available on all platforms (e.g. Windows/Linux without bundled provider)
+try:
+    import torch
+    TORCH_AVAILABLE = True
+except ImportError:
+    torch = None  # type: ignore
+    TORCH_AVAILABLE = False
+
 from . import database, models, profiles, history, tts, transcribe, config, export_import, channels, stories, __version__
 from .database import get_db, Generation as DBGeneration, VoiceProfile as DBVoiceProfile
 from .utils.progress import get_progress_manager
 from .utils.tasks import get_task_manager
 from .utils.cache import clear_voice_prompt_cache
 from .platform_detect import get_backend_type
+from .providers import get_provider_manager
+from .providers.types import ProviderType
 
 app = FastAPI(
     title="voicebox API",
@@ -50,10 +59,8 @@
 # ROOT & HEALTH ENDPOINTS
 # ============================================
 
-@app.get("/")
-async def root():
-    """Root endpoint."""
-    return {"message": "voicebox API", "version": __version__}
+# Root endpoint removed - web UI served at / instead
+# API info available at /health
 
 
 @app.post("/shutdown")
@@ -67,23 +74,48 @@ async def shutdown_async():
     return {"message": "Shutting down..."}
 
 
+@app.get("/system/folders", response_model=models.FolderPathsResponse)
+async def get_system_folders():
+    """Get system folder paths for data, models, and providers."""
+    from huggingface_hub import constants as hf_constants
+    from .providers.installer import _get_providers_dir
+    
+    return models.FolderPathsResponse(
+        data_dir=str(config.get_data_dir().absolute()),
+        models_dir=str(Path(hf_constants.HF_HUB_CACHE).absolute()),
+        providers_dir=str(_get_providers_dir().absolute()),
+    )
+
+
 @app.get("/health", response_model=models.HealthResponse)
 async def health():
     """Health check endpoint."""
-    from huggingface_hub import hf_hub_download, constants as hf_constants
+    from huggingface_hub import constants as hf_constants
     from pathlib import Path
-    import os
 
-    tts_model = tts.get_tts_model()
+    # Try to get TTS model provider, but it may not be available if dependencies aren't installed
+    tts_model = None
+    try:
+        tts_model = await tts.get_tts_model_async()
+    except ImportError as e:
+        # Provider dependencies not available (e.g., PyTorch not bundled on this platform)
+        # This is expected on Windows/Linux builds without a bundled provider
+        print(f"Provider not available: {e}")
+
     backend_type = get_backend_type()
 
     # Check for GPU availability (CUDA or MPS)
-    has_cuda = torch.cuda.is_available()
-    has_mps = hasattr(torch.backends, 'mps') and torch.backends.mps.is_available()
+    # PyTorch might not be available if no provider is bundled
+    has_cuda = False
+    has_mps = False
+    if TORCH_AVAILABLE and torch is not None:
+        has_cuda = torch.cuda.is_available()
+        has_mps = hasattr(torch.backends, 'mps') and torch.backends.mps.is_available()
+
     gpu_available = has_cuda or has_mps
 
     gpu_type = None
-    if has_cuda:
+    if has_cuda and torch is not None:
         gpu_type = f"CUDA ({torch.cuda.get_device_name(0)})"
     elif has_mps:
         gpu_type = "MPS (Apple Silicon)"
@@ -91,26 +123,27 @@ async def health():
         gpu_type = "Metal (Apple Silicon via MLX)"
 
     vram_used = None
-    if has_cuda:
+    if has_cuda and torch is not None:
         vram_used = torch.cuda.memory_allocated() / 1024 / 1024  # MB
-    
+
     # Check if model is loaded - use the same logic as model status endpoint
     model_loaded = False
     model_size = None
-    try:
-        # Use the same check as model status endpoint
-        if tts_model.is_loaded():
-            model_loaded = True
-            # Get the actual loaded model size
-            # Check _current_model_size first (more reliable for actually loaded models)
-            model_size = getattr(tts_model, '_current_model_size', None)
-            if not model_size:
-                # Fallback to model_size attribute (which should be set when model loads)
-                model_size = getattr(tts_model, 'model_size', None)
-    except Exception:
-        # If there's an error checking, assume not loaded
-        model_loaded = False
-        model_size = None
+    if tts_model is not None:
+        try:
+            # Use the same check as model status endpoint
+            if tts_model.is_loaded():
+                model_loaded = True
+                # Get the actual loaded model size
+                # Check _current_model_size first (more reliable for actually loaded models)
+                model_size = getattr(tts_model, '_current_model_size', None)
+                if not model_size:
+                    # Fallback to model_size attribute (which should be set when model loads)
+                    model_size = getattr(tts_model, 'model_size', None)
+        except Exception:
+            # If there's an error checking, assume not loaded
+            model_loaded = False
+            model_size = None
     
     # Check if default model is downloaded (cached)
     model_downloaded = None
@@ -549,7 +582,7 @@ async def generate_speech(
         )
         
         # Generate audio
-        tts_model = tts.get_tts_model()
+        tts_model = await tts.get_tts_model_async()
         # Load the requested model size if different from current (async to not block)
         model_size = data.model_size or "1.7B"
 
@@ -1113,8 +1146,8 @@ async def get_sample_audio(sample_id: str, db: Session = Depends(get_db)):
 async def load_model(model_size: str = "1.7B"):
     """Manually load TTS model."""
     try:
-        tts_model = tts.get_tts_model()
-        await tts_model.load_model_async(model_size)
+        tts_model = await tts.get_tts_model_async()
+        await tts_model.load_model(model_size)
         return {"message": f"Model {model_size} loaded successfully"}
     except Exception as e:
         raise HTTPException(status_code=500, detail=str(e))
@@ -1172,10 +1205,10 @@ async def get_model_status():
     except ImportError:
         use_scan_cache = False
     
-    def check_tts_loaded(model_size: str):
+    async def check_tts_loaded(model_size: str):
         """Check if TTS model is loaded with specific size."""
         try:
-            tts_model = tts.get_tts_model()
+            tts_model = await tts.get_tts_model_async()
             return tts_model.is_loaded() and getattr(tts_model, 'model_size', None) == model_size
         except Exception:
             return False
@@ -1211,14 +1244,14 @@ def check_whisper_loaded(model_size: str):
             "display_name": "Qwen TTS 1.7B",
             "hf_repo_id": tts_1_7b_id,
             "model_size": "1.7B",
-            "check_loaded": lambda: check_tts_loaded("1.7B"),
+            "check_loaded": lambda: check_tts_loaded("1.7B"),  # Async function
         },
         {
             "model_name": "qwen-tts-0.6B",
             "display_name": "Qwen TTS 0.6B",
             "hf_repo_id": tts_0_6b_id,
             "model_size": "0.6B",
-            "check_loaded": lambda: check_tts_loaded("0.6B"),
+            "check_loaded": lambda: check_tts_loaded("0.6B"),  # Async function
         },
         {
             "model_name": "whisper-base",
@@ -1356,7 +1389,16 @@ def check_whisper_loaded(model_size: str):
             
             # Check if loaded in memory
             try:
-                loaded = config["check_loaded"]()
+                check_func = config["check_loaded"]
+                if asyncio.iscoroutinefunction(check_func):
+                    loaded = await check_func()
+                else:
+                    result = check_func()
+                    # Handle lambdas that return coroutines
+                    if asyncio.iscoroutine(result):
+                        loaded = await result
+                    else:
+                        loaded = result
             except Exception:
                 loaded = False
             
@@ -1379,7 +1421,16 @@ def check_whisper_loaded(model_size: str):
         except Exception as e:
             # If check fails, try to at least check if loaded
             try:
-                loaded = config["check_loaded"]()
+                check_func = config["check_loaded"]
+                if asyncio.iscoroutinefunction(check_func):
+                    loaded = await check_func()
+                else:
+                    result = check_func()
+                    # Handle lambdas that return coroutines
+                    if asyncio.iscoroutine(result):
+                        loaded = await result
+                    else:
+                        loaded = result
             except Exception:
                 loaded = False
             
@@ -1406,14 +1457,24 @@ async def trigger_model_download(request: models.ModelDownloadRequest):
     task_manager = get_task_manager()
     progress_manager = get_progress_manager()
     
+    async def load_tts_model_1_7b():
+        """Load 1.7B TTS model."""
+        tts_model = await tts.get_tts_model_async()
+        await tts_model.load_model("1.7B")
+    
+    async def load_tts_model_0_6b():
+        """Load 0.6B TTS model."""
+        tts_model = await tts.get_tts_model_async()
+        await tts_model.load_model("0.6B")
+    
     model_configs = {
         "qwen-tts-1.7B": {
             "model_size": "1.7B",
-            "load_func": lambda: tts.get_tts_model().load_model("1.7B"),
+            "load_func": load_tts_model_1_7b,
         },
         "qwen-tts-0.6B": {
             "model_size": "0.6B",
-            "load_func": lambda: tts.get_tts_model().load_model("0.6B"),
+            "load_func": load_tts_model_0_6b,
         },
         "whisper-base": {
             "model_size": "base",
@@ -1472,6 +1533,171 @@ async def download_in_background():
     return {"message": f"Model {request.model_name} download started"}
 
 
+# ============================================
+# PROVIDER ENDPOINTS
+# ============================================
+
+@app.get("/providers")
+async def list_providers():
+    """List all available provider types."""
+    manager = get_provider_manager()
+    installed = await manager.list_installed()
+    
+    # Get info for all known provider types
+    all_providers = [
+        "apple-mlx",
+        "bundled-pytorch",
+        "pytorch-cpu",
+        "pytorch-cuda",
+        "remote",
+        "openai",
+    ]
+    
+    providers_info = []
+    for provider_type in all_providers:
+        info = await manager.get_provider_info(provider_type)
+        providers_info.append(info)
+    
+    return {
+        "providers": providers_info,
+        "installed": installed,
+    }
+
+
+@app.get("/providers/installed")
+async def list_installed_providers():
+    """List installed provider types."""
+    manager = get_provider_manager()
+    installed = await manager.list_installed()
+    return {"installed": installed}
+
+
+@app.get("/providers/active")
+async def get_active_provider():
+    """Get information about the currently active provider."""
+    manager = get_provider_manager()
+    provider = await manager.get_active_provider()
+    
+    health = await provider.health()
+    status = await provider.status()
+    
+    return {
+        "provider": health["provider"],
+        "health": health,
+        "status": status,
+    }
+
+
+@app.post("/providers/start")
+async def start_provider(data: dict):
+    """Start a specific provider."""
+    provider_type = data.get("provider_type")
+    if not provider_type:
+        raise HTTPException(status_code=400, detail="provider_type is required")
+    
+    manager = get_provider_manager()
+    try:
+        await manager.start_provider(provider_type)
+        provider = await manager.get_active_provider()
+        health = await provider.health()
+        return {
+            "message": f"Provider {provider_type} started",
+            "provider": health,
+        }
+    except NotImplementedError as e:
+        raise HTTPException(status_code=501, detail=str(e))
+    except ValueError as e:
+        raise HTTPException(status_code=400, detail=str(e))
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+
+
+@app.post("/providers/stop")
+async def stop_provider():
+    """Stop the currently active provider."""
+    manager = get_provider_manager()
+    await manager.stop_provider()
+    return {"message": "Provider stopped"}
+
+
+@app.post("/providers/download")
+async def download_provider_endpoint(data: dict):
+    """Start downloading a provider binary in the background and return immediately."""
+    from .providers.installer import download_provider
+
+    provider_type = data.get("provider_type")
+    if not provider_type:
+        raise HTTPException(status_code=400, detail="provider_type is required")
+    if provider_type not in ["pytorch-cpu", "pytorch-cuda"]:
+        raise HTTPException(status_code=400, detail=f"Provider type {provider_type} cannot be downloaded")
+
+    try:
+        # The event loop keeps only weak references to tasks, so hold a strong one on
+        # this function until the download finishes; otherwise it may be collected mid-run.
+        pending = download_provider_endpoint.__dict__.setdefault("_pending_downloads", set())
+        task = asyncio.create_task(download_provider(provider_type))
+        pending.add(task)
+        task.add_done_callback(pending.discard)
+        return {
+            "message": f"Provider {provider_type} download started",
+            "provider_type": provider_type,
+        }
+    except Exception as e:
+        raise HTTPException(status_code=500, detail=str(e))
+
+
+@app.get("/providers/download/progress/{provider_type}")
+async def get_provider_download_progress(provider_type: str):
+    """Get provider download progress via Server-Sent Events."""
+    from fastapi.responses import StreamingResponse
+    from .utils.progress import get_progress_manager
+    
+    progress_manager = get_progress_manager()
+    
+    async def event_generator():
+        """Generate SSE events for provider download progress."""
+        import asyncio
+        import json
+        
+        last_progress = None
+        
+        while True:
+            progress = progress_manager.get_progress(provider_type)
+            
+            if progress and progress != last_progress:
+                yield f"data: {json.dumps(progress)}\n\n"
+                last_progress = progress
+                
+                if progress.get("status") in ["complete", "error"]:
+                    break
+            
+            await asyncio.sleep(0.5)
+    
+    return StreamingResponse(event_generator(), media_type="text/event-stream")
+
+
+@app.delete("/providers/{provider_type}")
+async def delete_provider_endpoint(provider_type: str):
+    """Delete an installed provider."""
+    from .providers.installer import delete_provider
+    
+    if provider_type not in ["pytorch-cpu", "pytorch-cuda"]:
+        raise HTTPException(
+            status_code=400,
+            detail=f"Provider type {provider_type} cannot be deleted"
+        )
+    
+    deleted = delete_provider(provider_type)
+    
+    if deleted:
+        return {"message": f"Provider {provider_type} deleted successfully"}
+    else:
+        raise HTTPException(
+            status_code=404,
+            detail=f"Provider {provider_type} not found"
+        )
+
+
 @app.delete("/models/{model_name}")
 async def delete_model(model_name: str):
     """Delete a downloaded model from the HuggingFace cache."""
@@ -1522,9 +1748,9 @@ async def delete_model(model_name: str):
     try:
         # Check if model is loaded and unload it first
         if config["model_type"] == "tts":
-            tts_model = tts.get_tts_model()
-            if tts_model.is_loaded() and tts_model.model_size == config["model_size"]:
-                tts.unload_tts_model()
+            tts_model = await tts.get_tts_model_async()
+            if tts_model.is_loaded() and getattr(tts_model, 'model_size', None) == config["model_size"]:
+                tts_model.unload_model()
         elif config["model_type"] == "whisper":
             whisper_model = transcribe.get_whisper_model()
             if whisper_model.is_loaded() and whisper_model.model_size == config["model_size"]:
@@ -1634,6 +1860,16 @@ async def get_active_tasks():
     )
 
 
+# ============================================
+# WEB UI STATIC FILES
+# ============================================
+
+# Serve web UI at root if dist directory exists
+_web_dist_path = Path(__file__).parent.parent / "web" / "dist"
+if _web_dist_path.exists():
+    app.mount("/", StaticFiles(directory=str(_web_dist_path), html=True), name="web")
+
+
 # ============================================
 # STARTUP & SHUTDOWN
 # ============================================
@@ -1641,11 +1877,12 @@ async def get_active_tasks():
 def _get_gpu_status() -> str:
     """Get GPU availability status."""
     backend_type = get_backend_type()
-    if torch.cuda.is_available():
-        return f"CUDA ({torch.cuda.get_device_name(0)})"
-    elif hasattr(torch.backends, 'mps') and torch.backends.mps.is_available():
-        return "MPS (Apple Silicon)"
-    elif backend_type == "mlx":
+    if TORCH_AVAILABLE and torch is not None:  # CUDA/MPS are only probed when torch is usable
+        if torch.cuda.is_available():
+            return f"CUDA ({torch.cuda.get_device_name(0)})"
+        elif hasattr(torch.backends, 'mps') and torch.backends.mps.is_available():
+            return "MPS (Apple Silicon)"
+    if backend_type == "mlx":  # reached when torch is unusable or reports neither CUDA nor MPS
         return "Metal (Apple Silicon via MLX)"
     return "None (CPU only)"
 
@@ -1684,8 +1921,14 @@ async def shutdown_event():
     """Run on application shutdown."""
     print("voicebox API shutting down...")
     # Unload models to free memory
-    tts.unload_tts_model()
-    transcribe.unload_whisper_model()
+    try:
+        tts.unload_tts_model()
+    except Exception as e:
+        print(f"Warning: Failed to unload TTS model: {e}")
+    try:
+        transcribe.unload_whisper_model()
+    except Exception as e:
+        print(f"Warning: Failed to unload Whisper model: {e}")
 
 
 # ============================================
diff --git a/backend/models.py b/backend/models.py
index 59e45405..0540644e 100644
--- a/backend/models.py
+++ b/backend/models.py
@@ -170,6 +170,13 @@ class ActiveTasksResponse(BaseModel):
     generations: List[ActiveGenerationTask]
 
 
+class FolderPathsResponse(BaseModel):
+    """Response model carrying the data, models and providers folder paths as strings."""
+    data_dir: str
+    models_dir: str
+    providers_dir: str
+
+
 class AudioChannelCreate(BaseModel):
     """Request model for creating an audio channel."""
     name: str = Field(..., min_length=1, max_length=100)
diff --git a/backend/providers/__init__.py b/backend/providers/__init__.py
new file mode 100644
index 00000000..8ad9681d
--- /dev/null
+++ b/backend/providers/__init__.py
@@ -0,0 +1,327 @@
+"""
+Provider management system for TTS providers.
+"""
+
+from typing import Optional
+import asyncio
+import platform
+from pathlib import Path
+
+from .base import TTSProvider
+from .types import ProviderType
+from .bundled import BundledProvider
+from .local import LocalProvider
+from .installer import get_provider_binary_path, _get_providers_dir
+from ..config import get_data_dir
+import subprocess
+import socket
+
+
+class ProviderManager:
+    """Manages TTS provider lifecycle."""
+    
+    def __init__(self):
+        self.active_provider: Optional[TTSProvider] = None  # set by start_provider / get_active_provider
+        self._default_provider: Optional[TTSProvider] = None  # cached BundledProvider, created on demand
+        self._provider_process: Optional[subprocess.Popen] = None  # external provider subprocess, if started
+        self._provider_port: Optional[int] = None  # port handed to that subprocess
+    
+    def _get_default_provider(self) -> TTSProvider:
+        """Return the cached BundledProvider, creating it on the first call."""
+        if self._default_provider is None:
+            self._default_provider = BundledProvider()
+        return self._default_provider
+    
+    async def get_active_provider(self) -> TTSProvider:
+        """
+        Get the currently active provider, selecting the bundled one if none is set.
+        
+        Returns:
+            Active TTS provider instance
+        """
+        if self.active_provider is None:
+            # Default to bundled provider (and remember it as the active one)
+            self.active_provider = self._get_default_provider()
+        return self.active_provider
+    
+    async def start_provider(self, provider_type: str) -> None:
+        """
+        Start a TTS provider and make it the active provider.
+
+        "apple-mlx" selects the bundled provider. "pytorch-cpu" and "pytorch-cuda"
+        launch the installed provider binary as a subprocess on a free port, wait
+        for its health endpoint and then talk to it through a LocalProvider. When
+        no binary is installed, "pytorch-cpu" falls back to the bundled provider
+        and "pytorch-cuda" is rejected.
+
+        A subprocess started by an earlier call is not stopped here; call
+        stop_provider() first when switching providers.
+
+        Args:
+            provider_type: Type of provider to start
+
+        Raises:
+            ValueError: Unknown provider type, or "pytorch-cuda" is not installed
+            NotImplementedError: "remote" and "openai" are not implemented yet
+            TimeoutError: The provider subprocess did not become healthy in time
+        """
+        if provider_type == "apple-mlx":
+            # Use bundled MLX provider
+            self.active_provider = self._get_default_provider()
+        elif provider_type in ["pytorch-cpu", "pytorch-cuda"]:
+            # Try to start external provider subprocess if binary exists
+            provider_path = get_provider_binary_path(provider_type)
+            if provider_path and provider_path.exists():
+                import logging
+                logger = logging.getLogger(__name__)
+
+                # Find a free port
+                port = self._get_free_port()
+                data_dir = get_data_dir()
+                startup_timeout = 30  # seconds
+
+                logger.info(f"Starting provider {provider_type} on port {port}")
+                logger.info(f"Provider binary: {provider_path}")
+                logger.info(f"Data directory: {data_dir}")
+
+                # Provider output goes to log files (easier debugging on Windows)
+                logs_dir = data_dir / "logs"
+                logs_dir.mkdir(parents=True, exist_ok=True)
+                stdout_log = logs_dir / f"{provider_type}-stdout.log"
+                stderr_log = logs_dir / f"{provider_type}-stderr.log"
+
+                logger.info(f"Provider logs will be written to: {logs_dir}")
+
+                # The child gets its own copies of the log handles, so the
+                # parent's copies are closed as soon as the process is spawned.
+                with open(stdout_log, 'w') as out_f, open(stderr_log, 'w') as err_f:
+                    process = subprocess.Popen(
+                        [
+                            str(provider_path),
+                            "--port", str(port),
+                            "--data-dir", str(data_dir),
+                        ],
+                        stdout=out_f,
+                        stderr=err_f,
+                    )
+
+                # Wait for provider to be ready
+                base_url = f"http://127.0.0.1:{port}"
+                try:
+                    await self._wait_for_provider_health(base_url, timeout=startup_timeout)
+                except TimeoutError as e:
+                    logger.error(f"Provider failed to start within {startup_timeout} seconds")
+                    logger.error(f"Check logs at: {logs_dir}")
+                    exit_code = process.poll()
+                    if exit_code is not None:
+                        logger.error(f"Provider process exited early with code {exit_code}")
+
+                    # Stop the process before reading the logs it was writing
+                    self._terminate_process(process)
+                    self._log_tail(logger, "Stdout", stdout_log)
+                    self._log_tail(logger, "Stderr", stderr_log)
+
+                    # Raise with log file location for user
+                    raise TimeoutError(
+                        f"Provider {provider_type} failed to start. Check logs at: {logs_dir}"
+                    ) from e
+
+                # Create LocalProvider instance
+                self.active_provider = LocalProvider(base_url)
+                self._provider_process = process
+                self._provider_port = port
+            else:
+                # No external binary, use bundled provider (if available)
+                if provider_type == "pytorch-cpu":
+                    # PyTorch CPU can use bundled backend
+                    self.active_provider = self._get_default_provider()
+                else:
+                    raise ValueError(f"Provider {provider_type} is not installed. Please download it first.")
+        elif provider_type == "remote":
+            # Remote provider - will be implemented in Phase 5
+            raise NotImplementedError("Remote provider not yet implemented")
+        elif provider_type == "openai":
+            # OpenAI provider - will be implemented in Phase 5
+            raise NotImplementedError("OpenAI provider not yet implemented")
+        else:
+            raise ValueError(f"Unknown provider type: {provider_type}")
+
+    @staticmethod
+    def _terminate_process(process: subprocess.Popen) -> None:
+        """
+        Terminate a subprocess, killing it if it has not exited after 5 seconds.
+
+        Args:
+            process: Subprocess to stop
+        """
+        process.terminate()
+        try:
+            process.wait(timeout=5)
+        except subprocess.TimeoutExpired:
+            process.kill()
+            process.wait()  # reap the killed process
+
+    @staticmethod
+    def _log_tail(logger, label: str, log_path: Path, max_chars: int = 2000) -> None:
+        """
+        Log the last ``max_chars`` characters of a provider log file as an error.
+
+        Args:
+            logger: Logger that receives the output
+            label: Prefix for the message (e.g. "Stdout")
+            log_path: Log file to read
+            max_chars: Maximum number of trailing characters to log
+        """
+        try:
+            tail = log_path.read_text(errors="replace")[-max_chars:]
+        except OSError as ex:
+            logger.warning(f"Could not read provider log {log_path}: {ex}")
+            return
+        if tail:
+            logger.error(f"{label}: {tail}")
+    
+    async def stop_provider(self) -> None:
+        """Stop the active provider (the bundled one is kept) and any provider subprocess."""
+        provider = self.active_provider
+        if provider is not None and provider is not self._default_provider:
+            if hasattr(provider, 'stop'):
+                await provider.stop()
+            self.active_provider = None
+
+        # Stop the subprocess even when no active provider is set
+        process, self._provider_process, self._provider_port = self._provider_process, None, None
+        if process is not None:
+            process.terminate()
+            try:
+                # Wait in a worker thread so the event loop is not blocked
+                await asyncio.get_running_loop().run_in_executor(None, process.wait, 5)
+            except subprocess.TimeoutExpired:
+                process.kill()
+                process.wait()  # reap the killed process
+    
+    async def list_installed(self) -> list[str]:
+        """
+        Report which provider types are available on this machine.
+        
+        Returns:
+            The platform's bundled provider (if any) followed by downloaded ones
+        """
+        system = platform.system()
+        machine = platform.machine()
+
+        # Bundled providers are always available
+        if system == "Darwin" and machine == "arm64":
+            # Apple Silicon gets MLX bundled
+            installed = ["apple-mlx"]
+        elif system in ("Windows", "Darwin"):
+            # Windows and Intel macOS get PyTorch CPU bundled
+            installed = ["pytorch-cpu"]
+        else:
+            # Linux: no bundled provider - users must download
+            installed = []
+
+        # A downloaded provider counts once its binary is present on disk
+        for provider_type in ("pytorch-cpu", "pytorch-cuda"):
+            binary_path = get_provider_binary_path(provider_type)
+            if provider_type not in installed and binary_path and binary_path.exists():
+                installed.append(provider_type)
+
+        return installed
+    
+    async def get_provider_info(self, provider_type: str) -> dict:
+        """
+        Describe a provider type.
+        
+        Args:
+            provider_type: Type of provider
+            
+        Returns:
+            Dict with "type", "name", "installed" and "size_mb" keys
+        """
+        # Bundled providers: always installed, no separate download size
+        if provider_type in ("apple-mlx", "bundled-pytorch"):
+            return {
+                "type": provider_type,
+                "name": "Bundled Provider",
+                "installed": True,
+                "size_mb": None,
+            }
+        # Downloadable providers: display name and size_mb value
+        downloadable = {
+            "pytorch-cpu": ("PyTorch CPU", 300),
+            "pytorch-cuda": ("PyTorch CUDA", 2400),
+        }
+        if provider_type in downloadable:
+            display_name, size_mb = downloadable[provider_type]
+            return {
+                "type": provider_type,
+                "name": display_name,
+                "installed": provider_type in await self.list_installed(),
+                "size_mb": size_mb,
+            }
+        # Anything else is echoed back as not installed
+        return {
+            "type": provider_type,
+            "name": provider_type,
+            "installed": False,
+            "size_mb": None,
+        }
+
+
+    def _get_free_port(self) -> int:
+        """Ask the OS for an unused TCP port (it may be taken again before it is used)."""
+        with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as probe:
+            probe.bind(('', 0))  # port 0 lets the OS pick the port
+            return probe.getsockname()[1]
+    
+    async def _wait_for_provider_health(self, base_url: str, timeout: int = 30) -> None:
+        """Poll {base_url}/tts/health until it returns 200; raise TimeoutError after ``timeout`` seconds."""
+        import httpx
+
+        loop = asyncio.get_running_loop()
+        deadline = loop.time() + timeout
+        # One client is reused for every probe instead of one per attempt
+        async with httpx.AsyncClient(timeout=2.0) as client:
+            while True:
+                try:
+                    response = await client.get(f"{base_url}/tts/health")
+                    if response.status_code == 200:
+                        return
+                except Exception:
+                    pass  # provider not reachable yet; keep polling
+
+                if loop.time() > deadline:
+                    raise TimeoutError(f"Provider did not become healthy within {timeout} seconds")
+                await asyncio.sleep(0.5)
+
+    async def _log_subprocess_output(self, process: subprocess.Popen) -> None:
+        """Forward a subprocess's piped stdout/stderr lines to the module logger."""
+        import logging
+        log = logging.getLogger(__name__)
+
+        async def pump(pipe, label):
+            # A stream that was not piped is None and is skipped
+            if not pipe:
+                return
+            loop = asyncio.get_event_loop()
+            # readline blocks, so it runs in the default executor; an empty result ends the loop
+            while line := await loop.run_in_executor(None, pipe.readline):
+                log.info(f"{label}: {line.rstrip()}")
+
+        await asyncio.gather(
+            pump(process.stdout, "Provider stdout"),
+            pump(process.stderr, "Provider stderr"),
+            return_exceptions=True,
+        )
+
+
+# Global provider manager instance
+_provider_manager: Optional[ProviderManager] = None
+
+
+def get_provider_manager() -> ProviderManager:
+    """Return the module-level ProviderManager, creating it on the first call."""
+    global _provider_manager
+    if _provider_manager is None:
+        _provider_manager = ProviderManager()
+    return _provider_manager
diff --git a/backend/providers/base.py b/backend/providers/base.py
new file mode 100644
index 00000000..50b05ce0
--- /dev/null
+++ b/backend/providers/base.py
@@ -0,0 +1,97 @@
+"""
+Base protocol for TTS providers.
+"""
+
+from typing import Protocol, Optional, Tuple
+from typing_extensions import runtime_checkable
+import numpy as np
+
+from .types import ProviderHealth, ProviderStatus
+
+
+@runtime_checkable
+class TTSProvider(Protocol):
+    """Protocol for TTS provider implementations; @runtime_checkable allows isinstance() checks."""
+    
+    async def generate(
+        self,
+        text: str,
+        voice_prompt: dict,
+        language: str = "en",
+        seed: Optional[int] = None,
+        instruct: Optional[str] = None,
+    ) -> Tuple[np.ndarray, int]:
+        """
+        Generate speech audio from text.
+        
+        Args:
+            text: Text to synthesize
+            voice_prompt: Voice prompt dictionary
+            language: Language code
+            seed: Random seed for reproducibility
+            instruct: Delivery instructions
+            
+        Returns:
+            Tuple of (audio_array, sample_rate)
+        """
+        ...
+    
+    async def create_voice_prompt(
+        self,
+        audio_path: str,
+        reference_text: str,
+        use_cache: bool = True,
+    ) -> Tuple[dict, bool]:
+        """
+        Create voice prompt from reference audio.
+        
+        Args:
+            audio_path: Path to reference audio file
+            reference_text: Transcript of the audio
+            use_cache: Whether to use cached prompts
+            
+        Returns:
+            Tuple of (voice_prompt_dict, was_cached)
+        """
+        ...
+    
+    async def combine_voice_prompts(
+        self,
+        audio_paths: list[str],
+        reference_texts: list[str],
+    ) -> Tuple[np.ndarray, str]:
+        """
+        Combine multiple voice prompts.
+        
+        Args:
+            audio_paths: List of audio file paths
+            reference_texts: List of reference texts
+            
+        Returns:
+            Tuple of (combined_audio_array, combined_text)
+        """
+        ...
+    
+    async def load_model_async(self, model_size: str) -> None:
+        """Load the TTS model of the given size."""
+        ...
+    
+    def unload_model(self) -> None:
+        """Unload model to free memory (synchronous)."""
+        ...
+    
+    def is_loaded(self) -> bool:
+        """Check if model is loaded (synchronous)."""
+        ...
+    
+    def _get_model_path(self, model_size: str) -> str:
+        """Get model path for a given size."""
+        ...
+    
+    async def health(self) -> ProviderHealth:
+        """Get provider health status as a ProviderHealth."""
+        ...
+    
+    async def status(self) -> ProviderStatus:
+        """Get provider model status as a ProviderStatus."""
+        ...
diff --git a/backend/providers/bundled.py b/backend/providers/bundled.py
new file mode 100644
index 00000000..bb34cd57
--- /dev/null
+++ b/backend/providers/bundled.py
@@ -0,0 +1,144 @@
+"""
+Bundled provider that wraps existing MLX/PyTorch backends.
+"""
+
+from typing import Optional, Tuple
+import numpy as np
+import platform
+
+from .base import TTSProvider
+from .types import ProviderHealth, ProviderStatus
+from ..backends import get_tts_backend, TTSBackend
+from ..platform_detect import get_backend_type
+
+
+class BundledProvider:
+    """Provider that wraps the existing bundled TTS backend (created lazily on first use)."""
+
+    def __init__(self):
+        self._backend: Optional[TTSBackend] = None
+
+    def _get_backend(self) -> TTSBackend:
+        """Get or create backend instance."""
+        if self._backend is None:
+            self._backend = get_tts_backend()
+        return self._backend
+
+    async def generate(
+        self,
+        text: str,
+        voice_prompt: dict,
+        language: str = "en",
+        seed: Optional[int] = None,
+        instruct: Optional[str] = None,
+    ) -> Tuple[np.ndarray, int]:
+        """Generate speech audio by delegating to the backend."""
+        backend = self._get_backend()
+        return await backend.generate(text, voice_prompt, language, seed, instruct)
+
+    async def create_voice_prompt(
+        self,
+        audio_path: str,
+        reference_text: str,
+        use_cache: bool = True,
+    ) -> Tuple[dict, bool]:
+        """Create voice prompt from reference audio by delegating to the backend."""
+        backend = self._get_backend()
+        return await backend.create_voice_prompt(audio_path, reference_text, use_cache)
+
+    async def combine_voice_prompts(
+        self,
+        audio_paths: list[str],
+        reference_texts: list[str],
+    ) -> Tuple[np.ndarray, str]:
+        """Combine multiple voice prompts by delegating to the backend."""
+        backend = self._get_backend()
+        return await backend.combine_voice_prompts(audio_paths, reference_texts)
+
+    async def load_model_async(self, model_size: str) -> None:
+        """Load TTS model, preferring the backend's load_model_async when it has one."""
+        backend = self._get_backend()
+        if hasattr(backend, 'load_model_async'):
+            await backend.load_model_async(model_size)
+        else:
+            await backend.load_model(model_size)
+
+    # Alias for compatibility
+    load_model = load_model_async
+
+    def unload_model(self) -> None:
+        """Unload model to free memory."""
+        backend = self._get_backend()
+        backend.unload_model()
+
+    def is_loaded(self) -> bool:
+        """Check if model is loaded."""
+        backend = self._get_backend()
+        return backend.is_loaded()
+
+    def _get_model_path(self, model_size: str) -> str:
+        """Get model path for a given size."""
+        backend = self._get_backend()
+        return backend._get_model_path(model_size)
+
+    def _loaded_model_size(self, backend: TTSBackend):
+        """Return the backend's current model size, or None when nothing is loaded or it is unknown."""
+        if not backend.is_loaded():
+            return None
+        # Not every backend exposes _current_model_size, hence getattr
+        return getattr(backend, '_current_model_size', None) or None
+
+    async def health(self) -> ProviderHealth:
+        """Get provider health status (always "healthy" for the bundled provider)."""
+        backend = self._get_backend()
+        is_mlx = get_backend_type() == "mlx"
+
+        if is_mlx:
+            # The MLX backend is reported as running on Metal
+            device = "metal"
+        else:
+            # Backends without a device attribute report no device
+            device = getattr(backend, 'device', None)
+
+        return ProviderHealth(
+            status="healthy",
+            # Use apple-mlx for MLX backend, pytorch-cpu for PyTorch
+            provider="apple-mlx" if is_mlx else "pytorch-cpu",
+            version=None,  # Provider versioning not implemented yet
+            model=self._loaded_model_size(backend),
+            device=device,
+        )
+
+    async def status(self) -> ProviderStatus:
+        """
+        Get provider model status.
+
+        GPU fields are only filled in for the PyTorch backend when torch can be
+        imported; otherwise they stay None.
+        """
+        backend = self._get_backend()
+        is_pytorch = get_backend_type() == "pytorch"
+
+        available_sizes = ["1.7B"]
+        gpu_available = None
+        vram_used_mb = None
+
+        if is_pytorch:
+            available_sizes.append("0.6B")
+            try:
+                import torch
+                gpu_available = torch.cuda.is_available()
+                if gpu_available:
+                    # memory_allocated() is in bytes
+                    vram_used_mb = int(torch.cuda.memory_allocated() / 1024 / 1024)
+            except ImportError:
+                pass
+
+        return ProviderStatus(
+            model_loaded=backend.is_loaded(),
+            model_size=self._loaded_model_size(backend),
+            available_sizes=available_sizes,
+            gpu_available=gpu_available,
+            # 0 MB is a valid reading, so only a missing measurement maps to None
+            vram_used_mb=vram_used_mb,
+        )
diff --git a/backend/providers/checksums.py b/backend/providers/checksums.py
new file mode 100644
index 00000000..75798b10
--- /dev/null
+++ b/backend/providers/checksums.py
@@ -0,0 +1,11 @@
+# Provider checksums - embedded at build time for security
+# This file is auto-generated during CI builds
+# In development, checksums are empty (verification is skipped)
+
+PROVIDER_CHECKSUMS = {
+    # Populated during release builds with SHA256 checksums of provider binaries
+    # Example:
+    # "tts-provider-pytorch-cpu-windows.exe": "abc123...",
+    # "tts-provider-pytorch-cuda-windows.exe": "def456...",
+    # "tts-provider-pytorch-cuda-linux": "789xyz...",
+}
diff --git a/backend/providers/installer.py b/backend/providers/installer.py
new file mode 100644
index 00000000..0dcca1ec
--- /dev/null
+++ b/backend/providers/installer.py
@@ -0,0 +1,262 @@
+"""
+Provider download and installation manager.
+"""
+
+import asyncio
+import httpx
+import platform
+from pathlib import Path
+from typing import Optional
+
+from .types import ProviderType
+from ..utils.progress import get_progress_manager
+from ..utils.tasks import get_task_manager
+
+
+# Provider version (independent of app version)
+PROVIDER_VERSION = "1.0.0"
+
+# Base URL for provider downloads (Cloudflare R2)
+PROVIDER_DOWNLOAD_BASE_URL = "https://downloads.voicebox.sh/providers"
+
+
+def _get_providers_dir() -> Path:
+    """Return <per-user app data>/voicebox/providers, creating it if needed (non-Windows/macOS is treated as Linux)."""
+    home = Path.home()
+    system = platform.system()
+    if system == "Darwin":
+        appdata = home / "Library" / "Application Support"
+    elif system == "Windows":
+        appdata = home / "AppData" / "Roaming"
+    else:
+        appdata = home / ".local" / "share"
+
+    providers_dir = appdata.joinpath("voicebox", "providers")
+    providers_dir.mkdir(parents=True, exist_ok=True)
+    return providers_dir
+
+
+def _get_provider_binary_name(provider_type: str) -> str:
+    """
+    Return the local executable filename for a provider type.
+
+    Raises:
+        ValueError: If provider_type is not "pytorch-cpu" or "pytorch-cuda"
+    """
+    # Only these provider types have a binary name
+    if provider_type not in ("pytorch-cpu", "pytorch-cuda"):
+        raise ValueError(f"Unknown provider type: {provider_type}")
+
+    # Windows executables carry an .exe extension
+    suffix = ".exe" if platform.system() == "Windows" else ""
+    return f"tts-provider-{provider_type}{suffix}"
+
+
+def _get_provider_download_name(provider_type: str) -> str:
+    """
+    Return the remote archive filename for a provider type.
+
+    Archives are .zip on Windows and .tar.gz on Linux and macOS; any other
+    operating system raises ValueError.
+    """
+    system = platform.system()
+
+    # Platform suffix and archive extension
+    if system == "Windows":
+        suffix_and_ext = "windows.zip"
+    elif system == "Linux":
+        suffix_and_ext = "linux.tar.gz"
+    elif system == "Darwin":
+        # macOS archives are split by CPU architecture
+        arch = "arm64" if platform.machine() == "arm64" else "x64"
+        suffix_and_ext = f"macos-{arch}.tar.gz"
+    else:
+        raise ValueError(f"Provider downloads not supported on {system}")
+
+    return f"tts-provider-{provider_type}-{suffix_and_ext}"
+
+
+def _get_provider_download_url(provider_type: str) -> str:
+    """Build the versioned download URL: <base URL>/v<PROVIDER_VERSION>/<archive name>."""
+    archive = _get_provider_download_name(provider_type)
+    return "/".join((PROVIDER_DOWNLOAD_BASE_URL, f"v{PROVIDER_VERSION}", archive))
+
+
+async def download_provider(provider_type: str) -> Path:
+    """
+    Download and extract a provider archive from Cloudflare R2.
+
+    Progress is reported through the progress manager under ``provider_type``
+    and the download is tracked by the task manager. The archive is deleted
+    after extraction, and also when any step fails.
+
+    NOTE(review): the archive is not checked against PROVIDER_CHECKSUMS in
+    checksums.py - confirm whether verification is expected to happen here.
+
+    Args:
+        provider_type: Type of provider to download (e.g., "pytorch-cpu")
+
+    Returns:
+        Path to the extracted provider binary
+
+    Raises:
+        ValueError: If provider_type is invalid, the archive format is
+            unsupported, or no binary is found after extraction
+        httpx.HTTPError: If download fails
+    """
+    if provider_type not in ["pytorch-cpu", "pytorch-cuda"]:
+        raise ValueError(f"Provider type {provider_type} cannot be downloaded")
+
+    progress_manager = get_progress_manager()
+    task_manager = get_task_manager()
+
+    archive_name = _get_provider_download_name(provider_type)
+    download_url = _get_provider_download_url(provider_type)
+    providers_dir = _get_providers_dir()
+    archive_path = providers_dir / archive_name
+
+    # Every progress update for this download shares the same model_name
+    def report(current: int, total: int, filename: str, status: str) -> None:
+        """Forward one progress update for this provider download."""
+        progress_manager.update_progress(
+            model_name=provider_type,
+            current=current,
+            total=total,
+            filename=filename,
+            status=status,
+        )
+
+    # Start tracking download
+    task_manager.start_download(provider_type)
+    report(0, 0, archive_name, "downloading")  # total is set once Content-Length is known
+
+    try:
+        # Download archive
+        async with httpx.AsyncClient(timeout=300.0) as client:
+            async with client.stream("GET", download_url) as response:
+                response.raise_for_status()
+
+                # Get total size from Content-Length header
+                total_size = int(response.headers.get("Content-Length", 0))
+                if total_size > 0:
+                    report(0, total_size, archive_name, "downloading")
+
+                # Download with progress tracking
+                downloaded = 0
+                with open(archive_path, "wb") as f:
+                    async for chunk in response.aiter_bytes(chunk_size=8192):
+                        f.write(chunk)
+                        downloaded += len(chunk)
+                        report(
+                            downloaded,
+                            total_size if total_size > 0 else downloaded,
+                            archive_name,
+                            "downloading",
+                        )
+
+        # Extract in a worker thread: unpacking a large archive would otherwise
+        # block the event loop for the whole extraction
+        report(downloaded, downloaded, "Extracting...", "downloading")
+        await asyncio.to_thread(_extract_provider_archive, archive_path, providers_dir)
+
+        # Remove archive after extraction
+        archive_path.unlink()
+
+        # Get path to extracted binary
+        binary_path = get_provider_binary_path(provider_type)
+        if not binary_path:
+            raise ValueError("Provider binary not found after extraction")
+
+        # Make executable on Unix systems
+        if platform.system() != "Windows":
+            binary_path.chmod(0o755)
+
+        # Mark as complete
+        report(downloaded, downloaded, _get_provider_binary_name(provider_type), "complete")
+        task_manager.complete_download(provider_type)
+
+        return binary_path
+
+    except Exception as e:
+        # Clean up archive if it exists
+        if archive_path.exists():
+            archive_path.unlink()
+
+        # Mark as error
+        report(0, 0, archive_name, "error")
+        task_manager.error_download(provider_type, str(e))
+        raise
+
+
+def _extract_provider_archive(archive_path: Path, dest_dir: Path) -> None:
+    """
+    Unpack a downloaded provider archive (.zip or .tar.gz) into dest_dir.
+
+    Raises:
+        ValueError: If the archive is neither .zip nor .tar.gz
+    """
+    import zipfile
+    import tarfile
+
+    name = archive_path.name
+    if name.endswith('.zip'):
+        with zipfile.ZipFile(archive_path, 'r') as zip_ref:
+            zip_ref.extractall(dest_dir)
+    elif name.endswith('.tar.gz'):
+        with tarfile.open(archive_path, 'r:gz') as tar_ref:
+            if hasattr(tarfile, 'data_filter'):
+                # Refuse members that would land outside dest_dir (absolute
+                # paths, "..", escaping links)
+                tar_ref.extractall(dest_dir, filter='data')
+            else:
+                # Older Python without extraction filters
+                tar_ref.extractall(dest_dir)
+    else:
+        raise ValueError(f"Unsupported archive format: {name}")
+
+
+def get_provider_binary_path(provider_type: str) -> Optional[Path]:
+    """
+    Locate the installed binary for a provider type.
+
+    Args:
+        provider_type: Type of provider
+
+    Returns:
+        Path to provider binary, or None if not installed
+
+    Raises:
+        ValueError: If provider_type is unknown
+    """
+    providers_dir = _get_providers_dir()
+    binary_name = _get_provider_binary_name(provider_type)
+
+    candidates = (
+        # --onedir structure (directory with binary inside)
+        providers_dir / f"tts-provider-{provider_type}" / binary_name,
+        # Fallback: direct binary (legacy)
+        providers_dir / binary_name,
+    )
+    for candidate in candidates:
+        if candidate.is_file():
+            return candidate
+    return None
+
+
+def delete_provider(provider_type: str) -> bool:
+    """
+    Delete an installed provider (its --onedir directory or legacy binary).
+
+    Returns:
+        True if deleted, False if not found
+    """
+    import shutil
+    provider_path = get_provider_binary_path(provider_type)
+    if provider_path is None:
+        return False
+    if provider_path.parent.name == f"tts-provider-{provider_type}":
+        # --onedir install: remove the bundled files too, not just the executable
+        shutil.rmtree(provider_path.parent)
+    else:
+        provider_path.unlink()
+    return True
diff --git a/backend/providers/local.py b/backend/providers/local.py
new file mode 100644
index 00000000..3ea4d75b
--- /dev/null
+++ b/backend/providers/local.py
@@ -0,0 +1,191 @@
+"""
+Local provider that communicates with standalone provider servers via HTTP.
+"""
+
+from typing import Optional, Tuple
+import base64
+import io
+import numpy as np
+import httpx
+import soundfile as sf
+
+from .base import TTSProvider
+from .types import ProviderHealth, ProviderStatus
+
+
+class LocalProvider:
+    """TTS provider client that forwards calls over HTTP to a standalone provider server."""
+    
+    def __init__(self, base_url: str):
+        """
+        Create the HTTP client and remember the server's base URL.
+        
+        Args:
+            base_url: Base URL of the provider server (e.g., "http://localhost:8000"); trailing "/" is stripped
+        """
+        self.base_url = base_url.rstrip('/')
+        self.client = httpx.AsyncClient(timeout=300.0)  # 5 minute timeout for generation
+        self._current_model_size = "1.7B"  # Sent as "model_size" by generate(); changed via load_model_async()
+    
+    async def generate(
+        self,
+        text: str,
+        voice_prompt: dict,
+        language: str = "en",
+        seed: Optional[int] = None,
+        instruct: Optional[str] = None,
+    ) -> Tuple[np.ndarray, int]:
+        """POST to /tts/generate and return (audio, sample_rate); `instruct` is accepted but not sent."""
+        response = await self.client.post(
+            f"{self.base_url}/tts/generate",
+            json={
+                "text": text,
+                "voice_prompt": voice_prompt,
+                "language": language,
+                "seed": seed,
+                "model_size": self._current_model_size,
+            }
+        )
+        response.raise_for_status()  # HTTP error statuses surface to the caller as exceptions
+        data = response.json()
+        
+        # The "audio" field is a base64-encoded audio file that soundfile can parse
+        audio_bytes = base64.b64decode(data["audio"])
+        audio_buffer = io.BytesIO(audio_bytes)
+        audio, sample_rate = sf.read(audio_buffer)
+        
+        return audio, data["sample_rate"]  # server-reported rate; the rate parsed by sf.read is unused
+    
+    async def create_voice_prompt(
+        self,
+        audio_path: str,
+        reference_text: str,
+        use_cache: bool = True,
+    ) -> Tuple[dict, bool]:
+        """Upload reference audio to /tts/create_voice_prompt; returns (voice_prompt, was_cached)."""
+        # Read the whole reference file into memory
+        with open(audio_path, 'rb') as f:
+            audio_data = f.read()
+        
+        # Multipart upload; the part is always labelled "audio.wav" / "audio/wav"
+        files = {
+            "audio": ("audio.wav", audio_data, "audio/wav")
+        }
+        data = {
+            "reference_text": reference_text,
+            "use_cache": str(use_cache).lower(),  # form field value is "true" or "false"
+        }
+        
+        response = await self.client.post(
+            f"{self.base_url}/tts/create_voice_prompt",
+            files=files,
+            data=data,
+        )
+        response.raise_for_status()
+        result = response.json()
+        
+        return result["voice_prompt"], result.get("was_cached", False)  # was_cached defaults to False if absent
+    
+    async def combine_voice_prompts(
+        self,
+        audio_paths: list[str],
+        reference_texts: list[str],
+    ) -> Tuple[np.ndarray, str]:
+        """
+        Combine multiple reference clips into one (audio, text) pair.
+        
+        Note: This is not implemented in the provider API yet, so the clips are
+        normalized and concatenated locally and the texts are joined with spaces.
+        """
+        import numpy as np  # NOTE(review): redundant with the module-level numpy import
+        from ..utils.audio import load_audio, normalize_audio
+        
+        combined_audio = []
+        for audio_path in audio_paths:
+            audio, sr = load_audio(audio_path)
+            audio = normalize_audio(audio)
+            combined_audio.append(audio)
+        
+        # Concatenate in input order, then normalize the joined signal once more
+        mixed = np.concatenate(combined_audio)
+        mixed = normalize_audio(mixed)
+        
+        # Join the reference texts with single spaces
+        combined_text = " ".join(reference_texts)
+        
+        return mixed, combined_text
+    
+    async def load_model_async(self, model_size: str) -> None:
+        """Record the model size to request; no HTTP call is made here."""
+        # Track the requested model size - the provider server will load it
+        # when generate() is called with this size
+        self._current_model_size = model_size
+
+    # Alias for compatibility (load_model is the same coroutine function)
+    load_model = load_model_async
+    
+    def unload_model(self) -> None:
+        """No-op: this client holds no model to unload."""
+        # Model unloading is handled by the provider server
+        # This is a no-op for local providers
+        pass
+    
+    def is_loaded(self) -> bool:
+        """Always returns True; the server is not queried."""
+        # We can't know this without querying the provider
+        # Return True optimistically
+        return True
+    
+    def _get_model_path(self, model_size: str) -> str:
+        """Build a placeholder model identifier string for the given size."""
+        # For local providers, model paths are handled by the provider server
+        # Return a placeholder
+        return f"Qwen/Qwen3-TTS-12Hz-{model_size}-Base"
+    
+    async def health(self) -> ProviderHealth:
+        """GET /tts/health; any failure is reported as status "unhealthy" rather than raised."""
+        try:
+            response = await self.client.get(f"{self.base_url}/tts/health")
+            response.raise_for_status()
+            data = response.json()
+            return ProviderHealth(
+                status=data["status"],
+                provider=data["provider"],
+                version=data.get("version"),
+                model=data.get("model"),
+                device=data.get("device"),
+            )
+        except Exception as e:
+            return ProviderHealth(
+                status="unhealthy",
+                provider="local",
+                version=None,
+                model=None,
+                device=None,
+            )
+    
+    async def status(self) -> ProviderStatus:
+        """GET /tts/status; any failure yields a 'model not loaded' status rather than raising."""
+        try:
+            response = await self.client.get(f"{self.base_url}/tts/status")
+            response.raise_for_status()
+            data = response.json()
+            return ProviderStatus(
+                model_loaded=data["model_loaded"],
+                model_size=data.get("model_size"),
+                available_sizes=data.get("available_sizes", []),
+                gpu_available=data.get("gpu_available"),
+                vram_used_mb=data.get("vram_used_mb"),
+            )
+        except Exception as e:
+            return ProviderStatus(
+                model_loaded=False,
+                model_size=None,
+                available_sizes=[],
+                gpu_available=None,
+                vram_used_mb=None,
+            )
+    
+    async def stop(self) -> None:
+        """Close the underlying httpx client; no request is sent to the provider server."""
+        await self.client.aclose()
diff --git a/backend/providers/types.py b/backend/providers/types.py
new file mode 100644
index 00000000..b6b0aff1
--- /dev/null
+++ b/backend/providers/types.py
@@ -0,0 +1,34 @@
+"""
+Shared types for TTS providers.
+"""
+
+from typing import Optional, TypedDict
+from enum import Enum
+
+
+class ProviderType(str, Enum):
+    """Identifiers of the available provider types; members are also plain strings (str mixin)."""
+    BUNDLED_MLX = "apple-mlx"
+    BUNDLED_PYTORCH = "bundled-pytorch"
+    PYTORCH_CPU = "pytorch-cpu"
+    PYTORCH_CUDA = "pytorch-cuda"
+    REMOTE = "remote"
+    OPENAI = "openai"
+
+
+class ProviderHealth(TypedDict):
+    """Health report of a provider; every key is required, the Optional ones may be None."""
+    status: str  # "healthy", "unhealthy", "starting"
+    provider: str
+    version: Optional[str]
+    model: Optional[str]
+    device: Optional[str]
+
+
+class ProviderStatus(TypedDict):
+    """Model status of a provider; every key is required, the Optional ones may be None."""
+    model_loaded: bool
+    model_size: Optional[str]
+    available_sizes: list[str]
+    gpu_available: Optional[bool]
+    vram_used_mb: Optional[int]
diff --git a/backend/tts.py b/backend/tts.py
index 98db3412..0f9cfd5f 100644
--- a/backend/tts.py
+++ b/backend/tts.py
@@ -1,5 +1,5 @@
 """
-TTS inference module - delegates to backend abstraction layer.
+TTS inference module - delegates to provider abstraction layer.
 """
 
 from typing import Optional
@@ -7,31 +7,51 @@
 import io
 import soundfile as sf
 
-from .backends import get_tts_backend, TTSBackend
+from .backends import TTSBackend
+from .providers import get_provider_manager
+from .providers.base import TTSProvider
 
 
-def get_tts_model() -> TTSBackend:
+def get_tts_model() -> TTSProvider:
     """
-    Get TTS backend instance (MLX or PyTorch based on platform).
+    Get TTS provider instance: the active provider if no event loop is running, else the manager's default.
     
     Returns:
-        TTS backend instance
+        TTS provider instance
     """
-    return get_tts_backend()
+    manager = get_provider_manager()
+    # get_active_provider() must be awaited, but this function keeps a sync
+    # interface for backward compatibility, so it can only await via a stopped loop
+    import asyncio
+    try:
+        loop = asyncio.get_event_loop()  # NOTE(review): deprecated on newer Pythons when no loop is running - confirm target version
+        if loop.is_running():
+            # We're in an async context, but can't await here
+            # Fall back to the manager's default provider instead
+            return manager._get_default_provider()
+        else:
+            return loop.run_until_complete(manager.get_active_provider())
+    except RuntimeError:
+        # No usable event loop (or run_until_complete refused): return default
+        return manager._get_default_provider()
+
+
+async def get_tts_model_async() -> TTSProvider:
+    """
+    Resolve the active TTS provider from within a coroutine.
+    
+    Returns:
+        TTS provider instance
+    """
+    # Await the manager's coroutine directly on the caller's event loop
+    return await get_provider_manager().get_active_provider()
 
 
 def unload_tts_model():
     """Unload TTS model to free memory."""
-    backend = get_tts_backend()
-    backend.unload_model()
-
-
-def audio_to_wav_bytes(audio: np.ndarray, sample_rate: int) -> bytes:
-    """Convert audio array to WAV bytes."""
-    buffer = io.BytesIO()
-    sf.write(buffer, audio, sample_rate, format="WAV")
-    buffer.seek(0)
-    return buffer.read()
+    manager = get_provider_manager()
+    provider = manager._get_default_provider()  # NOTE(review): default provider, not get_active_provider() - confirm this is intended
+    provider.unload_model()
 
 
 def audio_to_wav_bytes(audio: np.ndarray, sample_rate: int) -> bytes:
diff --git a/backend/utils/progress.py b/backend/utils/progress.py
index 418a88c7..5d8202d2 100644
--- a/backend/utils/progress.py
+++ b/backend/utils/progress.py
@@ -49,11 +49,17 @@ def _notify_listeners_threadsafe(self, model_name: str, progress_data: Dict):
                     queue.put_nowait(progress_data.copy())
                 except RuntimeError:
                     # Not in async context (running in background thread)
-                    # Use call_soon_threadsafe to safely put on queue
+                    # Use asyncio.run_coroutine_threadsafe for better PyInstaller compatibility
                     if self._main_loop and self._main_loop.is_running():
-                        self._main_loop.call_soon_threadsafe(
-                            lambda q=queue, d=progress_data.copy(): q.put_nowait(d) if not q.full() else None
-                        )
+                        async def put_data_async(q=queue, d=progress_data.copy()):  # bind the target queue and snapshot the data now: the body runs later on the main loop
+                            try:
+                                q.put_nowait(d)  # uses the values captured at scheduling time, like the lambda this replaces
+                            except asyncio.QueueFull:
+                                pass  # Queue full, drop update
+                        try:
+                            asyncio.run_coroutine_threadsafe(put_data_async(), self._main_loop)
+                        except Exception as e:
+                            logger.warning(f"Failed to schedule progress update: {e}")
                     else:
                         logger.debug(f"No main loop available for {model_name}, skipping notification")
             except asyncio.QueueFull:
diff --git a/backend/voicebox-server.spec b/backend/voicebox-server.spec
index 5d6bb317..a6ff1e41 100644
--- a/backend/voicebox-server.spec
+++ b/backend/voicebox-server.spec
@@ -1,15 +1,11 @@
 # -*- mode: python ; coding: utf-8 -*-
 from PyInstaller.utils.hooks import collect_data_files
 from PyInstaller.utils.hooks import collect_submodules
-from PyInstaller.utils.hooks import copy_metadata
 
 datas = []
-hiddenimports = ['backend', 'backend.main', 'backend.config', 'backend.database', 'backend.models', 'backend.profiles', 'backend.history', 'backend.tts', 'backend.transcribe', 'backend.platform_detect', 'backend.backends', 'backend.backends.pytorch_backend', 'backend.utils.audio', 'backend.utils.cache', 'backend.utils.progress', 'backend.utils.hf_progress', 'backend.utils.validation', 'torch', 'transformers', 'fastapi', 'uvicorn', 'sqlalchemy', 'librosa', 'soundfile', 'qwen_tts', 'qwen_tts.inference', 'qwen_tts.inference.qwen3_tts_model', 'qwen_tts.inference.qwen3_tts_tokenizer', 'qwen_tts.core', 'qwen_tts.cli', 'pkg_resources.extern', 'backend.backends.mlx_backend', 'mlx', 'mlx.core', 'mlx.nn', 'mlx_audio', 'mlx_audio.tts', 'mlx_audio.stt']
-datas += collect_data_files('qwen_tts')
+hiddenimports = ['backend', 'backend.main', 'backend.config', 'backend.database', 'backend.models', 'backend.profiles', 'backend.history', 'backend.tts', 'backend.transcribe', 'backend.platform_detect', 'backend.providers', 'backend.providers.base', 'backend.providers.bundled', 'backend.providers.types', 'backend.utils.audio', 'backend.utils.cache', 'backend.utils.progress', 'backend.utils.hf_progress', 'backend.utils.validation', 'fastapi', 'uvicorn', 'sqlalchemy', 'librosa', 'soundfile', 'pkg_resources.extern', 'asyncio', 'asyncio.subprocess', 'concurrent.futures', 'concurrent.futures.thread', 'backend.backends', 'backend.backends.mlx_backend', 'mlx', 'mlx.core', 'mlx.nn', 'mlx_audio', 'mlx_audio.tts', 'mlx_audio.stt']
 datas += collect_data_files('mlx')
 datas += collect_data_files('mlx_audio')
-datas += copy_metadata('qwen-tts')
-hiddenimports += collect_submodules('qwen_tts')
 hiddenimports += collect_submodules('jaraco')
 hiddenimports += collect_submodules('mlx')
 hiddenimports += collect_submodules('mlx_audio')
diff --git a/bun.lock b/bun.lock
index 9e08a825..add8f83f 100644
--- a/bun.lock
+++ b/bun.lock
@@ -13,12 +13,16 @@
     },
     "app": {
       "name": "@voicebox/app",
-      "version": "0.1.11",
+      "version": "0.1.13",
       "dependencies": {
         "@dnd-kit/core": "^6.3.1",
         "@dnd-kit/sortable": "^10.0.0",
         "@dnd-kit/utilities": "^3.2.2",
         "@hookform/resolvers": "^3.9.0",
+        "@hugeicons/core-free-icons": "^3.1.1",
+        "@hugeicons/react": "^1.1.4",
+        "@iconify-json/svg-spinners": "^1.2.4",
+        "@iconify/react": "^6.0.2",
         "@radix-ui/react-alert-dialog": "^1.1.1",
         "@radix-ui/react-avatar": "^1.1.0",
         "@radix-ui/react-dialog": "^1.1.1",
@@ -26,6 +30,7 @@
         "@radix-ui/react-label": "^2.1.0",
         "@radix-ui/react-popover": "^1.1.1",
         "@radix-ui/react-progress": "^1.1.0",
+        "@radix-ui/react-radio-group": "^1.2.0",
         "@radix-ui/react-scroll-area": "^1.1.0",
         "@radix-ui/react-select": "^2.1.1",
         "@radix-ui/react-separator": "^1.1.0",
@@ -45,7 +50,6 @@
         "clsx": "^2.1.1",
         "date-fns": "^3.6.0",
         "framer-motion": "^12.29.0",
-        "lucide-react": "^0.454.0",
         "motion": "^12.29.0",
         "react": "^18.3.0",
         "react-dom": "^18.3.0",
@@ -68,7 +72,7 @@
     },
     "landing": {
       "name": "@voicebox/landing",
-      "version": "0.1.11",
+      "version": "0.1.13",
       "dependencies": {
         "@radix-ui/react-separator": "^1.1.8",
         "@radix-ui/react-slot": "^1.2.4",
@@ -93,7 +97,7 @@
     },
     "tauri": {
       "name": "@voicebox/tauri",
-      "version": "0.1.11",
+      "version": "0.1.13",
       "dependencies": {
         "@tauri-apps/api": "^2.0.0",
         "@tauri-apps/plugin-dialog": "^2.0.0",
@@ -116,7 +120,7 @@
     },
     "web": {
       "name": "@voicebox/web",
-      "version": "0.1.11",
+      "version": "0.1.13",
       "dependencies": {
         "@tanstack/react-query": "^5.0.0",
         "react": "^18.3.0",
@@ -125,6 +129,7 @@
         "zustand": "^4.5.0",
       },
       "devDependencies": {
+        "@tailwindcss/vite": "^4.1.18",
         "@types/react": "^18.3.0",
         "@types/react-dom": "^18.3.0",
         "@typescript-eslint/eslint-plugin": "^7.0.0",
@@ -133,6 +138,7 @@
         "eslint": "^8.57.0",
         "eslint-plugin-react-hooks": "^4.6.0",
         "eslint-plugin-react-refresh": "^0.4.0",
+        "tailwindcss": "^4.1.0",
         "typescript": "^5.6.0",
         "vite": "^5.4.0",
       },
@@ -271,12 +277,22 @@
 
     "@hookform/resolvers": ["@hookform/resolvers@3.10.0", "", { "peerDependencies": { "react-hook-form": "^7.0.0" } }, "sha512-79Dv+3mDF7i+2ajj7SkypSKHhl1cbln1OGavqrsF7p6mbUv11xpqpacPsGDCTRvCSjEEIez2ef1NveSVL3b0Ag=="],
 
+    "@hugeicons/core-free-icons": ["@hugeicons/core-free-icons@3.1.1", "", {}, "sha512-UpS2lUQFi5sKyJSWwM6rO+BnPLvVz1gsyCpPHeZyVuZqi89YH8ksliza4cwaODqKOZyeXmG8juo1ty4QtQofkg=="],
+
+    "@hugeicons/react": ["@hugeicons/react@1.1.4", "", { "peerDependencies": { "react": ">=16.0.0" } }, "sha512-gsc3eZyd2fGqRUThW9+lfjxxsOkz6KNVmRXRgJjP32GL0OnnLJnl3hytKt47CBbiQj2xE2kCw+rnP3UQCThcKw=="],
+
     "@humanwhocodes/config-array": ["@humanwhocodes/config-array@0.13.0", "", { "dependencies": { "@humanwhocodes/object-schema": "^2.0.3", "debug": "^4.3.1", "minimatch": "^3.0.5" } }, "sha512-DZLEEqFWQFiyK6h5YIeynKx7JlvCYWL0cImfSRXZ9l4Sg2efkFGTuFf6vzXjK1cq6IYkU+Eg/JizXw+TD2vRNw=="],
 
     "@humanwhocodes/module-importer": ["@humanwhocodes/module-importer@1.0.1", "", {}, "sha512-bxveV4V8v5Yb4ncFTT3rPSgZBOpCkjfK0y4oVVVJwIuDVBRMDXrPyXRL988i5ap9m9bnyEEjWfm5WkBmtffLfA=="],
 
     "@humanwhocodes/object-schema": ["@humanwhocodes/object-schema@2.0.3", "", {}, "sha512-93zYdMES/c1D69yZiKDBj0V24vqNzB/koF26KPaagAfd3P/4gUlh3Dys5ogAK+Exi9QyzlD8x/08Zt7wIKcDcA=="],
 
+    "@iconify-json/svg-spinners": ["@iconify-json/svg-spinners@1.2.4", "", { "dependencies": { "@iconify/types": "*" } }, "sha512-ayn0pogFPwJA1WFZpDnoq9/hjDxN+keeCMyThaX4d3gSJ3y0mdKUxIA/b1YXWGtY9wVtZmxwcvOIeEieG4+JNg=="],
+
+    "@iconify/react": ["@iconify/react@6.0.2", "", { "dependencies": { "@iconify/types": "^2.0.0" }, "peerDependencies": { "react": ">=16" } }, "sha512-SMmC2sactfpJD427WJEDN6PMyznTFMhByK9yLW0gOTtnjzzbsi/Ke/XqsumsavFPwNiXs8jSiYeZTmLCLwO+Fg=="],
+
+    "@iconify/types": ["@iconify/types@2.0.0", "", {}, "sha512-+wluvCrRhXrhyOmRDJ3q8mux9JkKy5SJ/v8ol2tu4FVjyYvtEzkc/3pK15ET6RKg4b4w4BmTk1+gsCUhf21Ykg=="],
+
     "@img/colour": ["@img/colour@1.0.0", "", {}, "sha512-A5P/LfWGFSl6nsckYtjw9da+19jB8hkJ6ACTGcDfEJ0aE+l2n2El7dsVM7UVHZQ9s2lmYMWlrS21YLy2IR1LUw=="],
 
     "@img/sharp-darwin-arm64": ["@img/sharp-darwin-arm64@0.34.5", "", { "optionalDependencies": { "@img/sharp-libvips-darwin-arm64": "1.2.4" }, "os": "darwin", "cpu": "arm64" }, "sha512-imtQ3WMJXbMY4fxb/Ndp6HBTNVtWCUI0WdobyheGf5+ad6xX8VIDO8u2xE4qc/fr08CKG/7dDseFtn6M6g/r3w=="],
@@ -407,6 +423,8 @@
 
     "@radix-ui/react-progress": ["@radix-ui/react-progress@1.1.8", "", { "dependencies": { "@radix-ui/react-context": "1.1.3", "@radix-ui/react-primitive": "2.1.4" }, "peerDependencies": { "@types/react": "*", "@types/react-dom": "*", "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc", "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc" }, "optionalPeers": ["@types/react", "@types/react-dom"] }, "sha512-+gISHcSPUJ7ktBy9RnTqbdKW78bcGke3t6taawyZ71pio1JewwGSJizycs7rLhGTvMJYCQB1DBK4KQsxs7U8dA=="],
 
+    "@radix-ui/react-radio-group": ["@radix-ui/react-radio-group@1.3.8", "", { "dependencies": { "@radix-ui/primitive": "1.1.3", "@radix-ui/react-compose-refs": "1.1.2", "@radix-ui/react-context": "1.1.2", "@radix-ui/react-direction": "1.1.1", "@radix-ui/react-presence": "1.1.5", "@radix-ui/react-primitive": "2.1.3", "@radix-ui/react-roving-focus": "1.1.11", "@radix-ui/react-use-controllable-state": "1.2.2", "@radix-ui/react-use-previous": "1.1.1", "@radix-ui/react-use-size": "1.1.1" }, "peerDependencies": { "@types/react": "*", "@types/react-dom": "*", "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc", "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc" }, "optionalPeers": ["@types/react", "@types/react-dom"] }, "sha512-VBKYIYImA5zsxACdisNQ3BjCBfmbGH3kQlnFVqlWU4tXwjy7cGX8ta80BcrO+WJXIn5iBylEH3K6ZTlee//lgQ=="],
+
     "@radix-ui/react-roving-focus": ["@radix-ui/react-roving-focus@1.1.11", "", { "dependencies": { "@radix-ui/primitive": "1.1.3", "@radix-ui/react-collection": "1.1.7", "@radix-ui/react-compose-refs": "1.1.2", "@radix-ui/react-context": "1.1.2", "@radix-ui/react-direction": "1.1.1", "@radix-ui/react-id": "1.1.1", "@radix-ui/react-primitive": "2.1.3", "@radix-ui/react-use-callback-ref": "1.1.1", "@radix-ui/react-use-controllable-state": "1.2.2" }, "peerDependencies": { "@types/react": "*", "@types/react-dom": "*", "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc", "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc" }, "optionalPeers": ["@types/react", "@types/react-dom"] }, "sha512-7A6S9jSgm/S+7MdtNDSb+IU859vQqJ/QAtcYQcfFC6W8RS4IxIZDldLR0xqCFZ6DCyrQLjLPsxtTNch5jVA4lA=="],
 
     "@radix-ui/react-scroll-area": ["@radix-ui/react-scroll-area@1.2.10", "", { "dependencies": { "@radix-ui/number": "1.1.1", "@radix-ui/primitive": "1.1.3", "@radix-ui/react-compose-refs": "1.1.2", "@radix-ui/react-context": "1.1.2", "@radix-ui/react-direction": "1.1.1", "@radix-ui/react-presence": "1.1.5", "@radix-ui/react-primitive": "2.1.3", "@radix-ui/react-use-callback-ref": "1.1.1", "@radix-ui/react-use-layout-effect": "1.1.1" }, "peerDependencies": { "@types/react": "*", "@types/react-dom": "*", "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc", "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc" }, "optionalPeers": ["@types/react", "@types/react-dom"] }, "sha512-tAXIa1g3sM5CGpVT0uIbUx/U3Gs5N8T52IICuCtObaos1S8fzsrPXG5WObkQN3S6NVl6wKgPhAIiBGbWnvc97A=="],
@@ -881,7 +899,7 @@
 
     "lru-cache": ["lru-cache@5.1.1", "", { "dependencies": { "yallist": "^3.0.2" } }, "sha512-KpNARQA3Iwv+jTA0utUVVbrh+Jlrr1Fv0e56GGzAFOXN7dk/FviaDW8LHmK52DlcH4WP2n6gI8vN1aesBFgo9w=="],
 
-    "lucide-react": ["lucide-react@0.454.0", "", { "peerDependencies": { "react": "^16.5.1 || ^17.0.0 || ^18.0.0 || ^19.0.0-rc" } }, "sha512-hw7zMDwykCLnEzgncEEjHeA6+45aeEzRYuKHuyRSOPkhko+J3ySGjGIzu+mmMfDFG1vazHepMaYFYHbTFAZAAQ=="],
+    "lucide-react": ["lucide-react@0.316.0", "", { "peerDependencies": { "react": "^16.5.1 || ^17.0.0 || ^18.0.0" } }, "sha512-dTmYX1H4IXsRfVcj/KUxworV6814ApTl7iXaS21AimK2RUEl4j4AfOmqD3VR8phe5V91m4vEJ8tCK4uT1jE5nA=="],
 
     "magic-string": ["magic-string@0.30.21", "", { "dependencies": { "@jridgewell/sourcemap-codec": "^1.5.5" } }, "sha512-vd2F4YUyEXKGcLHoq+TEyCjxueSeHnFxyyjNp80yg0XV4vUhnDer/lvvlqM/arB5bXQN5K2/3oinyCRyx8T2CQ=="],
 
@@ -1137,8 +1155,6 @@
 
     "@typescript-eslint/typescript-estree/semver": ["semver@7.7.3", "", { "bin": { "semver": "bin/semver.js" } }, "sha512-SdsKMrI9TdgjdweUSR9MweHA4EJ8YxHn8DFaDisvhVlUOe4BF1tLD7GAj0lIqWVl+dPb/rExr0Btby5loQm20Q=="],
 
-    "@voicebox/landing/lucide-react": ["lucide-react@0.316.0", "", { "peerDependencies": { "react": "^16.5.1 || ^17.0.0 || ^18.0.0" } }, "sha512-dTmYX1H4IXsRfVcj/KUxworV6814ApTl7iXaS21AimK2RUEl4j4AfOmqD3VR8phe5V91m4vEJ8tCK4uT1jE5nA=="],
-
     "@voicebox/landing/tailwind-merge": ["tailwind-merge@3.4.0", "", {}, "sha512-uSaO4gnW+b3Y2aWoWfFpX62vn2sR3skfhbjsEnaBI81WD1wBLlHZe5sWf0AqjksNdYTbGBEd0UasQMT3SNV15g=="],
 
     "@voicebox/landing/tailwindcss": ["tailwindcss@3.4.19", "", { "dependencies": { "@alloc/quick-lru": "^5.2.0", "arg": "^5.0.2", "chokidar": "^3.6.0", "didyoumean": "^1.2.2", "dlv": "^1.1.3", "fast-glob": "^3.3.2", "glob-parent": "^6.0.2", "is-glob": "^4.0.3", "jiti": "^1.21.7", "lilconfig": "^3.1.3", "micromatch": "^4.0.8", "normalize-path": "^3.0.0", "object-hash": "^3.0.0", "picocolors": "^1.1.1", "postcss": "^8.4.47", "postcss-import": "^15.1.0", "postcss-js": "^4.0.1", "postcss-load-config": "^4.0.2 || ^5.0 || ^6.0", "postcss-nested": "^6.2.0", "postcss-selector-parser": "^6.1.2", "resolve": "^1.22.8", "sucrase": "^3.35.0" }, "bin": { "tailwind": "lib/cli.js", "tailwindcss": "lib/cli.js" } }, "sha512-3ofp+LL8E+pK/JuPLPggVAIaEuhvIz4qNcf3nA1Xn2o/7fb7s/TYpHhwGDv1ZU3PkBluUVaF8PyCHcm48cKLWQ=="],
diff --git a/data/.gitkeep b/data/.gitkeep
deleted file mode 100644
index 76bde729..00000000
--- a/data/.gitkeep
+++ /dev/null
@@ -1,7 +0,0 @@
-# User data directory
-# This directory contains:
-# - profiles/ - Voice profile audio files
-# - generations/ - Generated audio files
-# - projects/ - Audio studio project files
-# - voicebox.db - SQLite database
-# - cache/ - Voice prompt cache files
diff --git a/data/cache/.gitkeep b/data/cache/.gitkeep
deleted file mode 100644
index d66284ff..00000000
--- a/data/cache/.gitkeep
+++ /dev/null
@@ -1 +0,0 @@
-# Voice prompt cache files
diff --git a/docker-compose.cpu.yml b/docker-compose.cpu.yml
new file mode 100644
index 00000000..7093c8d7
--- /dev/null
+++ b/docker-compose.cpu.yml
@@ -0,0 +1,26 @@
+version: '3.8'
+
+services:
+  voicebox:
+    image: ghcr.io/jamiepine/voicebox:latest
+    container_name: voicebox
+    restart: unless-stopped
+    ports:
+      - "8000:8000"
+    volumes:
+      - voicebox-data:/app/data
+      - huggingface-cache:/root/.cache/huggingface
+    environment:
+      - LOG_LEVEL=info
+    healthcheck:
+      test: ["CMD", "curl", "-f", "http://localhost:8000/health"]
+      interval: 30s
+      timeout: 10s
+      retries: 3
+      start_period: 40s
+
+volumes:
+  voicebox-data:
+    driver: local
+  huggingface-cache:
+    driver: local
diff --git a/docker-compose.yml b/docker-compose.yml
new file mode 100644
index 00000000..f8225205
--- /dev/null
+++ b/docker-compose.yml
@@ -0,0 +1,34 @@
+version: '3.8'
+
+services:
+  voicebox:
+    image: ghcr.io/jamiepine/voicebox:latest-cuda
+    container_name: voicebox
+    restart: unless-stopped
+    ports:
+      - "8000:8000"
+    volumes:
+      - voicebox-data:/app/data
+      - huggingface-cache:/root/.cache/huggingface
+    environment:
+      - GPU_MEMORY_FRACTION=0.8
+      - LOG_LEVEL=info
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 1
+              capabilities: [gpu]
+    healthcheck:
+      test: ["CMD", "curl", "-f", "http://localhost:8000/health"]
+      interval: 30s
+      timeout: 10s
+      retries: 3
+      start_period: 40s
+
+volumes:
+  voicebox-data:
+    driver: local
+  huggingface-cache:
+    driver: local
diff --git a/docs/mint.json b/docs/mint.json
index c4f582ea..bbe0c409 100644
--- a/docs/mint.json
+++ b/docs/mint.json
@@ -40,7 +40,7 @@
     {
       "group": "Getting Started",
       "icon": "rocket",
-      "pages": ["overview/introduction", "overview/installation", "overview/quick-start"]
+      "pages": ["overview/introduction", "overview/installation", "overview/docker", "overview/quick-start"]
     },
     {
       "group": "Features",
diff --git a/docs/overview/docker.mdx b/docs/overview/docker.mdx
new file mode 100644
index 00000000..0032a02a
--- /dev/null
+++ b/docs/overview/docker.mdx
@@ -0,0 +1,403 @@
+---
+title: "Docker Deployment"
+description: "Run Voicebox in Docker with the web UI for server deployments"
+---
+
+## Overview
+
+Voicebox is available as Docker images that include both the backend API and web UI. Run the full Voicebox experience in a container with a single command.
+
+**What's included:**
+- FastAPI backend with all TTS/Whisper capabilities
+- Complete web UI (same React app as the desktop version)
+- Provider download system (downloads PyTorch on first use)
+- Multi-architecture support (CPU image: amd64 and arm64; CUDA image: amd64 only)
+
+## Quick Start
+
+<Tabs>
+  <Tab title="NVIDIA GPU">
+    ```bash
+    docker run --gpus all -p 8000:8000 \
+      -v voicebox-data:/app/data \
+      ghcr.io/jamiepine/voicebox:latest-cuda
+    ```
+
+    Then open http://localhost:8000 to access the web UI.
+  </Tab>
+
+  <Tab title="CPU Only">
+    ```bash
+    docker run -p 8000:8000 \
+      -v voicebox-data:/app/data \
+      ghcr.io/jamiepine/voicebox:latest
+    ```
+
+    Then open http://localhost:8000 to access the web UI.
+  </Tab>
+
+  <Tab title="Docker Compose">
+    Clone the repo or download `docker-compose.yml`:
+
+    ```bash
+    # CUDA variant (default)
+    docker compose up -d
+
+    # CPU-only variant
+    docker compose -f docker-compose.cpu.yml up -d
+    ```
+
+    Then open http://localhost:8000 to access the web UI.
+  </Tab>
+</Tabs>
+
+<Note>
+  On first launch, you'll be prompted to download a TTS provider (PyTorch CPU ~300MB or PyTorch CUDA ~2.4GB). This happens once and is cached in the `huggingface-cache` volume.
+</Note>
+
+## Available Images
+
+Images are automatically built and published to GitHub Container Registry on each release.
+
+| Image | Description | Platforms |
+|-------|-------------|-----------|
+| `ghcr.io/jamiepine/voicebox:latest` | Latest CPU-only release | linux/amd64, linux/arm64 |
+| `ghcr.io/jamiepine/voicebox:0.1.13` | Specific version (CPU) | linux/amd64, linux/arm64 |
+| `ghcr.io/jamiepine/voicebox:latest-cuda` | Latest with NVIDIA GPU support | linux/amd64 |
+| `ghcr.io/jamiepine/voicebox:0.1.13-cuda` | Specific version (CUDA) | linux/amd64 |
+
+<Tip>
+  Pin to a specific version in production to avoid unexpected updates:
+  ```yaml
+  image: ghcr.io/jamiepine/voicebox:0.1.13-cuda
+  ```
+</Tip>
+
+## Docker Compose Examples
+
+### GPU Deployment (Recommended)
+
+```yaml
+version: '3.8'
+
+services:
+  voicebox:
+    image: ghcr.io/jamiepine/voicebox:latest-cuda
+    container_name: voicebox
+    restart: unless-stopped
+    ports:
+      - "8000:8000"
+    volumes:
+      - voicebox-data:/app/data
+      - huggingface-cache:/root/.cache/huggingface
+    environment:
+      - GPU_MEMORY_FRACTION=0.8
+      - LOG_LEVEL=info
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 1
+              capabilities: [gpu]
+
+volumes:
+  voicebox-data:
+  huggingface-cache:
+```
+
+### CPU Deployment
+
+```yaml
+version: '3.8'
+
+services:
+  voicebox:
+    image: ghcr.io/jamiepine/voicebox:latest
+    container_name: voicebox
+    restart: unless-stopped
+    ports:
+      - "8000:8000"
+    volumes:
+      - voicebox-data:/app/data
+      - huggingface-cache:/root/.cache/huggingface
+    environment:
+      - LOG_LEVEL=info
+
+volumes:
+  voicebox-data:
+  huggingface-cache:
+```
+
+## Volume Mounts
+
+<CardGroup cols={2}>
+  <Card title="voicebox-data" icon="database">
+    Stores voice profiles, generated audio, and database
+  </Card>
+  <Card title="huggingface-cache" icon="download">
+    Caches downloaded TTS/Whisper models (saves re-downloading)
+  </Card>
+</CardGroup>
+
+<Warning>
+  Always mount `/app/data` to preserve your voice profiles and generations across container restarts.
+</Warning>
+
+## Environment Variables
+
+Configure Voicebox behavior with environment variables:
+
+| Variable | Default | Description |
+|----------|---------|-------------|
+| `GPU_MEMORY_FRACTION` | `0.9` | Fraction of GPU memory to use (0.0-1.0) |
+| `LOG_LEVEL` | `info` | Logging level: `debug`, `info`, `warning`, `error` |
+| `DATA_DIR` | `/app/data` | Directory for profiles and generations |
+
+Example:
+```bash
+docker run -e GPU_MEMORY_FRACTION=0.8 \
+           -e LOG_LEVEL=debug \
+           -p 8000:8000 \
+           ghcr.io/jamiepine/voicebox:latest-cuda
+```
+
+## Cloud Deployment
+
+### AWS EC2
+
+<Steps>
+  <Step title="Launch GPU Instance">
+    Use g4dn.xlarge or p3.2xlarge with NVIDIA GPU
+  </Step>
+
+  <Step title="Install Docker & NVIDIA Container Toolkit">
+    ```bash
+    # Install Docker
+    curl -fsSL https://get.docker.com -o get-docker.sh
+    sudo sh get-docker.sh
+
+    # Install NVIDIA Container Toolkit
+    distribution=$(. /etc/os-release;echo $ID$VERSION_ID)
+    curl -fsSL https://nvidia.github.io/libnvidia-container/gpgkey | sudo gpg --dearmor -o /usr/share/keyrings/nvidia-container-toolkit-keyring.gpg
+    curl -s -L https://nvidia.github.io/libnvidia-container/$distribution/libnvidia-container.list | \
+      sed 's#deb https://#deb [signed-by=/usr/share/keyrings/nvidia-container-toolkit-keyring.gpg] https://#g' | \
+      sudo tee /etc/apt/sources.list.d/nvidia-container-toolkit.list
+    sudo apt-get update
+    sudo apt-get install -y nvidia-container-toolkit
+    sudo systemctl restart docker
+    ```
+  </Step>
+
+  <Step title="Deploy">
+    ```bash
+    docker run -d --gpus all -p 8000:8000 \
+      -v voicebox-data:/app/data \
+      --restart unless-stopped \
+      ghcr.io/jamiepine/voicebox:latest-cuda
+    ```
+  </Step>
+</Steps>
+
+### DigitalOcean
+
+<Steps>
+  <Step title="Create GPU Droplet">
+    ```bash
+    doctl compute droplet create voicebox \
+      --size gpu-h100x1-80gb \
+      --image ubuntu-22-04-x64 \
+      --region nyc3
+    ```
+  </Step>
+
+  <Step title="SSH and Deploy">
+    ```bash
+    ssh root@<droplet-ip>
+    curl -fsSL https://get.docker.com | sh
+    docker run -d --gpus all -p 80:8000 -v voicebox-data:/app/data \
+      ghcr.io/jamiepine/voicebox:latest-cuda
+    ```
+  </Step>
+</Steps>
+
+### Fly.io
+
+Create `fly.toml`:
+
+```toml
+app = "voicebox"
+
+[build]
+  image = "ghcr.io/jamiepine/voicebox:latest"
+
+[[services]]
+  http_checks = []
+  internal_port = 8000
+  protocol = "tcp"
+
+  [[services.ports]]
+    port = 80
+    handlers = ["http"]
+
+  [[services.ports]]
+    port = 443
+    handlers = ["tls", "http"]
+
+[mounts]
+  source = "voicebox_data"
+  destination = "/app/data"
+```
+
+Deploy:
+```bash
+fly launch
+fly deploy
+```
+
+## Updates
+
+Docker images are automatically built and published on each GitHub release.
+
+<Tabs>
+  <Tab title="Latest Tag">
+    Always get the newest version:
+
+    ```bash
+    docker compose pull
+    docker compose up -d
+    ```
+  </Tab>
+
+  <Tab title="Pinned Version">
+    Update to a specific version:
+
+    ```yaml
+    services:
+      voicebox:
+        image: ghcr.io/jamiepine/voicebox:0.1.13-cuda
+    ```
+
+    ```bash
+    docker compose pull
+    docker compose up -d
+    ```
+  </Tab>
+
+  <Tab title="Automatic Updates">
+    Use Watchtower for automatic updates:
+
+    ```yaml
+    services:
+      voicebox:
+        image: ghcr.io/jamiepine/voicebox:latest-cuda
+        # ... other config ...
+
+      watchtower:
+        image: containrrr/watchtower
+        volumes:
+          - /var/run/docker.sock:/var/run/docker.sock
+        command: --interval 3600 # Check hourly
+    ```
+  </Tab>
+</Tabs>
+
+## GPU Requirements
+
+### NVIDIA GPU
+
+Requires:
+- **Docker version:** 19.03+
+- **NVIDIA Driver:** 525.60.13+ on Linux hosts (minimum for the CUDA 12.x images)
+- **NVIDIA Container Toolkit:** Installed and configured
+
+Verify GPU access:
+```bash
+docker run --rm --gpus all nvidia/cuda:12.1.1-base-ubuntu22.04 nvidia-smi
+```
+
+If this works, Voicebox will detect and use your GPU automatically.
+
+### AMD GPU (ROCm)
+
+AMD GPU support via ROCm is not currently available in pre-built images. If you need ROCm support, build a custom image from a ROCm base image using the PyTorch ROCm builds.
+
+## Troubleshooting
+
+### GPU Not Detected
+
+<Accordion title="Check NVIDIA Docker">
+  ```bash
+  # Verify NVIDIA Container Toolkit is installed
+  docker run --rm --gpus all nvidia/cuda:12.1.1-base-ubuntu22.04 nvidia-smi
+  ```
+
+  If this fails, reinstall NVIDIA Container Toolkit.
+</Accordion>
+
+<Accordion title="Insufficient GPU Memory">
+  Reduce GPU memory usage:
+
+  ```bash
+  docker run -e GPU_MEMORY_FRACTION=0.5 \
+    --gpus all -p 8000:8000 \
+    ghcr.io/jamiepine/voicebox:latest-cuda
+  ```
+
+  Or use CPU-only mode:
+  ```bash
+  docker run -p 8000:8000 \
+    ghcr.io/jamiepine/voicebox:latest
+  ```
+</Accordion>
+
+<Accordion title="Port Already in Use">
+  Change the host port:
+
+  ```bash
+  docker run -p 8080:8000 ghcr.io/jamiepine/voicebox:latest
+  ```
+
+  Then open http://localhost:8080
+</Accordion>
+
+<Accordion title="Permission Errors">
+  Run with specific user:
+
+  ```bash
+  docker run --user $(id -u):$(id -g) \
+    -v $(pwd)/data:/app/data \
+    ghcr.io/jamiepine/voicebox:latest
+  ```
+</Accordion>
+
+## Building From Source
+
+If you need to customize the Docker image:
+
+```bash
+# Clone the repo
+git clone https://github.com/jamiepine/voicebox.git
+cd voicebox
+
+# Build web UI
+bun install
+cd web && bun run build && cd ..
+
+# Build Docker image
+docker build -t voicebox:custom .
+
+# Or CUDA variant
+docker build -f Dockerfile.cuda -t voicebox:custom-cuda .
+```
+
+## Next Steps
+
+<CardGroup cols={2}>
+  <Card title="API Reference" icon="code" href="/api/overview">
+    Integrate Voicebox into your applications
+  </Card>
+  <Card title="Remote Mode" icon="server" href="/overview/remote-mode">
+    Connect desktop app to Docker backend
+  </Card>
+</CardGroup>
diff --git a/docs/overview/installation.mdx b/docs/overview/installation.mdx
index 04ddc5ba..2b1a410b 100644
--- a/docs/overview/installation.mdx
+++ b/docs/overview/installation.mdx
@@ -5,15 +5,21 @@ description: "Download and install Voicebox on macOS, Windows, or Linux"
 
 ## Download
 
-Voicebox is available for macOS and Windows, with Linux builds coming soon.
+Voicebox is available for macOS, Windows, and Linux.
 
-<CardGroup cols={2}>
+<CardGroup cols={4}>
   <Card title="macOS" icon="apple">
     Download for Apple Silicon or Intel Macs
   </Card>
   <Card title="Windows" icon="windows">
     Download MSI installer or Setup executable
   </Card>
+  <Card title="Linux" icon="linux">
+    Download AppImage or Deb package
+  </Card>
+  <Card title="Docker" icon="docker" href="/overview/docker">
+    Run with web UI in a container
+  </Card>
 </CardGroup>
 
 ### macOS
@@ -60,8 +66,33 @@ Voicebox is available for macOS and Windows, with Linux builds coming soon.
 
 ### Linux
 
+<Tabs>
+  <Tab title="AppImage">
+    Download: [voicebox_x86_64.AppImage](https://github.com/jamiepine/voicebox/releases/latest)
+
+    ```bash
+    # Make executable
+    chmod +x voicebox_x86_64.AppImage
+
+    # Run
+    ./voicebox_x86_64.AppImage
+    ```
+  </Tab>
+  <Tab title="Debian/Ubuntu">
+    Download: [voicebox_amd64.deb](https://github.com/jamiepine/voicebox/releases/latest)
+
+    ```bash
+    # Install
+    sudo dpkg -i voicebox_amd64.deb
+
+    # Run
+    voicebox
+    ```
+  </Tab>
+</Tabs>
+
 <Note>
-  Linux builds are coming soon. Currently blocked by GitHub runner disk space limitations.
+  For headless server deployments, use [Docker](/overview/docker) instead of the desktop app.
 </Note>
 
 ## First Launch
diff --git a/docs/plans/DOCKER_DEPLOYMENT.md b/docs/plans/DOCKER_DEPLOYMENT.md
index 6af65ed7..6312ed41 100644
--- a/docs/plans/DOCKER_DEPLOYMENT.md
+++ b/docs/plans/DOCKER_DEPLOYMENT.md
@@ -1,24 +1,31 @@
 # Docker Deployment Guide
 
-**Status:** In Development for v0.2.0
-**Requested By:** Reddit community ([thread](https://reddit.com/r/LocalLLaMA/...))
+**Status:** Implemented
+**Images:** `ghcr.io/jamiepine/voicebox`
 
 ## Overview
 
-Docker support makes Voicebox easier to deploy, especially for:
+Voicebox is available as Docker images with the full web UI included. Images are automatically built and published to GitHub Container Registry on each release.
 
-- **Consistent Environments**: Same setup across dev/staging/prod
-- **GPU Passthrough**: Easy NVIDIA/AMD GPU access
+**What's included:**
+- FastAPI backend with all TTS/Whisper capabilities
+- Complete web UI (same React app as the Tauri desktop version)
+- Provider download system (downloads TTS providers on first use, just like desktop)
+- Multi-architecture support (amd64, arm64 for CPU variant)
+
+Docker support is ideal for:
 - **Server Deployments**: Run on headless Linux servers
-- **Multi-User Setups**: Isolate instances per user/team
+- **GPU Passthrough**: Easy NVIDIA GPU access
+- **Consistent Environments**: Same setup across dev/staging/prod
 - **Cloud Platforms**: Deploy to AWS, GCP, Azure, DigitalOcean
+- **Multi-User Setups**: Isolate instances per user/team
 
 ## Quick Start
 
 ### Using Pre-Built Images (Recommended)
 
 ```bash
-# CPU-only version
+# CPU-only version (supports amd64 and arm64)
 docker run -p 8000:8000 -v voicebox-data:/app/data \
   ghcr.io/jamiepine/voicebox:latest
 
@@ -26,184 +33,80 @@ docker run -p 8000:8000 -v voicebox-data:/app/data \
 docker run --gpus all -p 8000:8000 -v voicebox-data:/app/data \
   ghcr.io/jamiepine/voicebox:latest-cuda
 
-# AMD GPU version (experimental)
-docker run --device=/dev/kfd --device=/dev/dri -p 8000:8000 \
-  -v voicebox-data:/app/data \
-  ghcr.io/jamiepine/voicebox:latest-rocm
+# Specific version (pinned for stability)
+docker run -p 8000:8000 -v voicebox-data:/app/data \
+  ghcr.io/jamiepine/voicebox:0.1.13
 ```
 
 Then open: `http://localhost:8000`
 
-### Using Docker Compose (Easiest)
+The web UI will load automatically. On first use, you'll be prompted to download a TTS provider (PyTorch CPU ~300MB or PyTorch CUDA ~2.4GB).
 
-Create `docker-compose.yml`:
+### Using Docker Compose (Easiest)
 
-```yaml
-version: '3.8'
+Use the provided `docker-compose.yml` (CUDA) or `docker-compose.cpu.yml` in the repository root:
 
-services:
-  voicebox:
-    image: ghcr.io/jamiepine/voicebox:latest-cuda
-    ports:
-      - "8000:8000"
-    volumes:
-      - voicebox-data:/app/data
-      - huggingface-cache:/root/.cache/huggingface
-    environment:
-      - GPU_MEMORY_FRACTION=0.8  # Use 80% of GPU memory
-      - TTS_MODE=local
-      - WHISPER_MODE=local
-    deploy:
-      resources:
-        reservations:
-          devices:
-            - driver: nvidia
-              count: 1
-              capabilities: [gpu]
+```bash
+# CUDA (default)
+docker compose up -d
 
-volumes:
-  voicebox-data:
-  huggingface-cache:
+# Or CPU-only
+docker compose -f docker-compose.cpu.yml up -d
 ```
 
-Run:
-```bash
-docker compose up -d
+To pin to a specific version, edit the compose file:
+```yaml
+services:
+  voicebox:
+    image: ghcr.io/jamiepine/voicebox:0.1.13-cuda  # Pinned version
 ```
 
 ## Building From Source
 
-### Basic Dockerfile
-
-```dockerfile
-# Dockerfile
-FROM python:3.11-slim
-
-WORKDIR /app
-
-# Install system dependencies
-RUN apt-get update && apt-get install -y \
-    git \
-    build-essential \
-    ffmpeg \
-    && rm -rf /var/lib/apt/lists/*
-
-# Copy application
-COPY backend/ /app/backend/
-COPY requirements.txt /app/
-
-# Install Python dependencies
-RUN pip install --no-cache-dir -r requirements.txt
-RUN pip install --no-cache-dir git+https://github.com/QwenLM/Qwen3-TTS.git
-
-# Create data directory
-RUN mkdir -p /app/data
-
-# Expose port
-EXPOSE 8000
-
-# Run server
-CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000"]
-```
+See `Dockerfile` and `Dockerfile.cuda` in the repository root.
 
 Build and run:
 ```bash
-docker build -t voicebox .
-docker run -p 8000:8000 -v $(pwd)/data:/app/data voicebox
-```
-
-### Multi-Stage Build (Optimized)
-
-Smaller image size by separating build and runtime:
-
-```dockerfile
-# Dockerfile.optimized
-# Stage 1: Build dependencies
-FROM python:3.11-slim AS builder
-
-WORKDIR /build
-
-RUN apt-get update && apt-get install -y \
-    git build-essential && \
-    rm -rf /var/lib/apt/lists/*
-
-COPY backend/requirements.txt .
-RUN pip install --no-cache-dir --target=/build/packages \
-    -r requirements.txt
-
-RUN pip install --no-cache-dir --target=/build/packages \
-    git+https://github.com/QwenLM/Qwen3-TTS.git
-
-# Stage 2: Runtime
-FROM python:3.11-slim
-
-WORKDIR /app
-
-# Install only runtime dependencies
-RUN apt-get update && apt-get install -y \
-    ffmpeg \
-    && rm -rf /var/lib/apt/lists/*
+# Build web UI first
+bun install
+cd web && bun run build && cd ..
 
-# Copy installed packages from builder
-COPY --from=builder /build/packages /usr/local/lib/python3.11/site-packages/
-
-# Copy application code
-COPY backend/ /app/backend/
+# Build CPU image
+docker build -t voicebox .
+docker run -p 8000:8000 -v voicebox-data:/app/data voicebox
 
-# Create data directory
-RUN mkdir -p /app/data
+# Or build CUDA image
+docker build -f Dockerfile.cuda -t voicebox:cuda .
+docker run --gpus all -p 8000:8000 -v voicebox-data:/app/data voicebox:cuda
+```
 
-EXPOSE 8000
+### Architecture
 
-CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000"]
-```
+The Docker images include:
+- **Backend**: FastAPI server with TTS/Whisper endpoints
+- **Web UI**: Pre-built React app served as static files from the backend
+- **Provider System**: Downloads PyTorch CPU/CUDA providers on first use (same UX as desktop app)
 
-Build:
-```bash
-docker build -f Dockerfile.optimized -t voicebox:slim .
-```
+Images are automatically built on release and tagged with both version number and `latest`.
 
 ## GPU Support
 
 ### NVIDIA GPUs (CUDA)
 
-**Dockerfile:**
-```dockerfile
-FROM nvidia/cuda:12.1.0-runtime-ubuntu22.04
-
-# Install Python
-RUN apt-get update && apt-get install -y \
-    python3.11 python3-pip git ffmpeg && \
-    rm -rf /var/lib/apt/lists/*
-
-WORKDIR /app
-
-# Install PyTorch with CUDA support
-COPY backend/requirements.txt .
-RUN pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121
-
-# Install other dependencies
-RUN pip3 install -r requirements.txt
-RUN pip3 install git+https://github.com/QwenLM/Qwen3-TTS.git
-
-COPY backend/ /app/backend/
-
-EXPOSE 8000
-CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000"]
-```
+The CUDA image includes PyTorch with CUDA 12.1 support:
 
 **Run with GPU:**
 ```bash
 docker run --gpus all -p 8000:8000 \
   -v voicebox-data:/app/data \
-  voicebox:cuda
+  ghcr.io/jamiepine/voicebox:latest-cuda
 ```
 
 **Docker Compose with GPU:**
 ```yaml
 services:
   voicebox:
-    image: voicebox:cuda
+    image: ghcr.io/jamiepine/voicebox:latest-cuda
     deploy:
       resources:
         reservations:
@@ -213,47 +116,9 @@ services:
               capabilities: [gpu]
 ```
 
-### AMD GPUs (ROCm) - Experimental
-
-**Dockerfile:**
-```dockerfile
-FROM rocm/dev-ubuntu-22.04:6.0
-
-# Install Python
-RUN apt-get update && apt-get install -y \
-    python3.11 python3-pip git ffmpeg && \
-    rm -rf /var/lib/apt/lists/*
+### AMD GPUs (ROCm)
 
-WORKDIR /app
-
-# Install PyTorch with ROCm support
-COPY backend/requirements.txt .
-RUN pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/rocm6.0
-
-# Install other dependencies
-RUN pip3 install -r requirements.txt
-RUN pip3 install git+https://github.com/QwenLM/Qwen3-TTS.git
-
-# Set ROCm environment variables
-ENV HSA_OVERRIDE_GFX_VERSION=10.3.0
-ENV ROCM_PATH=/opt/rocm
-
-COPY backend/ /app/backend/
-
-EXPOSE 8000
-CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000"]
-```
-
-**Run with AMD GPU:**
-```bash
-docker run --device=/dev/kfd --device=/dev/dri \
-  --group-add video --ipc=host --cap-add=SYS_PTRACE \
-  --security-opt seccomp=unconfined \
-  -p 8000:8000 -v voicebox-data:/app/data \
-  voicebox:rocm
-```
-
-**Note:** ROCm support varies by GPU model. Works best on Linux. See [AMD ROCm docs](https://rocm.docs.amd.com) for compatibility.
+ROCm support is not currently available in pre-built images. If you need ROCm, build a custom image using the ROCm base and PyTorch ROCm builds.
 
 ## Volume Mounts
 
@@ -734,13 +599,27 @@ docker logs -f voicebox
 docker compose logs -f voicebox
 ```
 
-## Next Steps
+## Updates
+
+Docker images are automatically built and published on each GitHub release. To update:
+
+```bash
+# Pull latest
+docker compose pull
+docker compose up -d
+
+# Or pin to a specific version
+docker pull ghcr.io/jamiepine/voicebox:0.1.13
+```
+
+For automatic updates, use [Watchtower](https://containrrr.dev/watchtower/).
+
+## Future Enhancements
 
-- [ ] Publish official images to GitHub Container Registry
-- [ ] Add Kubernetes Helm charts
-- [ ] Create Docker Desktop extension
-- [ ] Add automated vulnerability scanning
-- [ ] Support ARM64 builds for Raspberry Pi / Apple Silicon
+- Kubernetes Helm charts
+- Docker Desktop extension
+- Automated vulnerability scanning
+- ROCm image variant
 
 ## Contributing
 
diff --git a/docs/plans/TTS_PROVIDER_ARCHITECTURE.md b/docs/plans/TTS_PROVIDER_ARCHITECTURE.md
index 8d35a7e5..14d87317 100644
--- a/docs/plans/TTS_PROVIDER_ARCHITECTURE.md
+++ b/docs/plans/TTS_PROVIDER_ARCHITECTURE.md
@@ -10,14 +10,17 @@
 
 Split the monolithic backend into modular components:
 
-1. **Main App** (~150-200MB): Tauri + FastAPI backend + Whisper + UI/profiles/history
-2. **TTS Providers** (downloadable plugins): Separate executables for model inference
+1. **Main App**:
+   - Windows/Linux (~150MB): Tauri + FastAPI backend + Whisper + UI/profiles/history
+   - macOS (~300MB): Same + MLX bundled for simplicity
+2. **TTS Providers** (Windows/Linux only): Downloadable executables for PyTorch CPU/CUDA inference
 
 This architecture solves:
 
 - ✅ GitHub 2GB release artifact limit
-- ✅ Frequent app updates without re-downloading large python binaries
-- ✅ User choice of compute backend (CPU/GPU/Cloud)
+- ✅ Frequent app updates without re-downloading large Python binaries (Windows/Linux)
+- ✅ User choice of compute backend (CPU/GPU/Cloud) on Windows/Linux
+- ✅ Simplified out-of-the-box experience on macOS
 - ✅ External provider support (OpenAI, custom servers)
 - ✅ Future extensibility
 
@@ -25,6 +28,7 @@ This architecture solves:
 
 ## Architecture Diagram
 
+### Windows / Linux
 ```
 ┌─────────────────────────────────────────────────────────┐
 │  Voicebox App (Tauri + Backend)           ~150MB        │
@@ -39,27 +43,43 @@ This architecture solves:
                                           │
                             HTTP/IPC      │
                                           │
-         ┌────────────────────────────────┼─────────────────┐
-         │                                │                 │
-         ▼                                ▼                 ▼
-┌─────────────────┐      ┌─────────────────┐   ┌──────────────────┐
-│ TTS Provider:   │      │ TTS Provider:   │   │ TTS Provider:    │
-│ PyTorch CPU     │      │ PyTorch CUDA    │   │ MLX (Apple)      │
-│                 │      │                 │   │                  │
-│ ~300MB          │      │ ~2.4GB          │   │ ~800MB           │
-│                 │      │                 │   │                  │
-│ Local inference │      │ GPU inference   │   │ Metal inference  │
-└─────────────────┘      └─────────────────┘   └──────────────────┘
-         │                        │                     │
-         └────────────────────────┴─────────────────────┘
-                                  │
-                    ┌─────────────▼──────────────┐
-                    │  Future Providers:         │
-                    │  • Remote Server           │
-                    │  • OpenAI API              │
-                    │  • ElevenLabs              │
-                    │  • Custom Docker Container │
-                    └────────────────────────────┘
+                    ┌─────────────────────┴─────────────────┐
+                    │                                       │
+                    ▼                                       ▼
+       ┌─────────────────────┐              ┌─────────────────────┐
+       │ TTS Provider:       │              │ TTS Provider:       │
+       │ PyTorch CPU         │              │ PyTorch CUDA        │
+       │                     │              │                     │
+       │ ~300MB              │              │ ~2.4GB              │
+       │                     │              │                     │
+       │ Local inference     │              │ GPU inference       │
+       └─────────────────────┘              └─────────────────────┘
+                    │                                       │
+                    └───────────────┬───────────────────────┘
+                                    │
+                      ┌─────────────▼──────────────┐
+                      │  Future Providers:         │
+                      │  • Remote Server           │
+                      │  • OpenAI API              │
+                      │  • ElevenLabs              │
+                      │  • Custom Docker Container │
+                      └────────────────────────────┘
+```
+
+### macOS
+```
+┌─────────────────────────────────────────────────────────┐
+│  Voicebox App (Tauri + Backend)           ~300MB        │
+│  ├─ UI Layer (React)                                    │
+│  ├─ Backend (FastAPI)                                   │
+│  │  ├─ Voice Profiles                                   │
+│  │  ├─ Generation History                               │
+│  │  ├─ Audio Editing / Stories                          │
+│  │  └─ MLX Backend (bundled)                            │
+│  └─ Whisper (bundled, tiny ~50MB)                       │
+│                                                          │
+│  No provider downloads needed - works out of the box    │
+└─────────────────────────────────────────────────────────┘
 ```
 
 ---
@@ -91,18 +111,20 @@ This architecture solves:
 
 #### 1. Main App (voicebox.exe / .app / .AppImage)
 
-**Size:** ~100-150MB
+**Windows/Linux Size:** ~100-150MB
+**macOS Size:** ~300-350MB (includes MLX)
 
 **Includes:**
 
 - Tauri runtime + React UI
-- FastAPI backend (pure Python, no PyTorch)
+- FastAPI backend (pure Python, no PyTorch on Windows/Linux)
 - Whisper model (tiny, ~50MB)
 - SQLite database
 - Profile/history/audio editing logic
-- Provider management system
+- Provider management system (Windows/Linux only)
+- **MLX backend (macOS only, bundled)**
 
-**Does NOT include:**
+**Does NOT include (Windows/Linux only):**
 
 - PyTorch (CPU or CUDA)
 - TTS models (Qwen3-TTS)
@@ -147,23 +169,7 @@ This architecture solves:
 
 ---
 
-#### 4. TTS Provider: MLX
-
-**Binary:** `tts-provider-mlx`
-**Size:** ~150MB
-
-**Includes:**
-
-- MLX framework
-- MLX-optimized Qwen3-TTS
-- Metal acceleration
-
-**Platform:** macOS only (Apple Silicon)
-**Download source:** Cloudflare R2
-
----
-
-#### 5. TTS Provider: Remote
+#### 4. TTS Provider: Remote
 
 **Binary:** None (built-in config)
 **Size:** 0MB
@@ -182,7 +188,7 @@ This architecture solves:
 
 ---
 
-#### 6. TTS Provider: OpenAI
+#### 5. TTS Provider: OpenAI
 
 **Binary:** None (API wrapper)
 **Size:** 0MB
@@ -296,7 +302,10 @@ Model status.
 
 ```python
 class ProviderManager:
-    """Manages TTS provider lifecycle."""
+    """Manages TTS provider lifecycle (Windows/Linux only).
+
+    Note: macOS uses bundled MLX backend directly, no provider management needed.
+    """
 
     def __init__(self):
         self.active_provider: Optional[Provider] = None
@@ -308,8 +317,6 @@ class ProviderManager:
             return await self._start_local_provider("tts-provider-pytorch-cpu.exe")
         elif provider_type == "pytorch-cuda":
             return await self._start_local_provider("tts-provider-pytorch-cuda.exe")
-        elif provider_type == "mlx":
-            return await self._start_local_provider("tts-provider-mlx")
         elif provider_type == "remote":
             return self.config["remote_url"]
         elif provider_type == "openai":
@@ -434,15 +441,14 @@ class OpenAIProvider(TTSProvider):
 
 ```python
 class ProviderInstaller:
-    """Handles provider download and installation."""
+    """Handles provider download and installation (Windows/Linux only)."""
 
     async def download_provider(self, provider_type: str):
         """Download provider binary from R2."""
 
         binary_name = {
             "pytorch-cpu": "tts-provider-pytorch-cpu.exe",
-            "pytorch-cuda": "tts-provider-pytorch-cuda.exe",
-            "mlx": "tts-provider-mlx"
+            "pytorch-cuda": "tts-provider-pytorch-cuda.exe"
         }[provider_type]
 
         download_url = f"https://downloads.voicebox.sh/providers/v{PROVIDER_VERSION}/{binary_name}"
@@ -525,44 +531,38 @@ export function ProviderSettings() {
 						)}
 					</div>
 
-					{/* PyTorch CPU */}
-					<div className="flex items-center justify-between">
-						<div className="flex items-center space-x-2">
-							<RadioGroupItem value="pytorch-cpu" id="cpu" />
-							<Label htmlFor="cpu">
-								<div className="font-medium">PyTorch CPU</div>
-								<div className="text-sm text-muted-foreground">
-									Works on any system, slower inference
-								</div>
-							</Label>
-						</div>
-						{!installedProviders?.includes("pytorch-cpu") && (
-							<Button onClick={() => downloadProvider("pytorch-cpu")} size="sm">
-								Download (300MB)
-							</Button>
-						)}
-					</div>
-
-					{/* MLX (macOS only) */}
-					{isMacOS && (
+					{/* PyTorch CPU (Windows/Linux only) */}
+					{!isMacOS && (
 						<div className="flex items-center justify-between">
 							<div className="flex items-center space-x-2">
-								<RadioGroupItem value="mlx" id="mlx" />
-								<Label htmlFor="mlx">
-									<div className="font-medium">MLX (Apple Silicon)</div>
+								<RadioGroupItem value="pytorch-cpu" id="cpu" />
+								<Label htmlFor="cpu">
+									<div className="font-medium">PyTorch CPU</div>
 									<div className="text-sm text-muted-foreground">
-										Optimized for M1/M2/M3 chips
+										Works on any system, slower inference
 									</div>
 								</Label>
 							</div>
-							{!installedProviders?.includes("mlx") && (
-								<Button onClick={() => downloadProvider("mlx")} size="sm">
-									Download (800MB)
+							{!installedProviders?.includes("pytorch-cpu") && (
+								<Button onClick={() => downloadProvider("pytorch-cpu")} size="sm">
+									Download (300MB)
 								</Button>
 							)}
 						</div>
 					)}
 
+					{/* MLX bundled (macOS only) */}
+					{isMacOS && (
+						<div className="p-3 bg-muted rounded-md">
+							<div className="text-sm">
+								<div className="font-medium">MLX (Apple Silicon)</div>
+								<div className="text-muted-foreground mt-1">
+									Bundled with the app - optimized for M1/M2/M3 chips
+								</div>
+							</div>
+						</div>
+					)}
+
 					{/* Remote */}
 					<div className="space-y-2">
 						<div className="flex items-center space-x-2">
@@ -608,14 +608,18 @@ export function ProviderSettings() {
 ```
 voicebox/
 ├── backend/
-│   ├── main.py                    # Main FastAPI app (no TTS code)
+│   ├── main.py                    # Main FastAPI app (no TTS on Win/Linux)
+│   ├── backends/
+│   │   ├── __init__.py            # Backend abstraction (existing)
+│   │   ├── pytorch_backend.py     # PyTorch backend (existing, for reference)
+│   │   └── mlx_backend.py         # MLX backend (bundled in macOS build only)
 │   ├── providers/
-│   │   ├── __init__.py            # ProviderManager
-│   │   ├── base.py                # TTSProvider ABC
+│   │   ├── __init__.py            # ProviderManager (Windows/Linux)
+│   │   ├── base.py                # TTSProvider Protocol
 │   │   ├── local.py               # LocalProvider (subprocess)
 │   │   ├── remote.py              # RemoteProvider (HTTP)
 │   │   ├── openai.py              # OpenAIProvider (API wrapper)
-│   │   └── installer.py           # Provider download logic
+│   │   └── installer.py           # Provider download logic (Windows/Linux)
 │   ├── profiles.py                # Voice profile management
 │   ├── history.py                 # Generation history
 │   ├── transcribe.py              # Whisper (still bundled)
@@ -628,27 +632,22 @@ voicebox/
 │   │   ├── requirements.txt       # torch (CPU), qwen-tts, transformers
 │   │   └── build.spec             # PyInstaller spec
 │   │
-│   ├── pytorch-cuda/
-│   │   ├── main.py                # FastAPI server for TTS
-│   │   ├── tts_backend.py         # PyTorch TTS logic
-│   │   ├── requirements.txt       # torch+cu121, qwen-tts, transformers
-│   │   └── build.spec             # PyInstaller spec
-│   │
-│   └── mlx/
+│   └── pytorch-cuda/
 │       ├── main.py                # FastAPI server for TTS
-│       ├── mlx_backend.py         # MLX TTS logic
-│       ├── requirements.txt       # mlx, qwen-tts-mlx
+│       ├── tts_backend.py         # PyTorch TTS logic
+│       ├── requirements.txt       # torch+cu121, qwen-tts, transformers
 │       └── build.spec             # PyInstaller spec
 │
 ├── app/                           # Frontend (Tauri + React)
 │   └── src/
 │       └── components/
 │           └── ServerSettings/
-│               └── ProviderSettings.tsx
+│               └── ProviderSettings.tsx  # Only shown on Windows/Linux
 │
 └── tauri/
     └── src-tauri/
-        └── tauri.conf.json        # No externalBin for providers
+        └── tauri.conf.json        # No externalBin for providers (Windows/Linux)
+                                   # MLX bundled in macOS build
 ```
 
 ---
@@ -671,33 +670,35 @@ voicebox/
 
 ### Phase 2: Build Provider Binaries
 
-**Goal:** Create standalone TTS provider executables
+**Goal:** Create standalone TTS provider executables (Windows/Linux only)
 
 1. Create separate PyInstaller specs for each provider
 2. Build provider executables:
    - `tts-provider-pytorch-cpu.exe` (~300MB)
    - `tts-provider-pytorch-cuda.exe` (~2.4GB)
-   - `tts-provider-mlx` (~800MB, macOS)
 3. Test subprocess communication
 4. Upload providers to Cloudflare R2
 
 **Result:** Provider binaries exist but aren't used yet
 
+**Note:** macOS keeps MLX bundled in main app - no separate provider needed
+
 ---
 
 ### Phase 3: Remove PyTorch from Main App
 
-**Goal:** Split main app from providers
+**Goal:** Split main app from providers (Windows/Linux only)
 
-1. Exclude PyTorch/Qwen3-TTS from main app PyInstaller spec
-2. Main app now requires provider download
+1. Exclude PyTorch/Qwen3-TTS from Windows/Linux main app PyInstaller spec
+2. Windows/Linux app now requires provider download
 3. Update GitHub CI to build multiple artifacts:
-   - `voicebox-{version}-{platform}.exe` (~150MB)
+   - `voicebox-{version}-windows.exe` (~150MB, no TTS)
+   - `voicebox-{version}-linux.AppImage` (~150MB, no TTS)
+   - `voicebox-{version}-macos.app` (~300MB, MLX bundled)
    - `tts-provider-pytorch-cpu-{version}.exe`
    - `tts-provider-pytorch-cuda-{version}.exe`
-   - `tts-provider-mlx-{version}` (macOS)
 
-**Result:** Main app is small, providers downloaded separately
+**Result:** Windows/Linux apps are small with downloadable providers, macOS app is self-contained
 
 ---
 
@@ -767,7 +768,7 @@ async def check_provider_compatibility(provider_version: str) -> bool:
 
 ## User Flows
 
-### First-Time Setup
+### First-Time Setup (Windows/Linux)
 
 1. User downloads and installs Voicebox (~150MB)
 2. App launches → detects no TTS provider installed
@@ -784,10 +785,6 @@ async def check_provider_compatibility(provider_version: str) -> bool:
        ✓ Works on any system
        ✗ Slower inference
 
-   [ ] MLX (800MB)             [Download]
-       ✓ Fast on Apple Silicon
-       ✗ macOS only (M1/M2/M3)
-
    [ ] Remote Server
        URL: ___________________
 
@@ -799,19 +796,31 @@ async def check_provider_compatibility(provider_version: str) -> bool:
 5. Provider installs to AppData/Application Support
 6. App starts provider → ready to use
 
+### First-Time Setup (macOS)
+
+1. User downloads and installs Voicebox (~300MB with MLX bundled)
+2. App launches → MLX backend is ready immediately
+3. No provider setup needed - works out of the box
+
 ---
 
 ### App Update Flow (No Provider Change)
 
 **Scenario:** Bug fix in UI, no backend changes
 
+**Windows/Linux:**
 1. User gets update notification: "Voicebox v0.2.1 available"
 2. Downloads update (~150MB, not 2.4GB!)
 3. Installs and restarts
 4. **Provider stays the same** (no re-download needed)
 5. App starts using existing provider
 
-**User experience:** Fast updates, no multi-GB downloads
+**macOS:**
+1. User gets update notification: "Voicebox v0.2.1 available"
+2. Downloads update (~300MB with MLX bundled)
+3. Installs and restarts - ready to use
+
+**User experience:** Fast updates, no multi-GB downloads (especially for CUDA users)
 
 ---
 
@@ -846,9 +855,10 @@ async def check_provider_compatibility(provider_version: str) -> bool:
 
 | Benefit                       | Details                                                   |
 | ----------------------------- | --------------------------------------------------------- |
-| **GitHub Releases Work**      | Main app ~150MB << 2GB limit                              |
+| **GitHub Releases Work**      | Main app ~150MB (Win/Linux), ~300MB (macOS) << 2GB limit  |
 | **Fast Updates**              | UI/feature updates don't require re-downloading providers |
-| **User Choice**               | CPU, CUDA, MLX, OpenAI, remote server                     |
+| **User Choice**               | CPU, CUDA, OpenAI, remote server (Win/Linux)              |
+| **macOS Simplicity**          | MLX bundled - works immediately, no provider setup needed |
 | **External Provider Support** | Users can run their own TTS servers                       |
 | **Bandwidth Savings**         | Only download provider once, app updates are small        |
 | **Future-Proof**              | Easy to add new providers (ElevenLabs, custom models)     |
diff --git a/docs2/MIGRATION.md b/docs2/MIGRATION.md
new file mode 100644
index 00000000..98f2be32
--- /dev/null
+++ b/docs2/MIGRATION.md
@@ -0,0 +1,94 @@
+# Documentation Migration: Mintlify → Fumadocs
+
+This document summarizes the migration of documentation from `/docs` (Mintlify) to `/docs2` (Fumadocs).
+
+## What Was Done
+
+### 1. Files Copied
+
+- ✅ All 29 MDX files from the `/docs` folders (overview, api, developer), plus the 4 Markdown files in `plans`
+- ✅ All 4 root-level markdown files (AUTOUPDATER.md, AUTOUPDATER_QUICKSTART.md, TROUBLESHOOTING.md, README.md)
+- ✅ All images (3 webp files) → `public/images/`
+- ✅ All logo files (2 png files) → `public/logo/`
+
+### 2. Component Migration
+
+Created compatibility layer in `components/mintlify-compat.tsx` that maps Mintlify components to Fumadocs equivalents:
+
+- `<Frame>` → Simple div wrapper (images are zoomable by default in Fumadocs)
+- `<CardGroup>` → `<Cards>` (Fumadocs component)
+- `<Card>` → `<Card>` (with icon string → Lucide icon mapping)
+- `<Steps>` / `<Step>` → Direct mapping to Fumadocs components
+- `<Tip>`, `<Note>`, `<Info>` → `<Callout type="info">`
+- `<Warning>` → `<Callout type="warn">`
+- `<Danger>` → `<Callout type="error">`
+- `<AccordionGroup>` / `<Accordion>` → HTML `<details>` / `<summary>` elements
+
+### 3. Navigation Structure
+
+Created `meta.json` files for each folder:
+
+- `content/docs/meta.json` - Root documentation
+- `content/docs/overview/meta.json` - Overview pages
+- `content/docs/api/meta.json` - API reference
+- `content/docs/developer/meta.json` - Developer docs
+- `content/docs/plans/meta.json` - Plans/roadmap
+
+### 4. Link Fixes
+
+- Fixed incorrect `/guides/...` paths → `/overview/...`
+- All internal links now use correct paths
+
+### 5. Branding
+
+- Updated `lib/layout.shared.tsx` to use "Voicebox" as the nav title
+
+## File Structure
+
+```
+docs2/
+├── components/
+│   └── mintlify-compat.tsx    # Mintlify → Fumadocs component mappings
+├── content/docs/
+│   ├── meta.json              # Root navigation
+│   ├── overview/              # 12 MDX files
+│   ├── api/                   # 5 MDX files
+│   ├── developer/             # 12 MDX files
+│   ├── plans/                 # 4 MD files
+│   └── *.md                   # 4 root markdown files
+├── public/
+│   ├── images/                # 3 webp files
+│   └── logo/                  # 2 png files
+└── mdx-components.tsx         # MDX component configuration
+```
+
+## Icon Mapping
+
+The following icon strings are mapped to Lucide icons:
+
+- `microphone` → Mic
+- `film` → Film
+- `code` → Code
+- `shield` → Shield
+- `download` → Download
+- `rocket` → Rocket
+- `apple` → Apple
+- `windows` → Windows
+- `server` → Server
+- `user` → User
+- `waveform` → Waveform
+
+## Next Steps
+
+1. **Test the build**: Run `npm run build` (requires Node.js >= 20.9.0)
+2. **Start dev server**: Run `npm run dev` to preview
+3. **Customize styling**: Update `app/global.css` if needed
+4. **Add more icons**: Extend `iconMap` in `mintlify-compat.tsx` as needed
+5. **Review navigation**: Adjust `meta.json` files to customize page order
+
+## Notes
+
+- Image paths (`/images/...`) work as-is since Next.js serves from `public/`
+- All Mintlify components are now compatible with Fumadocs
+- Navigation structure follows Fumadocs conventions
+- No breaking changes to content - all MDX files work with compatibility layer
diff --git a/docs2/content/docs/AUTOUPDATER.md b/docs2/content/docs/AUTOUPDATER.md
new file mode 100644
index 00000000..76148c52
--- /dev/null
+++ b/docs2/content/docs/AUTOUPDATER.md
@@ -0,0 +1,203 @@
+---
+title: "Auto-Updater Documentation"
+description: "How Voicebox automatic updates work for users and developers"
+---
+
+Voicebox includes automatic updates powered by Tauri's updater plugin. This document explains how it works for both users and developers.
+
+## 1. Generate Signing Keys
+
+Run this command to generate your signing keypair:
+
+```bash
+cd tauri && bun tauri signer generate -w ~/.tauri/voicebox.key
+```
+
+This creates:
+
+- **Private key**: `~/.tauri/voicebox.key` (keep this secret!)
+- **Public key**: `~/.tauri/voicebox.key.pub`
+
+## 2. Update Configuration
+
+Copy the content from `~/.tauri/voicebox.key.pub` and replace the placeholder in `tauri/src-tauri/tauri.conf.json`:
+
+```json
+{
+	"plugins": {
+		"updater": {
+			"pubkey": "PASTE_PUBLIC_KEY_CONTENT_HERE",
+			"endpoints": [
+				"https://github.com/YOUR_USERNAME/voicebox/releases/latest/download/latest.json"
+			]
+		}
+	}
+}
+```
+
+Update the endpoint URL with your actual GitHub username/organization.
+
+## 3. Building with Signatures
+
+When building releases, set these environment variables:
+
+**macOS/Linux:**
+
+```bash
+export TAURI_SIGNING_PRIVATE_KEY="$(cat ~/.tauri/voicebox.key)"
+export TAURI_SIGNING_PRIVATE_KEY_PASSWORD=""
+bun run build
+```
+
+**Windows PowerShell:**
+
+```powershell
+$env:TAURI_SIGNING_PRIVATE_KEY = Get-Content ~/.tauri/voicebox.key -Raw
+$env:TAURI_SIGNING_PRIVATE_KEY_PASSWORD = ""
+bun run build
+```
+
+## 4. GitHub Release Setup
+
+When you create a GitHub release, the build process will generate:
+
+- Installers for each platform
+- `.sig` signature files
+- `latest.json` update manifest
+
+### Manual Release Process
+
+1. Build the app with signing keys set
+2. Create a new GitHub release
+3. Upload all files from `tauri/src-tauri/target/release/bundle/`
+4. Create `latest.json` in your release assets:
+
+```json
+{
+	"version": "0.2.0",
+	"notes": "Bug fixes and improvements",
+	"pub_date": "2026-01-25T12:00:00Z",
+	"platforms": {
+		"darwin-aarch64": {
+			"signature": "CONTENT_FROM_.app.tar.gz.sig",
+			"url": "https://github.com/YOUR_USERNAME/voicebox/releases/download/v0.2.0/voicebox_0.2.0_aarch64.app.tar.gz"
+		},
+		"darwin-x86_64": {
+			"signature": "CONTENT_FROM_.app.tar.gz.sig",
+			"url": "https://github.com/YOUR_USERNAME/voicebox/releases/download/v0.2.0/voicebox_0.2.0_x64.app.tar.gz"
+		},
+		"linux-x86_64": {
+			"signature": "CONTENT_FROM_.AppImage.sig",
+			"url": "https://github.com/YOUR_USERNAME/voicebox/releases/download/v0.2.0/voicebox_0.2.0_amd64.AppImage"
+		},
+		"windows-x86_64": {
+			"signature": "CONTENT_FROM_.msi.sig",
+			"url": "https://github.com/YOUR_USERNAME/voicebox/releases/download/v0.2.0/voicebox_0.2.0_x64_en-US.msi"
+		}
+	}
+}
+```
+
+### Automated GitHub Actions (Recommended)
+
+Create `.github/workflows/release.yml`:
+
+```yaml
+name: Release
+
+on:
+  push:
+    tags:
+      - "v*"
+
+jobs:
+  release:
+    strategy:
+      matrix:
+        platform: [macos-latest, ubuntu-22.04, windows-latest]
+
+    runs-on: ${{ matrix.platform }}
+
+    steps:
+      - uses: actions/checkout@v4
+
+      - name: Setup Bun
+        uses: oven-sh/setup-bun@v1
+
+      - name: Install Rust
+        uses: dtolnay/rust-toolchain@stable
+
+      - name: Install dependencies (Ubuntu)
+        if: matrix.platform == 'ubuntu-22.04'
+        run: |
+          sudo apt-get update
+          sudo apt-get install -y libwebkit2gtk-4.1-dev libappindicator3-dev librsvg2-dev patchelf
+
+      - name: Install dependencies
+        run: bun install
+
+      - name: Build
+        env:
+          TAURI_SIGNING_PRIVATE_KEY: ${{ secrets.TAURI_SIGNING_PRIVATE_KEY }}
+          TAURI_SIGNING_PRIVATE_KEY_PASSWORD: ${{ secrets.TAURI_SIGNING_PRIVATE_KEY_PASSWORD }}
+        run: bun run build
+
+      - name: Upload Release
+        uses: softprops/action-gh-release@v1
+        with:
+          files: tauri/src-tauri/target/release/bundle/**/*
+        env:
+          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+```
+
+Add your private key to GitHub secrets:
+
+- Go to Settings → Secrets and variables → Actions
+- Add `TAURI_SIGNING_PRIVATE_KEY` with the content of `~/.tauri/voicebox.key`
+- Add `TAURI_SIGNING_PRIVATE_KEY_PASSWORD` (empty string if no password)
+
+## Frontend Integration
+
+The frontend integration is complete with automatic update notifications and manual update checks:
+
+- **Update Notification Banner** - Appears automatically when updates are available
+- **Settings Panel** - Manual "Check for Updates" button in Settings tab
+- **Update Hook** - React hook handles all update operations
+
+See `docs/AUTOUPDATER_QUICKSTART.md` for a quick setup guide.
+
+## Security Notes
+
+- Never commit your private key to version control
+- Store private keys securely (use GitHub secrets for CI/CD)
+- The public key in `tauri.conf.json` is safe to commit
+- Updates are cryptographically verified before installation
+- HTTP endpoints are blocked by default (HTTPS only)
+
+## Testing Updates
+
+1. Build version 0.1.0 and install it
+2. Update version in `tauri.conf.json` to 0.2.0
+3. Build version 0.2.0 with signatures
+4. Create a local server or GitHub release with `latest.json`
+5. Run version 0.1.0 and trigger update check
+6. Verify update downloads and installs correctly
+
+## Troubleshooting
+
+**"Invalid signature" error:**
+
+- Verify public key matches the private key used to sign
+- Ensure signature files (.sig) are uploaded correctly
+
+**"No update available" when one exists:**
+
+- Check endpoint URL is correct
+- Verify `latest.json` format matches specification
+- Ensure version in latest.json is higher than current version
+
+**Build fails with signing:**
+
+- Confirm environment variables are set correctly
+- Check private key file exists and is readable
+- Verify private key format (should start with `dW50cnVzdGVkIGNvbW1lbnQ6`)
diff --git a/docs2/content/docs/AUTOUPDATER_QUICKSTART.md b/docs2/content/docs/AUTOUPDATER_QUICKSTART.md
new file mode 100644
index 00000000..5614536d
--- /dev/null
+++ b/docs2/content/docs/AUTOUPDATER_QUICKSTART.md
@@ -0,0 +1,129 @@
+---
+title: "Autoupdater Quick Start"
+description: "Quick guide to activate the Tauri v2 autoupdater"
+---
+
+The Tauri v2 autoupdater has been fully configured and integrated. Follow these steps to activate it.
+
+## What's Already Done
+
+- ✅ Rust plugin installed and initialized
+- ✅ Tauri configuration set up with updater settings
+- ✅ Permissions granted for update operations
+- ✅ GitHub Actions workflow updated with signing support
+- ✅ Frontend components created and integrated
+- ✅ Update notifications on app startup
+- ✅ Manual update check in Settings tab
+
+## Required Steps (5 minutes)
+
+### 1. Generate Signing Keys
+
+```bash
+bun run generate:keys
+```
+
+This creates:
+
+- Private key: `~/.tauri/voicebox.key` (keep secret!)
+- Public key: `~/.tauri/voicebox.key.pub` (safe to share)
+
+### 2. Update Tauri Config
+
+Open `tauri/src-tauri/tauri.conf.json` and:
+
+1. Replace `"REPLACE_WITH_YOUR_PUBLIC_KEY"` with the content from `~/.tauri/voicebox.key.pub`
+2. Update the endpoint URL with your GitHub username:
+   ```json
+   "endpoints": [
+     "https://github.com/YOUR_USERNAME/voicebox/releases/latest/download/latest.json"
+   ]
+   ```
+
+### 3. Add GitHub Secrets
+
+Go to your repo Settings → Secrets and variables → Actions:
+
+1. Add `TAURI_SIGNING_PRIVATE_KEY`:
+
+   ```bash
+   cat ~/.tauri/voicebox.key
+   ```
+
+   Copy the entire output and paste as the secret value
+
+2. Add `TAURI_SIGNING_PRIVATE_KEY_PASSWORD`:
+   Leave empty (or add your password if you set one)
+
+### 4. Test the Setup
+
+To test locally before creating a release:
+
+```bash
+bun run build:release
+```
+
+This will verify your keys are set up correctly.
+
+## How It Works
+
+### For Users
+
+1. App checks for updates on startup (only in Tauri builds)
+2. If an update is available, a banner appears at the top
+3. Users can click "Install Now" to download and install
+4. App restarts automatically after installation
+
+### For Developers
+
+1. Create a new git tag: `git tag v0.2.0 && git push --tags`
+2. GitHub Actions builds signed releases for all platforms
+3. Uploads installers and generates `latest.json` manifest
+4. Users running older versions will be notified automatically
+
+## UI Components
+
+### Update Notification Banner
+
+- Shows at top of app when update is available
+- Appears automatically on startup
+- Displays download/install progress
+
+### Settings Panel
+
+- Located in Settings tab
+- Shows current version
+- Manual "Check for Updates" button
+- Update status and progress
+
+## Troubleshooting
+
+**"Public key not configured"**
+
+- Make sure you copied the entire content from `voicebox.key.pub`
+- The key should start with `dW50cnVzdGVkIGNvbW1lbnQ6`
+
+**"Failed to check for updates"**
+
+- Endpoint URL might be incorrect
+- No releases published yet (expected for first setup)
+
+**Build fails with signing error**
+
+- Check that GitHub secrets are set correctly
+- Verify private key file exists at `~/.tauri/voicebox.key`
+
+## Next Release Workflow
+
+1. Update version in `tauri/src-tauri/tauri.conf.json`
+2. Commit changes
+3. Create and push tag: `git tag v0.2.0 && git push --tags`
+4. GitHub Actions will automatically build and create a draft release
+5. Review the release and publish it
+6. Users will be notified of the update
+
+## See Also
+
+- Full documentation: `docs/AUTOUPDATER.md`
+- Build script: `scripts/prepare-release.sh`
+- GitHub workflow: `.github/workflows/release.yml`
diff --git a/docs2/content/docs/README.md b/docs2/content/docs/README.md
new file mode 100644
index 00000000..66f7833d
--- /dev/null
+++ b/docs2/content/docs/README.md
@@ -0,0 +1,67 @@
+---
+title: "Documentation README"
+description: "Voicebox documentation development guide"
+---
+
+This directory contains the documentation for Voicebox, built with [Fumadocs](https://fumadocs.dev).
+
+## Development
+
+### Prerequisites
+
+Install Mintlify globally using bun:
+
+```bash
+bun add -g mintlify
+```
+
+Or use the helper script:
+
+```bash
+bun run install:mintlify
+```
+
+### Running Locally
+
+```bash
+bun run dev
+```
+
+This will start the Mintlify dev server.
+
+The docs will be available at `http://localhost:3000`
+
+### Structure
+
+```
+docs/
+├── mint.json           # Mintlify configuration
+├── custom.css          # Custom styles
+├── overview/           # Getting started & feature docs
+├── guides/             # User guides
+├── api/                # API reference
+├── development/        # Developer documentation
+├── logo/               # Logo assets
+└── public/             # Static assets
+```
+
+### Writing Docs
+
+- Use `.mdx` files for all documentation pages
+- Follow the existing structure in `mint.json` for navigation
+- Use Mintlify components for enhanced formatting (Card, CardGroup, Accordion, etc.)
+- Reference the [Mintlify documentation](https://mintlify.com/docs) for available components
+
+## Deployment
+
+Docs are automatically deployed when changes are pushed to the main branch.
+
+To manually deploy:
+
+```bash
+mintlify deploy
+```
+
+## Contributing
+
+See [CONTRIBUTING.md](../CONTRIBUTING.md) for contribution guidelines.
diff --git a/docs2/content/docs/TROUBLESHOOTING.md b/docs2/content/docs/TROUBLESHOOTING.md
new file mode 100644
index 00000000..18a6c255
--- /dev/null
+++ b/docs2/content/docs/TROUBLESHOOTING.md
@@ -0,0 +1,360 @@
+---
+title: "Troubleshooting Guide"
+description: "Common issues and solutions for Voicebox"
+---
+
+Common issues and solutions for Voicebox.
+
+## Installation Issues
+
+### macOS: "Voicebox cannot be opened because it is from an unidentified developer"
+
+**Solution:**
+
+1. Right-click (or Control-click) the Voicebox app in Finder
+2. Select "Open"
+3. Click "Open" in the security dialog
+4. Alternatively, go to System Settings → Privacy & Security → Allow Voicebox
+
+### Windows: "Windows protected your PC"
+
+**Solution:**
+
+1. Click "More info"
+2. Click "Run anyway"
+3. Windows Defender may flag new software; this is normal for unsigned apps
+
+### Linux: AppImage won't run
+
+**Solution:**
+
+```bash
+chmod +x voicebox-*.AppImage
+./voicebox-*.AppImage
+```
+
+## Runtime Issues
+
+### Server won't start
+
+**Symptoms:** App opens but shows "Server not connected"
+
+**Solutions:**
+
+1. **Check Python installation**
+
+   ```bash
+   python --version  # Should be 3.11+
+   ```
+
+2. **Check server binary exists**
+
+   - Look in `tauri/src-tauri/binaries/` for your platform
+   - Binary should match your system architecture
+
+3. **Check permissions**
+
+   ```bash
+   # macOS/Linux
+   chmod +x tauri/src-tauri/binaries/voicebox-server-*
+   ```
+
+4. **Check logs**
+   - macOS: Open Console.app and search for "voicebox"
+   - Linux: Check `~/.local/share/voicebox/` for logs
+   - Windows: Check Event Viewer
+
+### "Model download failed"
+
+**Symptoms:** First generation fails with download error
+
+**Solutions:**
+
+1. **Check internet connection**
+
+   - Models download from HuggingFace Hub (~2-4GB)
+   - First download may take several minutes
+
+2. **Check disk space**
+
+   - Models are cached in `~/.cache/huggingface/`
+   - Ensure at least 5GB free space
+
+3. **Manual download** (if automatic fails)
+   ```bash
+   pip install huggingface_hub
+   huggingface-cli download Qwen/Qwen3-TTS-12Hz-1.7B-Base
+   ```
+
+### "Out of memory" errors
+
+**Symptoms:** Generation fails with CUDA/VRAM errors
+
+**Solutions:**
+
+1. **Use smaller model**
+
+   - Switch to 0.6B model instead of 1.7B
+   - Settings → Model Management → Load 0.6B
+
+2. **Close other applications**
+
+   - Free up GPU memory
+   - Close browser tabs, other ML apps
+
+3. **Use CPU mode**
+   - Slower but works without GPU
+   - Backend automatically falls back to CPU
+
+### MLX "Failed to load the default metallib" error (Apple Silicon)
+
+**Symptoms:** Generation fails with "library not found" or "metallib" errors
+
+**Solutions:**
+
+1. **Rebuild server binary**
+
+   ```bash
+   bun run build:server
+   ```
+
+   The build script should automatically include MLX Metal shader libraries.
+
+2. **Check MLX installation**
+
+   ```bash
+   pip install -r backend/requirements-mlx.txt
+   ```
+
+3. **Verify backend detection**
+   - Check server logs for "Backend: MLX"
+   - If showing "Backend: PYTORCH", MLX may not be installed correctly
+
+### Audio playback issues
+
+**Symptoms:** Generated audio won't play
+
+**Solutions:**
+
+1. **Check audio format**
+
+   - Audio is saved as WAV files
+   - Ensure your system supports WAV playback
+
+2. **Try downloading audio**
+
+   - Right-click → Download
+   - Play in external player
+
+3. **Check browser permissions** (web version)
+   - Allow audio autoplay in browser settings
+
+### Slow generation
+
+**Symptoms:** Generation takes >30 seconds
+
+**Solutions:**
+
+1. **Check backend type** (Apple Silicon)
+
+   - Check Settings → Server Status
+   - Should show "Backend: MLX" on Apple Silicon
+   - If showing "Backend: PYTORCH", install MLX: `pip install -r backend/requirements-mlx.txt`
+   - MLX provides 4-5x faster inference on Apple Silicon
+
+2. **Use GPU** (if available)
+
+   - Check Settings → Server Status
+   - Should show "GPU available: true"
+   - Apple Silicon: Should show "Metal (Apple Silicon via MLX)"
+   - Windows/Linux: Should show "CUDA" if GPU available
+
+3. **Enable caching**
+
+   - Voice prompts are cached automatically
+   - Second generation with same voice should be faster
+
+4. **Use smaller model**
+
+   - 0.6B model is faster than 1.7B
+   - Quality difference is minimal for most voices
+
+5. **Check system resources**
+   - Close other CPU/GPU intensive apps
+   - Ensure adequate RAM (8GB+ recommended)
+
+## API Issues
+
+### "Connection refused" when using API
+
+**Solutions:**
+
+1. **Check server is running**
+
+   ```bash
+   curl http://localhost:8000/health
+   ```
+
+2. **Check remote mode**
+
+   - If connecting remotely, ensure server is started with `--host 0.0.0.0`
+   - Check firewall settings
+
+3. **Check port availability**
+   - Default port is 8000
+   - Ensure no other service is using it
+
+### CORS errors in browser
+
+**Solutions:**
+
+1. **Use desktop app** (recommended)
+
+   - Desktop app doesn't have CORS restrictions
+
+2. **Configure CORS** (for web deployment)
+   - Update `backend/main.py` CORS settings
+   - Add your domain to allowed origins
+
+## Update Issues
+
+### "Update check failed"
+
+**Solutions:**
+
+1. **Check internet connection**
+
+   - Updates are fetched from GitHub releases
+
+2. **Check GitHub access**
+
+   - Ensure `github.com` is accessible
+   - Check firewall/proxy settings
+
+3. **Manual update**
+   - Download latest release from GitHub
+   - Install manually
+
+### "Invalid signature" error
+
+**Solutions:**
+
+1. **Re-download installer**
+
+   - Signature may be corrupted
+   - Download fresh copy from GitHub
+
+2. **Check release integrity**
+   - Verify `.sig` file matches installer
+   - Report issue if signature is invalid
+
+## Data Issues
+
+### Profiles disappeared
+
+**Solutions:**
+
+1. **Check data directory**
+
+   - macOS: `~/Library/Application Support/voicebox/`
+   - Windows: `%APPDATA%/voicebox/`
+   - Linux: `~/.local/share/voicebox/`
+
+2. **Check database**
+
+   - Database: `data/voicebox.db`
+   - Ensure file exists and is readable
+
+3. **Restore from backup**
+   - Profiles can be exported/imported
+   - Check for backup files
+
+### "Database locked" error
+
+**Solutions:**
+
+1. **Close other instances**
+
+   - Ensure only one Voicebox instance is running
+
+2. **Restart app**
+
+   - Close and reopen Voicebox
+
+3. **Check file permissions**
+   - Ensure database file is writable
+   - Check directory permissions
+
+## Development Issues
+
+### Build fails
+
+**Solutions:**
+
+1. **Check Rust installation**
+
+   ```bash
+   rustc --version
+   rustup update
+   ```
+
+2. **Check Tauri dependencies**
+
+   ```bash
+   cd tauri
+   bun install
+   ```
+
+3. **Clean build**
+   ```bash
+   cd tauri/src-tauri
+   cargo clean
+   cd ../..
+   bun run build
+   ```
+
+### API client generation fails
+
+**Solutions:**
+
+1. **Start backend server**
+
+   ```bash
+   bun run dev:server
+   ```
+
+2. **Check OpenAPI endpoint**
+
+   ```bash
+   curl http://localhost:8000/openapi.json
+   ```
+
+3. **Regenerate client**
+   ```bash
+   bun run generate:api
+   ```
+
+## Still Having Issues?
+
+1. **Check existing issues**
+
+   - Search GitHub issues for similar problems
+   - Check closed issues for solutions
+
+2. **Create new issue**
+
+   - Include:
+     - OS and version
+     - Voicebox version
+     - Steps to reproduce
+     - Error messages/logs
+     - Screenshots (if applicable)
+
+3. **Get help**
+   - Check documentation in `docs/`
+   - Review `backend/README.md` for API details
+   - See `CONTRIBUTING.md` for development help
+
+---
+
+For more help, open an issue on [GitHub](https://github.com/jamiepine/voicebox/issues).
diff --git a/docs2/content/docs/api/meta.json b/docs2/content/docs/api/meta.json
new file mode 100644
index 00000000..d23c38eb
--- /dev/null
+++ b/docs2/content/docs/api/meta.json
@@ -0,0 +1,4 @@
+{
+  "title": "API Reference",
+  "pages": ["overview", "authentication", "voice-profiles", "generation", "recordings"]
+}
diff --git a/docs2/content/docs/developer/contributing.mdx b/docs2/content/docs/developer/contributing.mdx
new file mode 100644
index 00000000..8ae5914f
--- /dev/null
+++ b/docs2/content/docs/developer/contributing.mdx
@@ -0,0 +1,336 @@
+---
+title: "Contributing"
+description: "How to contribute to Voicebox"
+---
+
+Thank you for your interest in contributing to Voicebox! This guide will help you get started.
+
+## Code of Conduct
+
+- Be respectful and inclusive
+- Welcome newcomers and help them learn
+- Focus on constructive feedback
+- Respect different viewpoints and experiences
+
+## Getting Started
+
+Before you start contributing, make sure you have:
+
+1. **Read the documentation** to understand how Voicebox works
+2. **Set up your development environment** - see [Development Setup](/docs/developer/setup)
+3. **Explored the codebase** to understand the project structure
+4. **Checked existing issues** to see if someone else is working on something similar
+
+## Ways to Contribute
+
+<CardGroup cols={2}>
+	<Card title="Report Bugs" icon="bug">
+		Found a bug? Open an issue with reproduction steps
+	</Card>
+	<Card title="Request Features" icon="lightbulb">
+		Have an idea? Start a discussion or open an issue
+	</Card>
+	<Card title="Improve Docs" icon="book">
+		Fix typos, add examples, or clarify instructions
+	</Card>
+	<Card title="Write Code" icon="code">
+		Fix bugs, add features, or optimize performance
+	</Card>
+</CardGroup>
+
+## Development Workflow
+
+### 1. Fork & Clone
+
+```bash
+# Fork the repository on GitHub
+# Then clone your fork
+git clone https://github.com/YOUR_USERNAME/voicebox.git
+cd voicebox
+```
+
+### 2. Create a Branch
+
+Use descriptive branch names:
+
+```bash
+# For features
+git checkout -b feature/voice-effects
+
+# For bug fixes
+git checkout -b fix/audio-playback-issue
+
+# For documentation
+git checkout -b docs/api-examples
+```
+
+### 3. Make Your Changes
+
+Follow these guidelines:
+
+<AccordionGroup>
+  <Accordion title="Code Style">
+    **TypeScript/React:**
+    - Use TypeScript strict mode
+    - Prefer functional components with hooks
+    - Use named exports
+    - Format with Biome (runs automatically)
+
+    **Python:**
+    - Follow PEP 8
+    - Use type hints
+    - Use async/await for I/O
+    - Document functions with docstrings
+
+    **Rust:**
+    - Follow Rust conventions
+    - Use meaningful names
+    - Handle errors explicitly
+    - Run `rustfmt`
+
+  </Accordion>
+
+  <Accordion title="Commit Messages">
+    Write clear, descriptive commit messages:
+
+    ```bash
+    # Good
+    git commit -m "Add voice profile export feature"
+    git commit -m "Fix audio playback stopping after 30 seconds"
+
+    # Avoid
+    git commit -m "Update code"
+    git commit -m "Fix bug"
+    ```
+
+    Format:
+    - Use imperative mood ("Add feature" not "Added feature")
+    - Keep first line under 50 characters
+    - Add detailed description if needed
+
+  </Accordion>
+
+  <Accordion title="Testing">
+    - Test your changes manually in the app
+    - Ensure backend API endpoints work
+    - Check for TypeScript/Python errors
+    - Verify UI components render correctly
+    - Add automated tests when possible
+  </Accordion>
+</AccordionGroup>
+
+### 4. Push & Create PR
+
+```bash
+# Push your branch
+git push origin feature/your-feature-name
+
+# Then create a pull request on GitHub
+```
+
+## Pull Request Guidelines
+
+When creating a pull request:
+
+<Steps>
+  <Step title="Use a Clear Title">
+    Examples:
+    - "Add voice profile export functionality"
+    - "Fix audio playback stopping after 30 seconds"
+    - "Improve generation speed with caching"
+  </Step>
+
+  <Step title="Provide Description">
+    Include:
+    - What changes you made
+    - Why you made them
+    - How to test them
+    - Screenshots (for UI changes)
+    - References to related issues
+  </Step>
+
+  <Step title="Update Documentation">
+    - Update relevant docs if behavior changes
+    - Add API documentation for new endpoints
+    - Update README if needed
+  </Step>
+
+  <Step title="Check the Checklist">
+    - [ ] Code follows style guidelines
+    - [ ] Documentation updated
+    - [ ] Changes tested
+    - [ ] No breaking changes (or documented)
+    - [ ] CHANGELOG.md updated
+  </Step>
+</Steps>
+
+## Project Structure
+
+Understanding the codebase:
+
+```
+voicebox/
+├── app/              # Shared React frontend
+│   ├── src/
+│   │   ├── components/   # UI components
+│   │   ├── lib/          # Utilities and API client
+│   │   ├── hooks/        # React hooks
+│   │   └── stores/       # Zustand state stores
+├── backend/          # Python FastAPI server
+│   ├── main.py       # API routes
+│   ├── tts.py        # Voice synthesis logic
+│   ├── database.py   # SQLite operations
+│   └── models.py     # Pydantic models
+├── tauri/            # Desktop app wrapper
+│   └── src-tauri/    # Rust backend
+├── web/              # Web deployment
+├── landing/          # Marketing website
+└── scripts/          # Build & release scripts
+```
+
+## Areas for Contribution
+
+### Bug Fixes
+
+- Check [existing issues](https://github.com/jamiepine/voicebox/issues) for bugs
+- Test your fix thoroughly
+- Add regression tests if possible
+
+### New Features
+
+- Check the [roadmap](https://github.com/jamiepine/voicebox#roadmap) for planned features
+- Discuss major features in an issue first
+- Keep features focused and well-scoped
+
+### Documentation
+
+- Improve clarity and fix typos
+- Add code examples
+- Create tutorials or guides
+- Document API endpoints
+
+### UI/UX Improvements
+
+- Improve accessibility
+- Enhance visual design
+- Optimize performance
+- Add animations/transitions
+
+### Infrastructure
+
+- Improve build process
+- Add CI/CD improvements
+- Optimize bundle size
+- Add testing infrastructure
+
+## API Development
+
+When adding new API endpoints:
+
+<Steps>
+  <Step title="Add Route">
+    In `backend/main.py`:
+
+    ```python
+    @app.post("/api/new-endpoint")
+    async def new_endpoint(data: RequestModel) -> ResponseModel:
+        """Endpoint description."""
+        # Implementation
+        return response
+    ```
+
+  </Step>
+
+  <Step title="Create Models">
+    In `backend/models.py`:
+
+    ```python
+    class RequestModel(BaseModel):
+        field: str
+
+    class ResponseModel(BaseModel):
+        result: str
+    ```
+
+  </Step>
+
+  <Step title="Regenerate Client">
+    ```bash
+    bun run generate:api
+    ```
+
+    This updates the TypeScript client with type-safe bindings.
+
+  </Step>
+
+  <Step title="Update Docs">
+    The API documentation is automatically generated from the OpenAPI schema. Ensure your endpoint has proper docstrings and type hints, then regenerate the docs:
+    
+    ```bash
+    bun run generate:api
+    ```
+  </Step>
+</Steps>
+
+## Testing
+
+Testing is currently primarily manual. If you add automated tests, run them with the commands below.
+
+**Backend:**
+
+```bash
+cd backend
+pytest
+```
+
+**Frontend:**
+
+```bash
+bun run test
+```
+
+**E2E (future):**
+
+```bash
+bun run test:e2e
+```
+
+## Release Process
+
+Releases are managed by maintainers using `bumpversion`:
+
+```bash
+# Bump version (patch, minor, or major)
+bumpversion patch
+
+# Push with tags
+git push && git push --tags
+```
+
+GitHub Actions automatically builds and publishes releases when tags are pushed.
+
+## Community
+
+- **GitHub Issues:** Bug reports and feature requests
+- **GitHub Discussions:** General questions and ideas
+- **Discord:** Real-time chat (coming soon)
+
+## Recognition
+
+Contributors are recognized in:
+
+- [CHANGELOG.md](https://github.com/jamiepine/voicebox/blob/main/CHANGELOG.md)
+- GitHub contributor list
+- Release notes
+
+## License
+
+By contributing, you agree that your contributions will be licensed under the MIT License.
+
+## Questions?
+
+If you have questions:
+
+1. Check the [documentation](/overview/introduction)
+2. Search [existing issues](https://github.com/jamiepine/voicebox/issues)
+3. Open a new issue or discussion
+4. See [CONTRIBUTING.md](https://github.com/jamiepine/voicebox/blob/main/CONTRIBUTING.md) in the repo
+
+Thank you for contributing to Voicebox! 🎉
diff --git a/docs2/content/docs/developer/meta.json b/docs2/content/docs/developer/meta.json
new file mode 100644
index 00000000..5c97f225
--- /dev/null
+++ b/docs2/content/docs/developer/meta.json
@@ -0,0 +1,17 @@
+{
+  "title": "Developer",
+  "pages": [
+    "setup",
+    "architecture",
+    "contributing",
+    "building",
+    "autoupdater",
+    "voice-profiles",
+    "tts-generation",
+    "history",
+    "stories",
+    "transcription",
+    "audio-channels",
+    "model-management"
+  ]
+}
diff --git a/docs2/content/docs/developer/setup.mdx b/docs2/content/docs/developer/setup.mdx
new file mode 100644
index 00000000..be5b5eff
--- /dev/null
+++ b/docs2/content/docs/developer/setup.mdx
@@ -0,0 +1,245 @@
+---
+title: "Development Setup"
+description: "Set up your local development environment for Voicebox"
+---
+
+## Prerequisites
+
+Before you begin, ensure you have the following installed:
+
+<CardGroup cols={3}>
+  <Card title="Bun" icon="package">
+    [Download Bun](https://bun.sh)
+
+    ```bash
+    curl -fsSL https://bun.sh/install | bash
+    ```
+
+  </Card>
+  <Card title="Python 3.11+" icon="python">
+    [Download Python](https://python.org)
+
+    ```bash
+    python --version
+    ```
+
+  </Card>
+  <Card title="Rust" icon="rust">
+    [Install Rust](https://rustup.rs)
+
+    ```bash
+    rustc --version
+    ```
+
+  </Card>
+</CardGroup>
+
+## Clone the Repository
+
+```bash
+git clone https://github.com/jamiepine/voicebox.git
+cd voicebox
+```
+
+## Quick Setup (Recommended)
+
+The easiest way to get started is using the Makefile:
+
+```bash
+# Setup everything
+make setup
+
+# Start development
+make dev
+```
+
+<Note>
+	The Makefile is available on macOS and Linux. Windows users should follow the
+	manual setup below.
+</Note>
+
+## Manual Setup
+
+### 1. Install JavaScript Dependencies
+
+```bash
+bun install
+```
+
+This installs dependencies for:
+
+- `app/` - Shared React frontend
+- `tauri/` - Tauri desktop wrapper
+- `web/` - Web deployment wrapper
+
+### 2. Set Up Python Backend
+
+```bash
+cd backend
+
+# Create virtual environment
+python -m venv venv
+
+# Activate virtual environment
+source venv/bin/activate  # macOS/Linux
+# or
+venv\Scripts\activate  # Windows
+
+# Install Python dependencies
+pip install -r requirements.txt
+
+# Install MLX dependencies (Apple Silicon only - for faster inference)
+# On Apple Silicon, this enables native Metal acceleration
+if [[ $(uname -m) == "arm64" ]]; then
+  pip install -r requirements-mlx.txt
+fi
+
+# Install Qwen3-TTS
+pip install git+https://github.com/QwenLM/Qwen3-TTS.git
+```
+
+## Running in Development
+
+Development requires **two terminals**: one for the Python backend, one for the Tauri app.
+
+<Tabs>
+  <Tab title="Terminal 1: Backend">
+    Start the Python server first:
+
+    ```bash
+    cd backend
+    source venv/bin/activate  # Activate venv
+    bun run dev:server
+    ```
+
+    Or manually:
+    ```bash
+    uvicorn main:app --reload --port 17493
+    ```
+
+    Backend will be available at `http://localhost:17493`
+
+  </Tab>
+
+  <Tab title="Terminal 2: Desktop App">
+    Then start the Tauri app:
+
+    ```bash
+    bun run dev
+    ```
+
+    This will:
+    - Create a placeholder sidecar binary
+    - Start Vite dev server on port 5173
+    - Launch Tauri window
+    - Enable hot reload
+
+  </Tab>
+</Tabs>
+
+<Info>
+	In dev mode, the app connects to your manually-started Python server. The
+	bundled server binary is only used in production builds.
+</Info>
+
+### Optional: Web App
+
+```bash
+bun run dev:web
+```
+
+Web app will be available at `http://localhost:5174`
+
+## Model Downloads
+
+Models are automatically downloaded from HuggingFace Hub on first use:
+
+- **Whisper** (transcription): Auto-downloads on first transcription
+- **Qwen3-TTS** (voice cloning): Auto-downloads on first generation (~2-4GB)
+
+<Warning>
+	First-time usage will be slower due to model downloads, but subsequent runs
+	will use cached models.
+</Warning>
+
+## Project Structure
+
+```
+voicebox/
+├── app/              # Shared React frontend
+│   └── src/
+│       ├── components/   # UI components
+│       ├── lib/          # Utilities and API client
+│       └── hooks/        # React hooks
+├── backend/          # Python FastAPI server
+│   ├── main.py       # API routes
+│   ├── tts.py        # Voice synthesis
+│   └── database.py   # SQLite operations
+├── tauri/            # Desktop app wrapper
+│   └── src-tauri/    # Rust backend
+├── web/              # Web deployment
+├── landing/          # Marketing website
+└── scripts/          # Build & release scripts
+```
+
+## Available Make Commands
+
+Run `make help` to see all available commands:
+
+```bash
+make setup          # Install all dependencies
+make dev            # Start development servers
+make dev-web        # Start web development server
+make build          # Build desktop app
+make build-web      # Build web app
+make clean          # Clean build artifacts
+make test           # Run tests
+```
+
+## Generate OpenAPI Client
+
+After starting the backend server, generate the TypeScript API client:
+
+```bash
+./scripts/generate-api.sh
+# or
+bun run generate:api
+```
+
+This downloads the OpenAPI schema and generates the TypeScript client in `app/src/lib/api/`
+
+## Next Steps
+
+<CardGroup cols={2}>
+	<Card
+		title="Architecture"
+		icon="diagram-project"
+		href="/docs/developer/architecture"
+	>
+		Understand the system architecture
+	</Card>
+	<Card
+		title="Contributing"
+		icon="code-pull-request"
+		href="/docs/developer/contributing"
+	>
+		Read the contribution guidelines
+	</Card>
+	<Card title="Building" icon="hammer" href="/docs/developer/building">
+		Learn how to build production releases
+	</Card>
+	<Card title="API Reference" icon="code" href="/api-reference">
+		Explore the REST API
+	</Card>
+</CardGroup>
+
+## Troubleshooting
+
+<AccordionGroup>
+  <Accordion title="Backend won't start">
+    - Check Python version (must be 3.11+)
+    - Ensure virtual environment is activated
+    - Verify all dependencies are installed: `pip install -r requirements.txt`
+    - Check if port 17493 is available
+  </Accordion>
+
+  <Accordion title="Tauri build fails">
+    - Ensure Rust is installed: `rustc --version`
+    - Clean the build: `cd tauri/src-tauri && cargo clean`
+    - Try rebuilding: `bun run dev`
+  </Accordion>
+
+  <Accordion title="OpenAPI client generation fails">
+    - Ensure backend is running: `curl http://localhost:17493/openapi.json`
+    - Check network connectivity
+    - Verify the backend is accessible at localhost:17493
+  </Accordion>
+</AccordionGroup>
+
+See the full [Troubleshooting Guide](/docs/overview/troubleshooting) for more issues and solutions.
diff --git a/docs2/content/docs/index.mdx b/docs2/content/docs/index.mdx
new file mode 100644
index 00000000..1c2b401e
--- /dev/null
+++ b/docs2/content/docs/index.mdx
@@ -0,0 +1,50 @@
+---
+title: "Voicebox Documentation"
+description: "Welcome to Voicebox - the open-source voice synthesis studio"
+---
+
+## What is Voicebox?
+
+Voicebox is a **local-first voice cloning studio** with DAW-like features for professional voice synthesis. Think of it as the **Ollama for voice** — download models, clone voices, and generate speech entirely on your machine.
+
+<Frame>
+	<img src="/images/app-screenshot-1.webp" alt="Voicebox App Screenshot" />
+</Frame>
+
+Unlike cloud services that lock your voice data behind subscriptions, Voicebox gives you:
+
+- **Complete privacy** — models and voice data stay on your machine
+- **Professional tools** — multi-track timeline editor, audio trimming, conversation mixing
+- **Model flexibility** — currently powered by Qwen3-TTS, with support for XTTS, Bark, and other models coming soon
+- **API-first** — use the desktop app or integrate voice synthesis into your own projects
+- **Native performance** — built with Tauri (Rust), not Electron
+
+Download a voice model, clone any voice from a few seconds of audio, and compose multi-voice projects with studio-grade editing tools. No Python install required, no cloud dependency, no limits.
+
+## Key Features
+
+<CardGroup cols={2}>
+	<Card title="Voice Cloning" icon="microphone">
+		Instant cloning from just a few seconds of audio with Qwen3-TTS
+	</Card>
+	<Card title="Stories Editor" icon="film">
+		Multi-track timeline for creating conversations and narratives
+	</Card>
+	<Card title="Full API" icon="code">
+		REST API for integrating voice synthesis into your apps
+	</Card>
+	<Card title="Local-First" icon="shield">
+		Everything runs on your machine - complete privacy
+	</Card>
+</CardGroup>
+
+## Get Started
+
+<CardGroup cols={2}>
+	<Card title="Installation" icon="download" href="/docs/overview/installation">
+		Download and install Voicebox on your machine
+	</Card>
+	<Card title="Quick Start" icon="rocket" href="/docs/overview/quick-start">
+		Get up and running in 5 minutes
+	</Card>
+</CardGroup>
diff --git a/docs2/content/docs/meta.json b/docs2/content/docs/meta.json
new file mode 100644
index 00000000..42d96896
--- /dev/null
+++ b/docs2/content/docs/meta.json
@@ -0,0 +1,4 @@
+{
+  "title": "Voicebox Documentation",
+  "pages": ["overview", "api-reference", "developer", "plans"]
+}
diff --git a/docs2/content/docs/overview/creating-voice-profiles.mdx b/docs2/content/docs/overview/creating-voice-profiles.mdx
new file mode 100644
index 00000000..2894ea5d
--- /dev/null
+++ b/docs2/content/docs/overview/creating-voice-profiles.mdx
@@ -0,0 +1,297 @@
+---
+title: "Creating Voice Profiles"
+description: "Advanced guide to creating high-quality voice profiles"
+---
+
+## Overview
+
+Voice profiles are the foundation of voice cloning in Voicebox. This guide covers best practices for creating professional-quality voice profiles.
+
+## Quick Start
+
+<Steps>
+	<Step title="Prepare Audio">10-30 seconds of clear speech</Step>
+	<Step title="Create Profile">**Profiles** → **+ New Profile**</Step>
+	<Step title="Upload Sample">Add your audio file</Step>
+	<Step title="Generate">Use the profile to generate speech</Step>
+</Steps>
+
+## Audio Requirements
+
+### Ideal Sample Characteristics
+
+<CardGroup cols={2}>
+  <Card title="Duration" icon="clock">
+    **10-30 seconds**
+
+    Too short: Poor quality
+    Too long: Unnecessary
+
+  </Card>
+  <Card title="Clarity" icon="volume">
+    **Clear speech**
+
+    No background noise
+    No music or overlapping voices
+
+  </Card>
+  <Card title="Quality" icon="sparkles">
+    **High fidelity**
+
+    44.1kHz or 48kHz sample rate
+    Minimal compression
+
+  </Card>
+  <Card title="Content" icon="microphone">
+    **Natural speech**
+
+    Conversational tone
+    Complete sentences
+
+  </Card>
+</CardGroup>
+
+### File Formats
+
+Supported formats:
+
+- **WAV** (recommended) - Lossless quality
+- **MP3** - Acceptable if lightly compressed (high bitrate)
+- **M4A** - Acceptable
+- **FLAC** - Lossless alternative
+
+<Tip>Use WAV for best results. Avoid heavily compressed formats.</Tip>
+
+## Recording Tips
+
+### Environment
+
+<AccordionGroup>
+  <Accordion title="Quiet Space">
+    - Record in a quiet room
+    - Turn off fans, AC, appliances
+    - Close windows to reduce outside noise
+    - Use soft furnishings to reduce echo
+  </Accordion>
+
+  <Accordion title="Microphone Placement">
+    - 6-12 inches from mouth
+    - Slight angle to reduce plosives (p, b, t)
+    - Use a pop filter if available
+    - Maintain consistent distance
+  </Accordion>
+
+  <Accordion title="Recording Settings">
+    - 44.1kHz or 48kHz sample rate
+    - 16-bit or 24-bit depth
+    - Mono is fine (stereo will be converted)
+    - Avoid automatic gain control
+  </Accordion>
+</AccordionGroup>
+
+### Speaking
+
+- **Natural pace** - Don't rush or speak too slowly
+- **Clear articulation** - Pronounce words clearly
+- **Consistent volume** - Maintain steady loudness
+- **Normal tone** - Speak as you normally would
+- **Complete sentences** - Avoid fragments or "ums"
+
+## Multiple Samples
+
+Adding multiple samples can significantly improve quality:
+
+### Why Multiple Samples?
+
+<CardGroup cols={2}>
+	<Card title="Robustness" icon="shield">
+		Model learns a more complete representation
+	</Card>
+	<Card title="Versatility" icon="palette">
+		Handles different speaking styles better
+	</Card>
+	<Card title="Quality" icon="star">
+		Reduces artifacts and improves naturalness
+	</Card>
+	<Card title="Consistency" icon="check">
+		More reliable across different texts
+	</Card>
+</CardGroup>
+
+### Sample Variety
+
+Consider adding samples with:
+
+1. **Different tones**
+
+   - Casual conversation
+   - Professional/formal
+   - Excited/enthusiastic
+   - Calm/serious
+
+2. **Different content**
+
+   - Narratives
+   - Questions
+   - Statements
+   - Emotions (happy, sad, neutral)
+
+3. **Different recording conditions**
+   - Studio quality
+   - Phone call quality (if needed)
+   - Room acoustics
+
+<Warning>
+	All samples should be from the **same speaker**. Mixing voices will produce
+	poor results.
+</Warning>
+
+## Processing Existing Audio
+
+If you have existing audio (podcasts, videos, etc.):
+
+### Extracting Clean Segments
+
+<Steps>
+  <Step title="Find Clean Speech">
+    Look for segments with:
+    - Just the target speaker
+    - No background music
+    - Minimal noise
+  </Step>
+
+  <Step title="Use Audio Editor">
+    Use a tool like Audacity or Adobe Audition to:
+    - Cut out clean 10-30s segments
+    - Remove silence at start/end
+    - Normalize volume if needed
+  </Step>
+
+  <Step title="Export as WAV">
+    Save as high-quality WAV file
+  </Step>
+</Steps>
+
+### Noise Reduction
+
+If you have light background noise:
+
+```
+1. Use noise reduction in Audacity:
+   - Select noise-only section
+   - Get Noise Profile
+   - Select full audio
+   - Apply noise reduction (gentle settings)
+
+2. Avoid over-processing:
+   - Can introduce artifacts
+   - May reduce voice quality
+```
+
+## Testing & Iteration
+
+### Test Your Profile
+
+After creating a profile:
+
+<Steps>
+  <Step title="Generate Test">
+    Generate a simple phrase:
+    ```
+    "Hello, this is a test of my voice profile."
+    ```
+  </Step>
+
+  <Step title="Evaluate Quality">
+    Listen for:
+    - Natural tone
+    - Clear pronunciation
+    - Proper prosody
+    - Lack of artifacts
+  </Step>
+
+  <Step title="Iterate">
+    If quality is poor:
+    - Add more samples
+    - Try different source audio
+    - Check sample quality
+  </Step>
+</Steps>
+
+### Common Issues
+
+<AccordionGroup>
+  <Accordion title="Robotic Voice">
+    **Cause**: Poor quality samples or too short
+
+    **Fix**: Use longer, higher quality samples
+
+  </Accordion>
+
+  <Accordion title="Wrong Tone">
+    **Cause**: Sample tone doesn't match desired output
+
+    **Fix**: Record samples in the style you want to generate
+
+  </Accordion>
+
+  <Accordion title="Artifacts/Glitches">
+    **Cause**: Background noise or audio issues in samples
+
+    **Fix**: Clean up samples or re-record in quieter environment
+
+  </Accordion>
+</AccordionGroup>
+
+## Advanced Tips
+
+### Celebrity/Character Voices
+
+For cloning public figures or characters:
+
+1. **Legal considerations** - Ensure you have rights or it's fair use
+2. **Source quality** - Find high-quality interview audio or clean clips
+3. **Consistency** - Use clips where they speak similarly
+4. **Multiple samples** - Very important for recognizable voices
+
+### Accent & Dialect
+
+The model will preserve accent and dialect:
+
+- British English will generate British English
+- Southern accent will produce Southern accent
+- Regional pronunciations will be maintained
+
+### Emotion Transfer
+
+The emotional tone of samples affects generation:
+
+- Energetic samples → Energetic output
+- Calm samples → Calm output
+- Mix samples for a versatile profile
+
+## Managing Profiles
+
+### Organization
+
+- **Descriptive names** - "John Smith - Professional Narrator"
+- **Add descriptions** - Note recording conditions, use cases
+- **Language tags** - Mark the primary language
+- **Archive unused** - Keep profile list manageable
+
+### Export/Import
+
+- **Export** profiles to share or backup
+- **Import** from colleagues or teammates
+- Profiles include voice embeddings, not original audio
+
+## Next Steps
+
+<CardGroup cols={2}>
+	<Card
+		title="Generate Speech"
+		icon="waveform"
+		href="/overview/generating-speech"
+	>
+		Use your profile to generate speech
+	</Card>
+	<Card title="Build Stories" icon="film" href="/overview/building-stories">
+		Create multi-voice narratives
+	</Card>
+</CardGroup>
diff --git a/docs2/content/docs/overview/meta.json b/docs2/content/docs/overview/meta.json
new file mode 100644
index 00000000..d3906004
--- /dev/null
+++ b/docs2/content/docs/overview/meta.json
@@ -0,0 +1,17 @@
+{
+  "title": "Overview",
+  "pages": [
+    "introduction",
+    "installation",
+    "quick-start",
+    "voice-cloning",
+    "stories-editor",
+    "recording-transcription",
+    "generation-history",
+    "remote-mode",
+    "creating-voice-profiles",
+    "generating-speech",
+    "building-stories",
+    "troubleshooting"
+  ]
+}
diff --git a/docs2/content/docs/overview/quick-start.mdx b/docs2/content/docs/overview/quick-start.mdx
new file mode 100644
index 00000000..dac64fe4
--- /dev/null
+++ b/docs2/content/docs/overview/quick-start.mdx
@@ -0,0 +1,166 @@
+---
+title: "Quick Start"
+description: "Get started with Voicebox in 5 minutes"
+---
+
+This guide will walk you through creating your first voice profile and generating speech.
+
+## Prerequisites
+
+Make sure you have [installed Voicebox](/overview/installation) and launched the app.
+
+## Step 1: Create a Voice Profile
+
+Voice profiles are the foundation of Voicebox. Each profile contains voice samples that the AI uses to clone the voice.
+
+<Steps>
+  <Step title="Navigate to Profiles">
+    Click the **Profiles** tab in the sidebar
+  </Step>
+
+  <Step title="Create New Profile">
+    Click the **+ New Profile** button
+
+    Fill in the details:
+    - **Name:** A descriptive name (e.g., "John Smith")
+    - **Language:** Select the primary language
+    - **Description:** Optional notes about the voice
+
+  </Step>
+
+  <Step title="Add Voice Sample">
+    You have two options:
+
+    **Option A: Upload Audio**
+    - Click **Upload Sample**
+    - Select an audio file (WAV, MP3, or M4A)
+    - Ideal length: 10-30 seconds of clear speech
+
+    **Option B: Record Live**
+    - Click **Record Sample**
+    - Speak clearly for 10-30 seconds
+    - Click stop when finished
+
+  </Step>
+
+  <Step title="Save Profile">
+    Click **Create Profile** to save
+  </Step>
+</Steps>
+
+<Tip>
+	For best results, use clean audio with minimal background noise and consistent
+	speaking tone.
+</Tip>
+
+## Step 2: Generate Speech
+
+Now let's use your new voice profile to generate speech.
+
+<Steps>
+  <Step title="Go to Generation">
+    Click the **Generate** tab in the sidebar
+  </Step>
+
+  <Step title="Select Voice Profile">
+    Choose your newly created profile from the dropdown
+  </Step>
+
+  <Step title="Enter Text">
+    Type or paste the text you want to generate:
+
+    ```
+    Hello! This is my first voice generation with Voicebox.
+    ```
+
+  </Step>
+
+  <Step title="Generate">
+    Click **Generate** and wait a few seconds
+
+    <Note>
+      First generation may take longer due to model initialization. Subsequent generations will be faster.
+    </Note>
+
+  </Step>
+
+  <Step title="Play & Download">
+    - Click **Play** to preview the audio
+    - Click **Download** to save the audio file
+    - The generation is also saved to your **History**
+  </Step>
+</Steps>
+
+## Step 3: Build a Story (Optional)
+
+The Stories Editor lets you create multi-voice narratives with a timeline-based interface.
+
+<Steps>
+  <Step title="Create New Story">
+    Navigate to **Stories** and click **+ New Story**
+  </Step>
+
+  <Step title="Add Voice Tracks">
+    Click **+ Add Track** to create tracks for different speakers
+  </Step>
+
+  <Step title="Add Audio Clips">
+    - Drag generated audio from your History
+    - Or generate new clips directly in the timeline
+    - Arrange clips on the timeline
+  </Step>
+
+  <Step title="Edit & Export">
+    - Trim clips by dragging edges
+    - Adjust timing and spacing
+    - Click **Export** to render the final audio
+  </Step>
+</Steps>
+
+## What's Next?
+
+<CardGroup cols={2}>
+	<Card
+		title="Voice Cloning Guide"
+		icon="microphone"
+		href="/overview/creating-voice-profiles"
+	>
+		Learn advanced techniques for high-quality voice cloning
+	</Card>
+	<Card title="API Integration" icon="code" href="/api-reference">
+		Integrate Voicebox into your own applications
+	</Card>
+	<Card title="Stories Editor" icon="film" href="/overview/stories-editor">
+		Master the multi-track timeline editor
+	</Card>
+	<Card title="Remote Mode" icon="server" href="/overview/remote-mode">
+		Connect to a GPU server for faster generation
+	</Card>
+</CardGroup>
+
+## Tips for Success
+
+<AccordionGroup>
+  <Accordion title="Getting the Best Voice Quality">
+    - Use 10-30 seconds of clear, consistent speech
+    - Avoid background noise and echo
+    - Multiple samples from the same speaker improve quality
+    - Match the speaking style you want to generate
+  </Accordion>
+
+  <Accordion title="Improving Generation Speed">
+    - Use a CUDA-capable GPU for 5-10x faster generation
+    - Enable voice prompt caching for repeated generations
+    - Consider running the backend on a remote GPU server
+  </Accordion>
+
+  <Accordion title="Troubleshooting Common Issues">
+    - **Server won't start:** Check if port 17493 is available
+    - **Poor audio quality:** Try adding more voice samples
+    - **Slow generation:** Verify GPU acceleration is enabled
+    - See the full [Troubleshooting Guide](/overview/troubleshooting) for more
+  </Accordion>
+</AccordionGroup>
diff --git a/docs2/content/docs/plans/DOCKER_DEPLOYMENT.md b/docs2/content/docs/plans/DOCKER_DEPLOYMENT.md
new file mode 100644
index 00000000..988dab91
--- /dev/null
+++ b/docs2/content/docs/plans/DOCKER_DEPLOYMENT.md
@@ -0,0 +1,786 @@
+---
+title: "Docker Deployment Guide"
+description: "Docker deployment guide for Voicebox (In Development)"
+---
+
+**Status:** In Development for v0.2.0
+**Requested By:** Reddit community ([thread](https://reddit.com/r/LocalLLaMA/...))
+
+## Overview
+
+Docker support makes Voicebox easier to deploy, especially for:
+
+- **Consistent Environments**: Same setup across dev/staging/prod
+- **GPU Passthrough**: Easy NVIDIA/AMD GPU access
+- **Server Deployments**: Run on headless Linux servers
+- **Multi-User Setups**: Isolate instances per user/team
+- **Cloud Platforms**: Deploy to AWS, GCP, Azure, DigitalOcean
+
+## Quick Start
+
+### Using Pre-Built Images (Recommended)
+
+```bash
+# CPU-only version
+docker run -p 8000:8000 -v voicebox-data:/app/data \
+  ghcr.io/jamiepine/voicebox:latest
+
+# NVIDIA GPU version
+docker run --gpus all -p 8000:8000 -v voicebox-data:/app/data \
+  ghcr.io/jamiepine/voicebox:latest-cuda
+
+# AMD GPU version (experimental)
+docker run --device=/dev/kfd --device=/dev/dri -p 8000:8000 \
+  -v voicebox-data:/app/data \
+  ghcr.io/jamiepine/voicebox:latest-rocm
+```
+
+Then open: `http://localhost:8000`
+
+### Using Docker Compose (Easiest)
+
+Create `docker-compose.yml`:
+
+```yaml
+version: "3.8"
+
+services:
+  voicebox:
+    image: ghcr.io/jamiepine/voicebox:latest-cuda
+    ports:
+      - "8000:8000"
+    volumes:
+      - voicebox-data:/app/data
+      - huggingface-cache:/root/.cache/huggingface
+    environment:
+      - GPU_MEMORY_FRACTION=0.8 # Use 80% of GPU memory
+      - TTS_MODE=local
+      - WHISPER_MODE=local
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 1
+              capabilities: [gpu]
+
+volumes:
+  voicebox-data:
+  huggingface-cache:
+```
+
+Run:
+
+```bash
+docker compose up -d
+```
+
+## Building From Source
+
+### Basic Dockerfile
+
+```dockerfile
+# Dockerfile
+FROM python:3.11-slim
+
+WORKDIR /app
+
+# Install system dependencies
+RUN apt-get update && apt-get install -y \
+    git \
+    build-essential \
+    ffmpeg \
+    && rm -rf /var/lib/apt/lists/*
+
+# Copy application
+COPY backend/ /app/backend/
+COPY backend/requirements.txt /app/
+
+# Install Python dependencies
+RUN pip install --no-cache-dir -r requirements.txt
+RUN pip install --no-cache-dir git+https://github.com/QwenLM/Qwen3-TTS.git
+
+# Create data directory
+RUN mkdir -p /app/data
+
+# Expose port
+EXPOSE 8000
+
+# Run server
+CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000"]
+```
+
+Build and run:
+
+```bash
+docker build -t voicebox .
+docker run -p 8000:8000 -v $(pwd)/data:/app/data voicebox
+```
+
+### Multi-Stage Build (Optimized)
+
+Smaller image size by separating build and runtime:
+
+```dockerfile
+# Dockerfile.optimized
+# Stage 1: Build dependencies
+FROM python:3.11-slim AS builder
+
+WORKDIR /build
+
+RUN apt-get update && apt-get install -y \
+    git build-essential && \
+    rm -rf /var/lib/apt/lists/*
+
+COPY backend/requirements.txt .
+RUN pip install --no-cache-dir --target=/build/packages \
+    -r requirements.txt
+
+RUN pip install --no-cache-dir --target=/build/packages \
+    git+https://github.com/QwenLM/Qwen3-TTS.git
+
+# Stage 2: Runtime
+FROM python:3.11-slim
+
+WORKDIR /app
+
+# Install only runtime dependencies
+RUN apt-get update && apt-get install -y \
+    ffmpeg \
+    && rm -rf /var/lib/apt/lists/*
+
+# Copy installed packages from builder
+COPY --from=builder /build/packages /usr/local/lib/python3.11/site-packages/
+
+# Copy application code
+COPY backend/ /app/backend/
+
+# Create data directory
+RUN mkdir -p /app/data
+
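+EXPOSE 8000
+# pip --target leaves console scripts in packages/bin (not on PATH), so run uvicorn as a module
+CMD ["python", "-m", "uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000"]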
+```
+
+Build:
+
+```bash
+docker build -f Dockerfile.optimized -t voicebox:slim .
+```
+
+## GPU Support
+
+### NVIDIA GPUs (CUDA)
+
+**Dockerfile:**
+
+```dockerfile
+FROM nvidia/cuda:12.1.0-runtime-ubuntu22.04
+
+# Install Python
+RUN apt-get update && apt-get install -y \
+    python3.11 python3-pip git ffmpeg && \
+    rm -rf /var/lib/apt/lists/*
+
+WORKDIR /app
+
+# Install PyTorch with CUDA support
+COPY backend/requirements.txt .
+RUN pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121
+
+# Install other dependencies
+RUN pip3 install -r requirements.txt
+RUN pip3 install git+https://github.com/QwenLM/Qwen3-TTS.git
+
+COPY backend/ /app/backend/
+
+EXPOSE 8000
+CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000"]
+```
+
+**Run with GPU:**
+
+```bash
+docker run --gpus all -p 8000:8000 \
+  -v voicebox-data:/app/data \
+  voicebox:cuda
+```
+
+**Docker Compose with GPU:**
+
+```yaml
+services:
+  voicebox:
+    image: voicebox:cuda
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: all
+              capabilities: [gpu]
+```
+
+### AMD GPUs (ROCm) - Experimental
+
+**Dockerfile:**
+
+```dockerfile
+FROM rocm/dev-ubuntu-22.04:6.0
+
+# Install Python
+RUN apt-get update && apt-get install -y \
+    python3.11 python3-pip git ffmpeg && \
+    rm -rf /var/lib/apt/lists/*
+
+WORKDIR /app
+
+# Install PyTorch with ROCm support
+COPY backend/requirements.txt .
+RUN pip3 install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/rocm6.0
+
+# Install other dependencies
+RUN pip3 install -r requirements.txt
+RUN pip3 install git+https://github.com/QwenLM/Qwen3-TTS.git
+
+# Set ROCm environment variables
+ENV HSA_OVERRIDE_GFX_VERSION=10.3.0
+ENV ROCM_PATH=/opt/rocm
+
+COPY backend/ /app/backend/
+
+EXPOSE 8000
+CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000"]
+```
+
+**Run with AMD GPU:**
+
+```bash
+docker run --device=/dev/kfd --device=/dev/dri \
+  --group-add video --ipc=host --cap-add=SYS_PTRACE \
+  --security-opt seccomp=unconfined \
+  -p 8000:8000 -v voicebox-data:/app/data \
+  voicebox:rocm
+```
+
+**Note:** ROCm support varies by GPU model. Works best on Linux. See [AMD ROCm docs](https://rocm.docs.amd.com) for compatibility.
+
+## Volume Mounts
+
+### Essential Volumes
+
+```bash
+# voicebox-data: profiles, generations, history; huggingface-cache: downloaded models
+docker run -v voicebox-data:/app/data -v huggingface-cache:/root/.cache/huggingface \
+           -p 8000:8000 voicebox
+```
+
+### Development Volume Mounts
+
+For development with hot-reload:
+
+```bash
+# Bind-mount ./backend so code changes are picked up live
+docker run -v $(pwd)/backend:/app/backend -v voicebox-data:/app/data \
+           -e RELOAD=true \
+           -p 8000:8000 voicebox
+```
+
+### Custom Model Storage
+
+Use external model directory:
+
+```bash
+docker run -v /path/to/models:/models \
+           -e MODELS_DIR=/models \
+           -v voicebox-data:/app/data \
+           -p 8000:8000 voicebox
+```
+
+## Environment Variables
+
+Configure Voicebox via environment variables:
+
+```bash
+docker run -e TTS_MODE=local \
+           -e WHISPER_MODE=openai-api \
+           -e OPENAI_API_KEY=sk-... \
+           -e GPU_MEMORY_FRACTION=0.8 \
+           -e LOG_LEVEL=info \
+           -p 8000:8000 voicebox
+```
+
+### Available Variables
+
+| Variable              | Default       | Description                                        |
+| --------------------- | ------------- | -------------------------------------------------- |
+| `TTS_MODE`            | `local`       | TTS provider: `local`, `remote`                    |
+| `TTS_REMOTE_URL`      | -             | URL for remote TTS server                          |
+| `WHISPER_MODE`        | `local`       | Whisper provider: `local`, `openai-api`, `remote`  |
+| `WHISPER_REMOTE_URL`  | -             | URL for remote Whisper server                      |
+| `OPENAI_API_KEY`      | -             | OpenAI API key (if using OpenAI Whisper)           |
+| `GPU_MEMORY_FRACTION` | `0.9`         | Fraction of GPU memory to use (0.0-1.0)            |
+| `DATA_DIR`            | `/app/data`   | Directory for profiles/generations                 |
+| `MODELS_DIR`          | `/app/models` | Directory for local models                         |
+| `LOG_LEVEL`           | `info`        | Logging level: `debug`, `info`, `warning`, `error` |
+| `RELOAD`              | `false`       | Enable hot-reload for development                  |
+
+## Complete Docker Compose Examples
+
+### Production Deployment
+
+```yaml
+# docker-compose.prod.yml
+version: "3.8"
+
+services:
+  voicebox:
+    image: ghcr.io/jamiepine/voicebox:latest-cuda
+    container_name: voicebox
+    restart: unless-stopped
+    ports:
+      - "8000:8000"
+    volumes:
+      - voicebox-data:/app/data
+      - huggingface-cache:/root/.cache/huggingface
+    environment:
+      - TTS_MODE=local
+      - WHISPER_MODE=local
+      - GPU_MEMORY_FRACTION=0.8
+      - LOG_LEVEL=info
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 1
+              capabilities: [gpu]
+    healthcheck:
+      test: ["CMD", "curl", "-f", "http://localhost:8000/health"]
+      interval: 30s
+      timeout: 10s
+      retries: 3
+      start_period: 40s
+
+volumes:
+  voicebox-data:
+    driver: local
+  huggingface-cache:
+    driver: local
+```
+
+Run:
+
+```bash
+docker compose -f docker-compose.prod.yml up -d
+```
+
+### Development Setup
+
+```yaml
+# docker-compose.dev.yml
+version: "3.8"
+
+services:
+  voicebox:
+    build:
+      context: .
+      dockerfile: Dockerfile
+    ports:
+      - "8000:8000"
+    volumes:
+      - ./backend:/app/backend:ro
+      - voicebox-data:/app/data
+      - huggingface-cache:/root/.cache/huggingface
+    environment:
+      - RELOAD=true
+      - LOG_LEVEL=debug
+      - TTS_MODE=local
+    command: uvicorn backend.main:app --host 0.0.0.0 --port 8000 --reload
+
+volumes:
+  voicebox-data:
+  huggingface-cache:
+```
+
+### Multi-Service Stack
+
+Full stack with reverse proxy and monitoring:
+
+```yaml
+# docker-compose.stack.yml
+version: "3.8"
+
+services:
+  # Main Voicebox app
+  voicebox:
+    image: ghcr.io/jamiepine/voicebox:latest-cuda
+    restart: unless-stopped
+    volumes:
+      - voicebox-data:/app/data
+      - huggingface-cache:/root/.cache/huggingface
+    environment:
+      - TTS_MODE=local
+      - WHISPER_MODE=local
+    deploy:
+      resources:
+        reservations:
+          devices:
+            - driver: nvidia
+              count: 1
+              capabilities: [gpu]
+
+  # Nginx reverse proxy
+  nginx:
+    image: nginx:alpine
+    ports:
+      - "80:80"
+      - "443:443"
+    volumes:
+      - ./nginx.conf:/etc/nginx/nginx.conf:ro
+      - ./ssl:/etc/nginx/ssl:ro
+    depends_on:
+      - voicebox
+
+  # Prometheus monitoring (optional)
+  prometheus:
+    image: prom/prometheus
+    ports:
+      - "9090:9090"
+    volumes:
+      - ./prometheus.yml:/etc/prometheus/prometheus.yml
+      - prometheus-data:/prometheus
+
+volumes:
+  voicebox-data:
+  huggingface-cache:
+  prometheus-data:
+```
+
+## Cloud Deployment
+
+### AWS EC2
+
+1. **Launch GPU Instance** (g4dn.xlarge or p3.2xlarge)
+2. **Install Docker + NVIDIA Container Toolkit:**
+   ```bash
+   # Amazon Linux 2
+   sudo yum install -y docker
+   sudo systemctl start docker
+   # Add NVIDIA's RPM repository and install the container toolkit
+   curl -s -L https://nvidia.github.io/libnvidia-container/stable/rpm/nvidia-container-toolkit.repo | \
+     sudo tee /etc/yum.repos.d/nvidia-container-toolkit.repo
+   sudo yum install -y nvidia-container-toolkit
+   sudo nvidia-ctk runtime configure --runtime=docker
+   sudo systemctl restart docker
+   ```
+3. **Deploy:**
+   ```bash
+   docker run --gpus all -d -p 80:8000 \
+     -v voicebox-data:/app/data \
+     --restart unless-stopped \
+     ghcr.io/jamiepine/voicebox:latest-cuda
+   ```
+
+### DigitalOcean
+
+Use GPU Droplet + Docker:
+
+```bash
+# Create droplet via CLI
+doctl compute droplet create voicebox \
+  --size gpu-h100x1-80gb \
+  --image ubuntu-22-04-x64 \
+  --region nyc3
+
+# SSH and deploy
+ssh root@<droplet-ip>
+curl -fsSL https://get.docker.com -o get-docker.sh
+sh get-docker.sh
+docker run --gpus all -d -p 80:8000 ghcr.io/jamiepine/voicebox:latest-cuda
+```
+
+### Google Cloud Run (CPU-only)
+
+```bash
+# Build and push
+docker build -t gcr.io/your-project/voicebox .
+docker push gcr.io/your-project/voicebox
+
+# Deploy to Cloud Run
+gcloud run deploy voicebox \
+  --image gcr.io/your-project/voicebox \
+  --platform managed \
+  --region us-central1 \
+  --memory 4Gi \
+  --cpu 2 \
+  --port 8000
+```
+
+### Fly.io
+
+Create `fly.toml`:
+
+```toml
+app = "voicebox"
+
+[build]
+  image = "ghcr.io/jamiepine/voicebox:latest"
+
+[[services]]
+  http_checks = []
+  internal_port = 8000
+  protocol = "tcp"
+
+  [[services.ports]]
+    port = 80
+    handlers = ["http"]
+
+  [[services.ports]]
+    port = 443
+    handlers = ["tls", "http"]
+
+[mounts]
+  source = "voicebox_data"
+  destination = "/app/data"
+```
+
+Deploy:
+
+```bash
+fly launch
+fly deploy
+```
+
+## Troubleshooting
+
+### GPU Not Detected
+
+**Check NVIDIA Docker:**
+
+```bash
+docker run --rm --gpus all nvidia/cuda:12.1.0-base-ubuntu22.04 nvidia-smi
+```
+
+If this fails, reinstall nvidia-docker2.
+
+**Check AMD ROCm:**
+
+```bash
+docker run --rm --device=/dev/kfd --device=/dev/dri rocm/dev-ubuntu-22.04:6.0 rocminfo
+```
+
+### Permission Errors
+
+Container can't write to volumes:
+
+```bash
+# Fix permissions
+docker run --user $(id -u):$(id -g) -v $(pwd)/data:/app/data voicebox
+```
+
+### Out of Memory
+
+Reduce GPU memory usage:
+
+```bash
+docker run -e GPU_MEMORY_FRACTION=0.5 voicebox
+```
+
+Or use CPU-only:
+
+```bash
+docker run -e DEVICE=cpu voicebox
+```
+
+### Model Download Fails
+
+Ensure HuggingFace cache is writable:
+
+```bash
+docker run -v huggingface-cache:/root/.cache/huggingface voicebox
+```
+
+Or use host cache:
+
+```bash
+docker run -v ~/.cache/huggingface:/root/.cache/huggingface voicebox
+```
+
+### Port Already in Use
+
+Change host port:
+
+```bash
+docker run -p 8080:8000 voicebox  # Use port 8080 instead
+```
+
+## Security Best Practices
+
+### 1. Don't Run as Root
+
+Create non-root user in Dockerfile:
+
+```dockerfile
+RUN useradd -m -u 1000 voicebox
+USER voicebox
+```
+
+### 2. Use Secrets for API Keys
+
+Don't put API keys in docker-compose.yml:
+
+```bash
+# Use Docker secrets
+echo "sk-your-key" | docker secret create openai_key -
+
+docker service create \
+  --secret openai_key \
+  -e OPENAI_API_KEY_FILE=/run/secrets/openai_key \
+  voicebox
+```
+
+### 3. Network Isolation
+
+Use internal networks for multi-container setups:
+
+```yaml
+services:
+  voicebox:
+    networks:
+      - internal
+  nginx:
+    networks:
+      - internal
+      - external
+    ports:
+      - "80:80"
+
+networks:
+  internal:
+    internal: true
+  external:
+```
+
+### 4. Resource Limits
+
+Prevent resource exhaustion:
+
+```yaml
+services:
+  voicebox:
+    deploy:
+      resources:
+        limits:
+          cpus: "4"
+          memory: 8G
+        reservations:
+          cpus: "2"
+          memory: 4G
+```
+
+## Performance Tuning
+
+### GPU Memory Management
+
+```bash
+# Use 80% of GPU (default 90%)
+docker run -e GPU_MEMORY_FRACTION=0.8 voicebox
+
+# Reduce fragmentation-related OOMs in PyTorch's CUDA allocator
+docker run -e PYTORCH_CUDA_ALLOC_CONF=expandable_segments:True voicebox
+```
+
+### Model Caching
+
+Pre-download models to volume:
+
+```bash
+# Download models first
+docker run --rm -v huggingface-cache:/root/.cache/huggingface \
+  voicebox python -c "
+from transformers import WhisperProcessor, WhisperForConditionalGeneration
+WhisperProcessor.from_pretrained('openai/whisper-base')
+WhisperForConditionalGeneration.from_pretrained('openai/whisper-base')
+"
+
+# Then run normally
+docker run -v huggingface-cache:/root/.cache/huggingface voicebox
+```
+
+### Multi-Worker Setup
+
+Use uvicorn workers for better throughput:
+
+```dockerfile
+CMD ["uvicorn", "backend.main:app", "--host", "0.0.0.0", "--port", "8000", "--workers", "4"]
+```
+
+## Monitoring
+
+### Health Checks
+
+Built-in health endpoint:
+
+```bash
+curl http://localhost:8000/health
+```
+
+Docker health check:
+
+```yaml
+healthcheck:
+  test: ["CMD", "curl", "-f", "http://localhost:8000/health"]
+  interval: 30s
+  timeout: 10s
+  retries: 3
+```
+
+### Prometheus Metrics
+
+Add metrics exporter:
+
+```python
+# backend/main.py
+from prometheus_fastapi_instrumentator import Instrumentator
+
+Instrumentator().instrument(app).expose(app)
+```
+
+Then scrape `/metrics` with Prometheus.
+
+### Logs
+
+View container logs:
+
+```bash
+docker logs -f voicebox
+
+# Or with compose
+docker compose logs -f voicebox
+```
+
+## Next Steps
+
+- [ ] Publish official images to GitHub Container Registry
+- [ ] Add Kubernetes Helm charts
+- [ ] Create Docker Desktop extension
+- [ ] Add automated vulnerability scanning
+- [ ] Support ARM64 builds for Raspberry Pi / Apple Silicon
+
+## Contributing
+
+Help improve Docker support:
+
+1. Test on different platforms (AMD GPU, ARM64, etc.)
+2. Submit Dockerfile optimizations
+3. Share deployment configurations
+4. Report issues: [GitHub Issues](https://github.com/jamiepine/voicebox/issues)
+
+## Resources
+
+- [Docker Documentation](https://docs.docker.com)
+- [NVIDIA Container Toolkit](https://github.com/NVIDIA/nvidia-container-toolkit)
+- [AMD ROCm Docker](https://rocm.docs.amd.com/projects/install-on-linux/en/latest/how-to/docker.html)
+- [Docker Compose Reference](https://docs.docker.com/compose/compose-file/)
diff --git a/docs2/content/docs/plans/EXTERNAL_PROVIDERS.md b/docs2/content/docs/plans/EXTERNAL_PROVIDERS.md
new file mode 100644
index 00000000..24cea16f
--- /dev/null
+++ b/docs2/content/docs/plans/EXTERNAL_PROVIDERS.md
@@ -0,0 +1,461 @@
+---
+title: "External Provider Support"
+description: "External provider support for Voicebox (Planned)"
+---
+
+**Status:** Planned for v0.2.0
+**Discussion:** [Reddit Thread](https://reddit.com/r/LocalLLaMA/...)
+
+## Overview
+
+External provider support allows you to connect Voicebox to remotely-hosted TTS and Whisper services instead of running models locally. This is useful for:
+
+- **Existing GPU Infrastructure**: You already have Qwen3-TTS running on a GPU server
+- **AMD GPU Users**: Run models on your AMD hardware, use Voicebox as the UI
+- **Cloud Deployments**: Host models on Modal, Replicate, RunPod, etc.
+- **Team Sharing**: Multiple users share one GPU server running models
+- **Mixed Deployments**: Local Whisper + remote TTS, or vice versa
+
+## Architecture
+
+```
+┌─────────────────┐         HTTP/API         ┌──────────────────┐
+│   Voicebox UI   │ ───────────────────────> │  Your TTS Server │
+│   + Backend     │                           │  (Qwen3-TTS on   │
+│                 │ <─────────────────────── │   AMD/NVIDIA GPU)│
+│  - Profiles     │      Audio + Metadata     └──────────────────┘
+│  - History      │
+│  - Audio Edit   │         HTTP/API         ┌──────────────────┐
+│  - UI           │ ───────────────────────> │ Whisper Service  │
+└─────────────────┘                           │ (OpenAI API or   │
+                                              │  self-hosted)    │
+                                              └──────────────────┘
+```
+
+**What Voicebox Still Handles:**
+
+- Voice profile management
+- Generation history
+- Audio trimming/editing
+- Multi-track story editor
+- UI/UX layer
+
+**What External Providers Handle:**
+
+- Model inference (TTS generation, transcription)
+- GPU allocation
+- Model loading/caching
+
+## Configuration
+
+### Environment Variables
+
+```bash
+# TTS Provider
+TTS_MODE=remote                              # local | remote
+TTS_REMOTE_URL=http://192.168.1.100:8000    # Your TTS server URL
+TTS_API_KEY=your-api-key                     # Optional authentication
+
+# Whisper Provider
+WHISPER_MODE=openai-api                      # local | openai-api | remote
+WHISPER_REMOTE_URL=http://localhost:9000     # For self-hosted Whisper
+OPENAI_API_KEY=sk-...                        # For OpenAI Whisper API
+```
+
+### Voicebox Config UI (Planned)
+
+Settings page will include:
+
+- Provider selection dropdowns
+- URL/API key inputs
+- Connection test button
+- Latency/status indicators
+
+## Hosting External Services
+
+### Option 1: Simple FastAPI Server (Recommended)
+
+Create a lightweight server to expose your local Qwen3-TTS model:
+
+```python
+# tts_server.py
+from fastapi import Body, FastAPI, File, Form, UploadFile
+from qwen_tts import Qwen3TTSModel
+import numpy as np
+import base64
+
+app = FastAPI()
+model = Qwen3TTSModel.from_pretrained(
+    "Qwen/Qwen3-TTS-12Hz-1.7B-Base",
+    device_map="cuda"  # ROCm builds of PyTorch also expose AMD GPUs as "cuda"; use "cpu" if no GPU
+)
+
+@app.post("/v1/generate")
+async def generate(
+    text: str = Body(...),
+    voice_prompt: dict = Body(...),
+    language: str = Body("en"),
+    seed: int = Body(None)
+):
+    """Generate speech from text using voice prompt."""
+    audio, sample_rate = model.generate_voice_clone(
+        text=text,
+        voice_clone_prompt=voice_prompt,
+    )
+
+    # Return as base64 for transport
+    audio_bytes = audio.tobytes()
+    return {
+        "audio": base64.b64encode(audio_bytes).decode(),
+        "sample_rate": sample_rate,
+        "dtype": str(audio.dtype)
+    }
+
+@app.post("/v1/create_voice_prompt")
+async def create_voice_prompt(
+    audio: UploadFile = File(...),
+    reference_text: str = Form("")
+):
+    """Create voice prompt from reference audio."""
+    # Save uploaded audio temporarily
+    audio_path = f"/tmp/{audio.filename}"
+    with open(audio_path, "wb") as f:
+        f.write(await audio.read())
+
+    # Create voice prompt
+    voice_prompt = model.create_voice_clone_prompt(
+        ref_audio=audio_path,
+        ref_text=reference_text,
+    )
+
+    return {"voice_prompt": voice_prompt}
+
+@app.get("/health")
+async def health():
+    return {
+        "status": "healthy",
+        "model": "Qwen3-TTS-12Hz-1.7B-Base",
+        "device": str(model.device)
+    }
+
+if __name__ == "__main__":
+    import uvicorn
+    uvicorn.run(app, host="0.0.0.0", port=8000)
+```
+
+**Run it:**
+
+```bash
+# Install dependencies
+pip install fastapi uvicorn python-multipart qwen-tts torch
+
+# For AMD GPUs, use ROCm PyTorch:
+pip install torch --index-url https://download.pytorch.org/whl/rocm6.4
+
+# Start server
+python tts_server.py
+```
+
+### Option 2: vLLM (If Supported)
+
+```bash
+vllm serve Qwen/Qwen3-TTS-12Hz-1.7B-Base \
+  --host 0.0.0.0 \
+  --port 8000 \
+  --gpu-memory-utilization 0.9
+```
+
+### Option 3: Cloud Platforms
+
+**Modal.com Example:**
+
+```python
+import modal
+
+app = modal.App("qwen-tts")
+image = modal.Image.debian_slim().pip_install("qwen-tts", "torch")
+
+@app.function(gpu="A10G", image=image)
+@modal.web_endpoint(method="POST")
+def generate(text: str, voice_prompt: dict):
+    from qwen_tts import Qwen3TTSModel
+    model = Qwen3TTSModel.from_pretrained("Qwen/Qwen3-TTS-12Hz-1.7B-Base")
+    audio, sr = model.generate_voice_clone(text, voice_prompt)
+    return {"audio": audio.tolist(), "sample_rate": sr}
+```
+
+Deploy: `modal deploy tts_server.py`
+Get URL: `https://yourapp--generate.modal.run`
+
+## API Specification
+
+External TTS providers must implement these endpoints:
+
+### `POST /v1/generate`
+
+Generate speech from text.
+
+**Request:**
+
+```json
+{
+	"text": "Hello, this is a test.",
+	"voice_prompt": {
+		/* voice prompt object */
+	},
+	"language": "en",
+	"seed": 12345
+}
+```
+
+**Response:**
+
+```json
+{
+	"audio": "base64-encoded-audio-bytes",
+	"sample_rate": 24000,
+	"dtype": "float32"
+}
+```
+
+### `POST /v1/create_voice_prompt`
+
+Create a voice prompt from reference audio.
+
+**Request:** (multipart/form-data)
+
+- `audio`: Audio file upload
+- `reference_text`: Transcript of the audio
+
+**Response:**
+
+```json
+{
+	"voice_prompt": {
+		/* voice prompt object */
+	}
+}
+```
+
+### `GET /health`
+
+Health check endpoint.
+
+**Response:**
+
+```json
+{
+	"status": "healthy",
+	"model": "Qwen3-TTS-12Hz-1.7B-Base",
+	"device": "cuda:0"
+}
+```
+
+## Whisper External Providers
+
+### OpenAI Whisper API
+
+Simply set:
+
+```bash
+WHISPER_MODE=openai-api
+OPENAI_API_KEY=sk-...
+```
+
+Voicebox will use OpenAI's Whisper API automatically.
+
+### Self-Hosted Whisper
+
+Run your own Whisper server:
+
+```python
+# whisper_server.py
+from fastapi import FastAPI, UploadFile, File
+from transformers import WhisperProcessor, WhisperForConditionalGeneration
+import librosa
+
+app = FastAPI()
+processor = WhisperProcessor.from_pretrained("openai/whisper-base")
+model = WhisperForConditionalGeneration.from_pretrained("openai/whisper-base")
+
+@app.post("/v1/transcribe")
+async def transcribe(audio: UploadFile = File(...), language: str = None):
+    # Load audio
+    audio_path = f"/tmp/{audio.filename}"
+    with open(audio_path, "wb") as f:
+        f.write(await audio.read())
+
+    audio_data, sr = librosa.load(audio_path, sr=16000)
+
+    # Process
+    inputs = processor(audio_data, sampling_rate=16000, return_tensors="pt")
+    predicted_ids = model.generate(inputs["input_features"])
+    transcription = processor.batch_decode(predicted_ids, skip_special_tokens=True)[0]
+
+    return {"text": transcription}
+```
+
+Configure Voicebox:
+
+```bash
+WHISPER_MODE=remote
+WHISPER_REMOTE_URL=http://localhost:9000
+```
+
+## Use Cases
+
+### 1. AMD GPU User with Existing Setup
+
+**Scenario:** You have a Radeon 7900 XTX running Qwen3-TTS on Linux.
+
+**Setup:**
+
+1. Run `tts_server.py` on your AMD box (ROCm PyTorch)
+2. Configure Voicebox: `TTS_MODE=remote`, `TTS_REMOTE_URL=http://amd-box:8000`
+3. Use Voicebox UI for profiles, generation, editing
+4. TTS happens on your AMD GPU
+
+### 2. Team Deployment
+
+**Scenario:** 5 team members, 1 GPU server.
+
+**Setup:**
+
+1. Deploy TTS server on shared GPU box
+2. Each person runs Voicebox desktop app locally
+3. All point to same `TTS_REMOTE_URL`
+4. Profiles and history stay local per user
+5. GPU usage is shared
+
+### 3. Hybrid Local/Remote
+
+**Scenario:** Fast local Whisper, heavy TTS on cloud.
+
+**Setup:**
+
+```bash
+TTS_MODE=remote
+TTS_REMOTE_URL=https://your-modal-app.modal.run
+
+WHISPER_MODE=local  # Fast transcription on your CPU
+```
+
+### 4. OpenAI Whisper + Self-Hosted TTS
+
+**Scenario:** Use OpenAI's API for transcription, run TTS locally.
+
+**Setup:**
+
+```bash
+TTS_MODE=local
+
+WHISPER_MODE=openai-api
+OPENAI_API_KEY=sk-...
+```
+
+## Security Considerations
+
+### Authentication
+
+Add API key authentication to your external server:
+
+```python
+from fastapi import Depends, Header, HTTPException
+
+API_KEY = "your-secret-key"
+
+async def verify_api_key(x_api_key: str = Header(...)):
+    if x_api_key != API_KEY:
+        raise HTTPException(status_code=401, detail="Invalid API key")
+
+@app.post("/v1/generate", dependencies=[Depends(verify_api_key)])
+async def generate(...):
+    ...
+```
+
+Configure Voicebox:
+
+```bash
+TTS_API_KEY=your-secret-key
+```
+
+### Network Security
+
+- **VPN/Tailscale**: Use private network for remote servers
+- **HTTPS**: Use reverse proxy (nginx/Caddy) with SSL certificates
+- **Firewall**: Restrict access to known IPs
+
+### Rate Limiting
+
+Protect your external server:
+
+```python
+from slowapi import Limiter
+from slowapi.util import get_remote_address
+
+limiter = Limiter(key_func=get_remote_address)
+app.state.limiter = limiter
+
+@app.post("/v1/generate")
+@limiter.limit("10/minute")
+async def generate(...):
+    ...
+```
+
+## Performance Considerations
+
+### Latency
+
+External providers add network latency:
+
+- **Local network**: ~10-50ms overhead (negligible)
+- **Same datacenter**: ~1-5ms overhead
+- **Cross-region cloud**: 50-200ms+ overhead
+
+For real-time applications, keep TTS server on local network or same cloud region.
+
+### Caching
+
+Implement response caching on external server:
+
+```python
+from functools import lru_cache
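+# voice_prompts maps a prompt hash to its voice prompt (dicts are unhashable, so cache by hash)
+@lru_cache(maxsize=1000)
+def get_cached_generation(text, voice_prompt_hash, language, seed):
+    return model.generate_voice_clone(text, voice_prompts[voice_prompt_hash])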
+```
+
+### Load Balancing
+
+For high-traffic deployments, run multiple TTS servers behind a load balancer:
+
+```
+Voicebox ──> Load Balancer ──> TTS Server 1 (GPU 1)
+                           ├──> TTS Server 2 (GPU 2)
+                           └──> TTS Server 3 (GPU 3)
+```
+
+## Future Enhancements
+
+- [ ] **Provider Marketplace**: Built-in directory of compatible providers
+- [ ] **Automatic Fallback**: If remote fails, fallback to local
+- [ ] **Cost Tracking**: Monitor API usage and costs
+- [ ] **Performance Metrics**: Latency, throughput dashboards
+- [ ] **Multi-Provider**: Use different providers for different voices/languages
+
+## Contributing
+
+If you build an external provider, please share:
+
+1. Server implementation
+2. Performance benchmarks
+3. Deployment guide
+
+Submit to: [GitHub Discussions](https://github.com/jamiepine/voicebox/discussions)
+
+## Questions?
+
+- **Discord**: [Join the community](https://discord.gg/...)
+- **GitHub**: [Open an issue](https://github.com/jamiepine/voicebox/issues)
+- **Docs**: [Full documentation](https://voicebox.sh/docs)
diff --git a/docs2/content/docs/plans/MLX_AUDIO.md b/docs2/content/docs/plans/MLX_AUDIO.md
new file mode 100644
index 00000000..021911fc
--- /dev/null
+++ b/docs2/content/docs/plans/MLX_AUDIO.md
@@ -0,0 +1,431 @@
+---
+title: "MLX Audio Integration"
+description: "MLX Audio integration for Voicebox (Validated)"
+---
+
+**Status:** Validated ✅
+**Context:** [mlx-audio v0.3.1 release](https://github.com/Blaizzy/mlx-audio)
+
+## Validation Results
+
+We validated mlx-audio in an isolated environment (`mlx-test/`). Key findings:
+
+| Metric          | Result                                      |
+| --------------- | ------------------------------------------- |
+| MLX Version     | 0.30.4                                      |
+| Model Load Time | ~1s (after initial download)                |
+| Generation RTF  | **0.5-0.6x** (1.7-2x faster than real-time) |
+| Test Hardware   | Apple Silicon Mac                           |
+
+### Model Mapping
+
+| voicebox (PyTorch)              | mlx-audio (MLX)                               |
+| ------------------------------- | --------------------------------------------- |
+| `Qwen/Qwen3-TTS-12Hz-1.7B-Base` | `mlx-community/Qwen3-TTS-12Hz-1.7B-Base-bf16` |
+| `Qwen/Qwen3-TTS-12Hz-0.6B-Base` | (not yet converted)                           |
+
+### mlx-audio API
+
+The API uses a **generator-based streaming pattern**:
+
+```python
+from mlx_audio.tts import load
+
+model = load("mlx-community/Qwen3-TTS-12Hz-1.7B-Base-bf16")
+
+# generate() yields GenerationResult objects
+for result in model.generate("Hello world"):
+    audio = result.audio           # numpy array of samples
+    sample_rate = result.sample_rate  # 24000
+    rtf = result.real_time_factor  # e.g., 0.55
+```
+
+### Known Warnings (harmless)
+
+```
+You are using a model of type qwen3_tts to instantiate a model of type .
+The tokenizer you are loading... with an incorrect regex pattern...
+```
+
+These warnings appear but don't affect functionality or output quality.
+
+### Demo Script
+
+Run `mlx-test/demo.py` to test:
+
+```bash
+cd mlx-test && source venv/bin/activate && python demo.py "Your text here"
+```
+
+## Problem
+
+Apple Silicon users are stuck on CPU inference while Windows and Linux users get CUDA acceleration. The current PyTorch MPS backend has stability issues (lines 34-36 in `backend/tts.py` and `backend/transcribe.py`), forcing a CPU fallback that makes voicebox significantly slower on M1/M2/M3 Macs.
+
+This creates a poor experience for a large portion of users who bought Apple Silicon specifically for ML workloads.
+
+## Solution
+
+Integrate [mlx-audio](https://github.com/Blaizzy/mlx-audio) as the inference engine for macOS Apple Silicon builds. MLX is Apple's native ML framework, optimized for Metal and the unified memory architecture. It's fast, stable, and already supports the same Qwen3-TTS models we use.
+
+**Key wins:**
+
+- Native GPU acceleration on Apple Silicon (no more CPU fallback)
+- Streaming TTS support (faster perceived latency)
+- Memory optimizations (run larger models on less RAM)
+- Fixes the 0.6B silence bug that we currently ship
+- Same Qwen3-TTS models (zero migration cost for users)
+
+## Architecture
+
+### Current Stack
+
+```
+┌─────────────────────────┐
+│   PyTorch + Qwen3-TTS   │
+│   (CPU only on macOS)   │
+└─────────────────────────┘
+```
+
+### Proposed Stack
+
+```
+┌─────────────────────────────────────────┐
+│  Platform Detection at Runtime          │
+└─────────────────────────────────────────┘
+           │
+           ├─── Apple Silicon (aarch64-darwin)
+           │    ┌─────────────────────────┐
+           │    │  MLX Audio Backend      │
+           │    │  - Qwen3-TTS (mlx)      │
+           │    │  - Whisper (mlx)        │
+           │    │  - Streaming support    │
+           │    └─────────────────────────┘
+           │
+           └─── Other (x86_64, Windows, Linux)
+                ┌─────────────────────────┐
+                │  PyTorch Backend        │
+                │  - Qwen3-TTS (pytorch)  │
+                │  - Whisper (pytorch)    │
+                │  - CUDA if available    │
+                └─────────────────────────┘
+```
+
+## Implementation Phases
+
+### Phase 1: Platform Detection & Dependency Management
+
+Create a backend that switches between PyTorch and MLX based on runtime platform detection.
+
+**New files:**
+
+- `backend/platform.py` - Detect Apple Silicon, return backend type
+- `backend/backends/__init__.py` - Backend factory pattern
+- `backend/requirements-mlx.txt` - MLX-specific deps (macOS only)
+
+**Modified files:**
+
+- `backend/requirements.txt` - Keep PyTorch as default
+- `backend/main.py` - Import from backend factory instead of direct imports
+
+**Platform detection logic:**
+
+```python
+def get_backend_type() -> str:
+    """Detect best backend for current platform."""
+    if platform.system() == "Darwin" and platform.machine() == "arm64":
+        # Apple Silicon detected
+        try:
+            import mlx
+            return "mlx"
+        except ImportError:
+            return "pytorch"  # Fallback if mlx not installed
+    return "pytorch"
+```
+
+### Phase 2: MLX Backend Implementation
+
+Create parallel implementations of TTS and STT using mlx-audio.
+
+**New files:**
+
+- `backend/backends/mlx_backend.py` - MLX inference engine
+- `backend/backends/pytorch_backend.py` - Refactor current code into backend
+
+**Interface both backends must implement:**
+
+```python
+class TTSBackend(Protocol):
+    async def load_model(self, model_size: str) -> None: ...
+    async def create_voice_prompt(self, audio_path: str, reference_text: str) -> dict: ...
+    async def generate(self, text: str, voice_prompt: dict, **kwargs) -> Tuple[np.ndarray, int]: ...
+    async def generate_streaming(self, text: str, voice_prompt: dict, **kwargs) -> AsyncIterator[bytes]: ...
+    def unload_model(self) -> None: ...
+
+class STTBackend(Protocol):
+    async def load_model(self, model_size: str) -> None: ...
+    async def transcribe(self, audio_path: str, language: Optional[str]) -> str: ...
+    def unload_model(self) -> None: ...
+```
+
+**MLX backend implementation notes:**
+
+mlx-audio's `generate()` returns a generator by default (streaming is built-in):
+
+```python
+# MLX backend wrapper
+from mlx_audio.tts import load
+
+class MLXTTSBackend:
+    def __init__(self):
+        self.model = None
+
+    async def load_model(self, model_size: str) -> None:
+        model_map = {
+            "1.7B": "mlx-community/Qwen3-TTS-12Hz-1.7B-Base-bf16",
+            # "0.6B": needs conversion to mlx format
+        }
+        self.model = load(model_map[model_size])
+
+    async def generate(self, text: str, voice_prompt: dict, **kwargs) -> Tuple[np.ndarray, int]:
+        # Collect all chunks from generator
+        chunks = []
+        for result in self.model.generate(text):  # TODO: add voice_prompt support
+            chunks.append(np.array(result.audio))
+        return np.concatenate(chunks), 24000
+```
+
+**MLX-specific features to expose:**
+
+- Streaming TTS (new endpoint: `/api/generate/stream`)
+- Memory-optimized model loading
+- Qwen3-ASR for transcription (in addition to Whisper)
+
+### Phase 3: API Layer Updates
+
+Update FastAPI endpoints to support new streaming capabilities and maintain backward compatibility.
+
+**Modified files:**
+
+- `backend/main.py` - Add streaming endpoints
+- `backend/tts.py` - Refactor to use backend abstraction
+- `backend/transcribe.py` - Refactor to use backend abstraction
+
+**New endpoints:**
+
+```python
+@app.post("/api/generate/stream")
+async def generate_stream(...) -> StreamingResponse:
+    """Stream TTS chunks as they're generated (MLX only)."""
+    backend = get_backend()
+    if not hasattr(backend, 'generate_streaming'):
+        raise HTTPException(501, "Streaming not supported on this backend")
+    return StreamingResponse(backend.generate_streaming(...), media_type="audio/wav")
+```
+
+**Backward compatibility:**
+
+- Keep all existing `/api/generate` endpoints unchanged
+- PyTorch backend users see no behavior change
+- MLX users automatically get faster inference; streaming is opt-in
+
+### Phase 4: Frontend Integration
+
+Add UI indicators for backend type and streaming progress.
+
+**Modified files:**
+
+- `app/src/hooks/useGenerationForm.tsx` - Add streaming support
+- `app/src/components/GenerationForm.tsx` - Show backend badge, streaming toggle
+- `app/src/lib/api.ts` - Add streaming API client
+
+**UI additions:**
+
+- Badge showing current backend ("MLX" or "PyTorch")
+- Toggle for streaming mode (disabled if PyTorch)
+- Real-time streaming playback (WaveSurfer progressive loading)
+
+### Phase 5: Build & Distribution
+
+Create separate installers for MLX (Apple Silicon) and PyTorch (Universal).
+
+**Modified files:**
+
+- `tauri/src-tauri/tauri.conf.json` - Add target-specific builds
+- `.github/workflows/release.yml` - Build both variants
+
+**Build matrix:**
+
+```yaml
+- target: aarch64-apple-darwin
+  backend: mlx
+  installer: voicebox-macos-silicon-{version}.dmg
+
+- target: x86_64-apple-darwin
+  backend: pytorch
+  installer: voicebox-macos-intel-{version}.dmg
+
+- target: x86_64-pc-windows-msvc
+  backend: pytorch
+  installer: voicebox-windows-{version}.exe
+```
+
+**Installation flow:**
+
+- Auto-detect architecture, recommend correct installer
+- MLX installer includes `mlx-audio` in embedded Python
+- PyTorch installer includes `torch` in embedded Python
+- Both can coexist (different backend, same profile format)
+
+### Phase 6: Testing & Validation
+
+Ensure both backends produce compatible outputs.
+
+**New files:**
+
+- `backend/tests/test_backend_parity.py` - Verify both backends produce similar audio
+- `backend/tests/test_streaming.py` - Streaming-specific tests
+
+**Test scenarios:**
+
+- Same voice prompt on both backends → similar (not identical) audio output
+- Profile created on MLX → loads on PyTorch (and vice versa)
+- Streaming chunks assemble into valid WAV file
+- Model downloads work on both backends
+- Memory usage stays within bounds
+
+### Phase 7: Documentation
+
+Update user-facing docs and developer guides.
+
+**New files:**
+
+- `docs/developer/BACKENDS.md` - Guide for adding new backends
+- `docs/overview/performance.md` - Backend comparison benchmarks
+
+**Modified files:**
+
+- `README.md` - Note Apple Silicon acceleration
+- `docs/TROUBLESHOOTING.md` - Add MLX-specific issues
+
+**Key docs to write:**
+
+- Which installer to download (architecture detection)
+- Performance comparison (MLX vs PyTorch on same M2 hardware)
+- How streaming mode works
+- How to force PyTorch on Apple Silicon (for debugging)
+
+## Technical Decisions
+
+### Why Dual Backend Instead of MLX-Only?
+
+**Pros of dual backend:**
+
+- Windows and Intel Mac users unaffected
+- Easier testing (can compare outputs)
+- Fallback if MLX has issues
+
+**Cons of dual backend:**
+
+- More code to maintain
+- Two dependency trees
+- Build complexity (separate installers)
+
+**Decision:** Dual backend. The maintenance cost is worth it to avoid breaking existing users and to have a fallback.
+
+### Why Separate Installers Instead of Runtime Detection?
+
+**Pros of separate installers:**
+
+- Smaller bundle size (don't ship both PyTorch and MLX)
+- Clearer to users which version they have
+- Easier to debug (no "which backend am I running?" confusion)
+- Can optimize each build for its target
+
+**Cons:**
+
+- More installers to build and test
+- Users might download the wrong one
+
+**Decision:** Separate installers. Bundle size matters (PyTorch + MLX would be huge), and we can auto-detect architecture on the download page.
+
+### Streaming vs Batch Generation
+
+MLX supports streaming; PyTorch doesn't (without significant work). Should streaming be:
+
+1. MLX-only feature (✅ chosen)
+2. Implemented for both (lots of work)
+3. Not exposed at all (wasted opportunity)
+
+**Decision:** MLX-only. Expose as opt-in feature with graceful degradation (button disabled on PyTorch backend).
+
+## Migration Path
+
+Nothing needs migrating; macOS users will simply notice faster inference.
+
+**Data format compatibility:**
+
+- Profiles (SQLite) → no schema changes needed
+- Voice prompts (cached) → backend-agnostic (just numpy arrays)
+- Audio files → unchanged
+
+## Performance Expectations
+
+### Measured Results (from validation)
+
+| Metric                  | MLX (measured) | PyTorch CPU (estimated) |
+| ----------------------- | -------------- | ----------------------- |
+| **6s audio generation** | ~3-4s          | ~10-15s                 |
+| **Real-time factor**    | 0.5-0.6x       | 2-3x                    |
+| **Model load (cached)** | ~1s            | ~3-5s                   |
+
+### TTS Generation (1.7B model, ~20s output)
+
+- **PyTorch CPU (M2 Max):** ~45-60s (slower than real-time)
+- **MLX (M2 Max):** ~8-12s (faster than real-time)
+- **Improvement:** ~4-5x faster
+
+### Whisper Transcription (10s audio clip)
+
+- **PyTorch CPU:** ~5-8s
+- **MLX:** ~1-2s
+- **Improvement:** ~3-4x faster
+
+### Memory Usage (1.7B model)
+
+- **PyTorch:** ~8-10GB (no GPU offload, so CPU RAM)
+- **MLX:** ~4-6GB (unified memory, better optimization)
+- **Improvement:** ~40% less RAM
+
+Full benchmarks will be in `docs/overview/performance.md` after Phase 6.
+
+## Open Questions
+
+- **Should we support Qwen3-ASR (MLX-only) in addition to Whisper?** Adds another model option but increases complexity. Probably phase 8+. **Answer:** Yes.
+- **Should we backport streaming to PyTorch?** Would require chunking and callback-based generation. Probably not worth it given mlx-audio already has it. **Answer:** No.
+- **What's the auto-update UX for migrating PyTorch→MLX users?** Needs design. Don't want to force reinstall, but also want to make upgrade obvious. **Answer:** It just updates; users see nothing.
+- **Do we expose backend selection in settings or hide it?** Leaning toward auto-detect only, with env var override for power users.
+
+## Success Metrics
+
+How we'll know this worked:
+
+1. **Performance:** Apple Silicon users report generation faster than real-time
+2. **Adoption:** >80% of macOS downloads are MLX build within 1 month
+3. **Stability:** <5% increase in bug reports (backend abstraction doesn't introduce regressions)
+4. **Feedback:** Positive sentiment in Discord/GitHub about macOS performance
+
+## Related Work
+
+- [PyTorch MPS tracking issue](https://github.com/pytorch/pytorch/issues/77764) - Why we can't use MPS directly
+- [mlx-audio server implementation](https://github.com/Blaizzy/mlx-audio/blob/main/examples/server.py) - Reference for streaming API
+- [MLX Whisper benchmarks](https://github.com/ml-explore/mlx-examples/tree/main/whisper) - Performance data
+
+## Next Steps
+
+1. ~~Validate mlx-audio can load Qwen3-TTS models (quick test)~~ ✅ Done - see `mlx-test/`
+2. Get approval on dual-backend architecture
+3. Start Phase 1 (platform detection)
+
+## Questions?
+
+Feedback welcome in GitHub discussions or Discord.
diff --git a/docs2/content/docs/plans/OPENAI_SUPPORT.md b/docs2/content/docs/plans/OPENAI_SUPPORT.md
new file mode 100644
index 00000000..e570dcf0
--- /dev/null
+++ b/docs2/content/docs/plans/OPENAI_SUPPORT.md
@@ -0,0 +1,238 @@
+---
+title: "OpenAI API Compatibility"
+description: "OpenAI API compatibility for Voicebox (Planned)"
+---
+
+**Status:** Planned for v0.2.0
+
+**Issue:** [#10 OpenAI API compatibility](https://github.com/jamiepine/voicebox/issues/10)
+
+## Overview
+
+This feature exposes OpenAI-compatible endpoints from Voicebox, allowing any tool, library, or application that speaks the OpenAI Audio API to use Voicebox as a drop-in local replacement.
+
+```mermaid
+flowchart LR
+    subgraph clients [External Clients]
+        SDK[OpenAI SDK]
+        Curl[curl / HTTP]
+        Apps[Third-party Apps]
+    end
+
+    subgraph voicebox [Voicebox Server]
+        OpenAI["/v1/audio/* endpoints"]
+        TTS[TTSModel]
+        Whisper[WhisperModel]
+        Profiles[Voice Profiles]
+    end
+
+    SDK --> OpenAI
+    Curl --> OpenAI
+    Apps --> OpenAI
+    OpenAI --> TTS
+    OpenAI --> Whisper
+    OpenAI --> Profiles
+```
+
+## Use Cases
+
+- **OpenAI SDK users**: `openai.audio.speech.create()` works with Voicebox
+- **LLM frameworks**: LangChain, AutoGen, etc. can use Voicebox for TTS
+- **Shell scripts**: `curl` commands copy-pasted from OpenAI docs work
+- **Existing integrations**: Any tool expecting OpenAI's API works without code changes
+
+## Endpoints to Implement
+
+### 1. `POST /v1/audio/speech` (TTS)
+
+OpenAI spec: https://platform.openai.com/docs/api-reference/audio/createSpeech
+
+**Request:**
+
+```json
+{
+	"model": "tts-1",
+	"input": "Hello world!",
+	"voice": "alloy",
+	"response_format": "mp3",
+	"speed": 1.0
+}
+```
+
+**Response:** Audio file (mp3, wav, opus, aac, flac, pcm)
+
+**Voice Mapping Strategy:**
+
+- `voice` parameter maps to Voicebox profile names (case-insensitive)
+- If no match, use a configurable default profile
+- Support special syntax: `voice: "profile:uuid"` for explicit profile ID
+
+### 2. `POST /v1/audio/transcriptions` (Whisper)
+
+OpenAI spec: https://platform.openai.com/docs/api-reference/audio/createTranscription
+
+**Request:** (multipart/form-data)
+
+- `file`: Audio file
+- `model`: "whisper-1"
+- `language`: Optional language hint
+- `response_format`: json, text, srt, verbose_json, vtt
+
+**Response:**
+
+```json
+{
+	"text": "Hello world!"
+}
+```
+
+## Implementation Details
+
+### New File: `backend/openai_compat.py`
+
+Create a dedicated module with an APIRouter for OpenAI-compatible endpoints:
+
+```python
+from fastapi import APIRouter, UploadFile, File, Form, HTTPException
+from fastapi.responses import StreamingResponse
+from pydantic import BaseModel
+from typing import Literal, Optional
+
+router = APIRouter(prefix="/v1/audio", tags=["OpenAI Compatible"])
+
+class SpeechRequest(BaseModel):
+    model: str = "tts-1"
+    input: str
+    voice: str = "alloy"
+    response_format: Literal["mp3", "wav", "opus", "aac", "flac", "pcm"] = "mp3"
+    speed: float = 1.0
+
+@router.post("/speech")
+async def create_speech(request: SpeechRequest, db: Session = Depends(get_db)):
+    # 1. Map voice name to profile
+    # 2. Generate audio using existing TTSModel
+    # 3. Convert to requested format
+    # 4. Return audio stream
+    ...
+
+@router.post("/transcriptions")
+async def create_transcription(
+    file: UploadFile = File(...),
+    model: str = Form("whisper-1"),
+    language: Optional[str] = Form(None),
+    response_format: str = Form("json"),
+):
+    # 1. Save uploaded file
+    # 2. Transcribe using existing WhisperModel
+    # 3. Return in requested format
+    ...
+```
+
+### Voice Profile Resolution
+
+Add helper in [backend/profiles.py](backend/profiles.py):
+
+```python
+async def resolve_voice_for_openai(voice: str, db: Session) -> Optional[VoiceProfile]:
+    """
+    Resolve OpenAI voice parameter to a Voicebox profile.
+
+    Priority:
+    1. Exact profile name match (case-insensitive)
+    2. Profile ID match (if voice starts with "profile:")
+    3. Default profile from config
+    4. First available profile
+    """
+    ...
+```
+
+### Audio Format Conversion
+
+Add conversion utilities in [backend/utils/audio.py](backend/utils/audio.py):
+
+```python
+def convert_audio_format(
+    audio: np.ndarray,
+    sample_rate: int,
+    target_format: str,  # mp3, wav, opus, aac, flac, pcm
+) -> bytes:
+    """Convert audio to target format using ffmpeg or pydub."""
+    ...
+```
+
+### Configuration
+
+Add to [backend/config.py](backend/config.py):
+
+```python
+# OpenAI API Compatibility
+OPENAI_COMPAT_ENABLED = True
+OPENAI_COMPAT_DEFAULT_VOICE = None  # Profile ID or name for default voice
+OPENAI_COMPAT_REQUIRE_AUTH = False  # Require API key validation
+OPENAI_COMPAT_API_KEY = None        # If set, validate against this
+```
+
+### Integration with main.py
+
+In [backend/main.py](backend/main.py), include the router:
+
+```python
+from . import openai_compat
+
+# Add OpenAI-compatible routes
+if config.OPENAI_COMPAT_ENABLED:
+    app.include_router(openai_compat.router)
+```
+
+## Streaming Support (Future Enhancement)
+
+Initial implementation returns complete audio. Streaming can be added later:
+
+```python
+@router.post("/speech")
+async def create_speech(request: SpeechRequest):
+    if request.stream:
+        return StreamingResponse(
+            generate_audio_chunks(request),
+            media_type=f"audio/{request.response_format}"
+        )
+    ...
+```
+
+## Testing
+
+Example usage after implementation:
+
+```bash
+# TTS with curl
+curl http://localhost:8000/v1/audio/speech \
+  -H "Content-Type: application/json" \
+  -d '{"model": "tts-1", "input": "Hello!", "voice": "MyProfile"}' \
+  --output speech.mp3
+
+# With OpenAI Python SDK (this part is Python, not shell — run it in a Python interpreter)
+from openai import OpenAI
+client = OpenAI(base_url="http://localhost:8000/v1", api_key="unused")
+response = client.audio.speech.create(
+    model="tts-1",
+    voice="MyProfile",
+    input="Hello world!"
+)
+response.stream_to_file("output.mp3")
+
+# Transcription
+curl http://localhost:8000/v1/audio/transcriptions \
+  -F file=@audio.mp3 \
+  -F model="whisper-1"
+```
+
+## Security Considerations
+
+- Optional API key validation (for shared deployments)
+- Rate limiting on endpoints
+- Input length limits (same as existing `/generate` endpoint)
+
+## Dependencies
+
+- `pydub` or `ffmpeg-python` for audio format conversion (mp3, opus, etc.)
+- No changes to existing TTS/Whisper model code
diff --git a/docs2/content/docs/plans/meta.json b/docs2/content/docs/plans/meta.json
new file mode 100644
index 00000000..fc3ea779
--- /dev/null
+++ b/docs2/content/docs/plans/meta.json
@@ -0,0 +1,4 @@
+{
+  "title": "Plans",
+  "pages": ["DOCKER_DEPLOYMENT", "EXTERNAL_PROVIDERS", "MLX_AUDIO", "OPENAI_SUPPORT"]
+}
diff --git a/docs2/lib/layout.shared.tsx b/docs2/lib/layout.shared.tsx
new file mode 100644
index 00000000..1d8ed146
--- /dev/null
+++ b/docs2/lib/layout.shared.tsx
@@ -0,0 +1,9 @@
+import type { BaseLayoutProps } from 'fumadocs-ui/layouts/shared';
+
+export function baseOptions(): BaseLayoutProps {
+  return {
+    nav: {
+      title: 'Voicebox',
+    },
+  };
+}
diff --git a/docs2/mdx-components.tsx b/docs2/mdx-components.tsx
new file mode 100644
index 00000000..68824788
--- /dev/null
+++ b/docs2/mdx-components.tsx
@@ -0,0 +1,39 @@
+import defaultMdxComponents from 'fumadocs-ui/mdx';
+import type { MDXComponents } from 'mdx/types';
+import { APIPage } from '@/components/api-page';
+import {
+  Accordion,
+  AccordionGroup,
+  CardGroup,
+  Danger,
+  Frame,
+  Info,
+  MintlifyCard,
+  Note,
+  Step,
+  Steps,
+  Tip,
+  Warning,
+} from '@/components/mintlify-compat';
+
+export function getMDXComponents(components?: MDXComponents): MDXComponents {
+  return {
+    ...defaultMdxComponents,
+    // Mintlify compatibility components
+    Frame,
+    CardGroup,
+    Card: MintlifyCard,
+    Steps,
+    Step,
+    Tip,
+    Note,
+    Warning,
+    Info,
+    Danger,
+    AccordionGroup,
+    Accordion,
+    // OpenAPI component
+    APIPage,
+    ...components,
+  };
+}
diff --git a/docs2/openapi.json b/docs2/openapi.json
new file mode 100644
index 00000000..b573a920
--- /dev/null
+++ b/docs2/openapi.json
@@ -0,0 +1,877 @@
+{
+  "openapi": "3.1.0",
+  "info": {
+    "title": "voicebox API",
+    "description": "Production-quality Qwen3-TTS voice cloning API",
+    "version": "0.1.0"
+  },
+  "servers": [{ "url": "http://localhost:8000", "description": "Local development server" }],
+  "paths": {
+    "/": {
+      "get": {
+        "summary": "Root",
+        "description": "Root endpoint.",
+        "operationId": "root__get",
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": { "application/json": { "schema": {} } }
+          }
+        }
+      }
+    },
+    "/health": {
+      "get": {
+        "summary": "Health",
+        "description": "Health check endpoint.",
+        "operationId": "health_health_get",
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": { "schema": { "$ref": "#/components/schemas/HealthResponse" } }
+            }
+          }
+        }
+      }
+    },
+    "/profiles": {
+      "get": {
+        "summary": "List Profiles",
+        "description": "List all voice profiles.",
+        "operationId": "list_profiles_profiles_get",
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "items": { "$ref": "#/components/schemas/VoiceProfileResponse" },
+                  "type": "array",
+                  "title": "Response List Profiles Profiles Get"
+                }
+              }
+            }
+          }
+        }
+      },
+      "post": {
+        "summary": "Create Profile",
+        "description": "Create a new voice profile.",
+        "operationId": "create_profile_profiles_post",
+        "requestBody": {
+          "content": {
+            "application/json": { "schema": { "$ref": "#/components/schemas/VoiceProfileCreate" } }
+          },
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/VoiceProfileResponse" }
+              }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/profiles/{profile_id}": {
+      "get": {
+        "summary": "Get Profile",
+        "description": "Get a voice profile by ID.",
+        "operationId": "get_profile_profiles__profile_id__get",
+        "parameters": [
+          {
+            "name": "profile_id",
+            "in": "path",
+            "required": true,
+            "schema": { "type": "string", "title": "Profile Id" }
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/VoiceProfileResponse" }
+              }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      },
+      "put": {
+        "summary": "Update Profile",
+        "description": "Update a voice profile.",
+        "operationId": "update_profile_profiles__profile_id__put",
+        "parameters": [
+          {
+            "name": "profile_id",
+            "in": "path",
+            "required": true,
+            "schema": { "type": "string", "title": "Profile Id" }
+          }
+        ],
+        "requestBody": {
+          "required": true,
+          "content": {
+            "application/json": { "schema": { "$ref": "#/components/schemas/VoiceProfileCreate" } }
+          }
+        },
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/VoiceProfileResponse" }
+              }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      },
+      "delete": {
+        "summary": "Delete Profile",
+        "description": "Delete a voice profile.",
+        "operationId": "delete_profile_profiles__profile_id__delete",
+        "parameters": [
+          {
+            "name": "profile_id",
+            "in": "path",
+            "required": true,
+            "schema": { "type": "string", "title": "Profile Id" }
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": { "application/json": { "schema": {} } }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/profiles/{profile_id}/samples": {
+      "post": {
+        "summary": "Add Profile Sample",
+        "description": "Add a sample to a voice profile.",
+        "operationId": "add_profile_sample_profiles__profile_id__samples_post",
+        "parameters": [
+          {
+            "name": "profile_id",
+            "in": "path",
+            "required": true,
+            "schema": { "type": "string", "title": "Profile Id" }
+          }
+        ],
+        "requestBody": {
+          "required": true,
+          "content": {
+            "multipart/form-data": {
+              "schema": {
+                "$ref": "#/components/schemas/Body_add_profile_sample_profiles__profile_id__samples_post"
+              }
+            }
+          }
+        },
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/ProfileSampleResponse" }
+              }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      },
+      "get": {
+        "summary": "Get Profile Samples",
+        "description": "Get all samples for a profile.",
+        "operationId": "get_profile_samples_profiles__profile_id__samples_get",
+        "parameters": [
+          {
+            "name": "profile_id",
+            "in": "path",
+            "required": true,
+            "schema": { "type": "string", "title": "Profile Id" }
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": {
+                  "type": "array",
+                  "items": { "$ref": "#/components/schemas/ProfileSampleResponse" },
+                  "title": "Response Get Profile Samples Profiles  Profile Id  Samples Get"
+                }
+              }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/profiles/samples/{sample_id}": {
+      "delete": {
+        "summary": "Delete Profile Sample",
+        "description": "Delete a profile sample.",
+        "operationId": "delete_profile_sample_profiles_samples__sample_id__delete",
+        "parameters": [
+          {
+            "name": "sample_id",
+            "in": "path",
+            "required": true,
+            "schema": { "type": "string", "title": "Sample Id" }
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": { "application/json": { "schema": {} } }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/generate": {
+      "post": {
+        "summary": "Generate Speech",
+        "description": "Generate speech from text using a voice profile.",
+        "operationId": "generate_speech_generate_post",
+        "requestBody": {
+          "content": {
+            "application/json": { "schema": { "$ref": "#/components/schemas/GenerationRequest" } }
+          },
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/GenerationResponse" }
+              }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/history": {
+      "get": {
+        "summary": "List History",
+        "description": "List generation history with optional filters.",
+        "operationId": "list_history_history_get",
+        "parameters": [
+          {
+            "name": "profile_id",
+            "in": "query",
+            "required": false,
+            "schema": { "anyOf": [{ "type": "string" }, { "type": "null" }], "title": "Profile Id" }
+          },
+          {
+            "name": "search",
+            "in": "query",
+            "required": false,
+            "schema": { "anyOf": [{ "type": "string" }, { "type": "null" }], "title": "Search" }
+          },
+          {
+            "name": "limit",
+            "in": "query",
+            "required": false,
+            "schema": { "type": "integer", "default": 50, "title": "Limit" }
+          },
+          {
+            "name": "offset",
+            "in": "query",
+            "required": false,
+            "schema": { "type": "integer", "default": 0, "title": "Offset" }
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HistoryListResponse" }
+              }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/history/{generation_id}": {
+      "get": {
+        "summary": "Get Generation",
+        "description": "Get a generation by ID.",
+        "operationId": "get_generation_history__generation_id__get",
+        "parameters": [
+          {
+            "name": "generation_id",
+            "in": "path",
+            "required": true,
+            "schema": { "type": "string", "title": "Generation Id" }
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": { "schema": { "$ref": "#/components/schemas/HistoryResponse" } }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      },
+      "delete": {
+        "summary": "Delete Generation",
+        "description": "Delete a generation.",
+        "operationId": "delete_generation_history__generation_id__delete",
+        "parameters": [
+          {
+            "name": "generation_id",
+            "in": "path",
+            "required": true,
+            "schema": { "type": "string", "title": "Generation Id" }
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": { "application/json": { "schema": {} } }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/history/stats": {
+      "get": {
+        "summary": "Get Stats",
+        "description": "Get generation statistics.",
+        "operationId": "get_stats_history_stats_get",
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": { "application/json": { "schema": {} } }
+          }
+        }
+      }
+    },
+    "/transcribe": {
+      "post": {
+        "summary": "Transcribe Audio",
+        "description": "Transcribe audio file to text.",
+        "operationId": "transcribe_audio_transcribe_post",
+        "requestBody": {
+          "content": {
+            "multipart/form-data": {
+              "schema": { "$ref": "#/components/schemas/Body_transcribe_audio_transcribe_post" }
+            }
+          },
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/TranscriptionResponse" }
+              }
+            }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/audio/{generation_id}": {
+      "get": {
+        "summary": "Get Audio",
+        "description": "Serve generated audio file.",
+        "operationId": "get_audio_audio__generation_id__get",
+        "parameters": [
+          {
+            "name": "generation_id",
+            "in": "path",
+            "required": true,
+            "schema": { "type": "string", "title": "Generation Id" }
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": { "application/json": { "schema": {} } }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/models/load": {
+      "post": {
+        "summary": "Load Model",
+        "description": "Manually load TTS model.",
+        "operationId": "load_model_models_load_post",
+        "parameters": [
+          {
+            "name": "model_size",
+            "in": "query",
+            "required": false,
+            "schema": { "type": "string", "default": "1.7B", "title": "Model Size" }
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": { "application/json": { "schema": {} } }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/models/unload": {
+      "post": {
+        "summary": "Unload Model",
+        "description": "Unload TTS model to free memory.",
+        "operationId": "unload_model_models_unload_post",
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": { "application/json": { "schema": {} } }
+          }
+        }
+      }
+    },
+    "/models/progress/{model_name}": {
+      "get": {
+        "summary": "Get Model Progress",
+        "description": "Get model download progress via Server-Sent Events.",
+        "operationId": "get_model_progress_models_progress__model_name__get",
+        "parameters": [
+          {
+            "name": "model_name",
+            "in": "path",
+            "required": true,
+            "schema": { "type": "string", "title": "Model Name" }
+          }
+        ],
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": { "application/json": { "schema": {} } }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/models/status": {
+      "get": {
+        "summary": "Get Model Status",
+        "description": "Get status of all available models.",
+        "operationId": "get_model_status_models_status_get",
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/ModelStatusListResponse" }
+              }
+            }
+          }
+        }
+      }
+    },
+    "/models/download": {
+      "post": {
+        "summary": "Trigger Model Download",
+        "description": "Trigger download of a specific model.",
+        "operationId": "trigger_model_download_models_download_post",
+        "requestBody": {
+          "content": {
+            "application/json": {
+              "schema": { "$ref": "#/components/schemas/ModelDownloadRequest" }
+            }
+          },
+          "required": true
+        },
+        "responses": {
+          "200": {
+            "description": "Successful Response",
+            "content": { "application/json": { "schema": {} } }
+          },
+          "422": {
+            "description": "Validation Error",
+            "content": {
+              "application/json": {
+                "schema": { "$ref": "#/components/schemas/HTTPValidationError" }
+              }
+            }
+          }
+        }
+      }
+    }
+  },
+  "components": {
+    "schemas": {
+      "Body_add_profile_sample_profiles__profile_id__samples_post": {
+        "properties": {
+          "file": { "type": "string", "format": "binary", "title": "File" },
+          "reference_text": { "type": "string", "title": "Reference Text" }
+        },
+        "type": "object",
+        "required": ["file", "reference_text"],
+        "title": "Body_add_profile_sample_profiles__profile_id__samples_post"
+      },
+      "Body_transcribe_audio_transcribe_post": {
+        "properties": {
+          "file": { "type": "string", "format": "binary", "title": "File" },
+          "language": { "anyOf": [{ "type": "string" }, { "type": "null" }], "title": "Language" }
+        },
+        "type": "object",
+        "required": ["file"],
+        "title": "Body_transcribe_audio_transcribe_post"
+      },
+      "GenerationRequest": {
+        "properties": {
+          "profile_id": { "type": "string", "title": "Profile Id" },
+          "text": { "type": "string", "maxLength": 5000, "minLength": 1, "title": "Text" },
+          "language": {
+            "type": "string",
+            "pattern": "^(en|zh)$",
+            "title": "Language",
+            "default": "en"
+          },
+          "seed": {
+            "anyOf": [{ "type": "integer", "minimum": 0.0 }, { "type": "null" }],
+            "title": "Seed"
+          },
+          "model_size": {
+            "anyOf": [{ "type": "string", "pattern": "^(1\\.7B|0\\.6B)$" }, { "type": "null" }],
+            "title": "Model Size",
+            "default": "1.7B"
+          }
+        },
+        "type": "object",
+        "required": ["profile_id", "text"],
+        "title": "GenerationRequest",
+        "description": "Request model for voice generation."
+      },
+      "GenerationResponse": {
+        "properties": {
+          "id": { "type": "string", "title": "Id" },
+          "profile_id": { "type": "string", "title": "Profile Id" },
+          "text": { "type": "string", "title": "Text" },
+          "language": { "type": "string", "title": "Language" },
+          "audio_path": { "type": "string", "title": "Audio Path" },
+          "duration": { "type": "number", "title": "Duration" },
+          "seed": { "anyOf": [{ "type": "integer" }, { "type": "null" }], "title": "Seed" },
+          "created_at": { "type": "string", "format": "date-time", "title": "Created At" }
+        },
+        "type": "object",
+        "required": [
+          "id",
+          "profile_id",
+          "text",
+          "language",
+          "audio_path",
+          "duration",
+          "seed",
+          "created_at"
+        ],
+        "title": "GenerationResponse",
+        "description": "Response model for voice generation."
+      },
+      "HTTPValidationError": {
+        "properties": {
+          "detail": {
+            "items": { "$ref": "#/components/schemas/ValidationError" },
+            "type": "array",
+            "title": "Detail"
+          }
+        },
+        "type": "object",
+        "title": "HTTPValidationError"
+      },
+      "HealthResponse": {
+        "properties": {
+          "status": { "type": "string", "title": "Status" },
+          "model_loaded": { "type": "boolean", "title": "Model Loaded" },
+          "model_downloaded": {
+            "anyOf": [{ "type": "boolean" }, { "type": "null" }],
+            "title": "Model Downloaded"
+          },
+          "model_size": {
+            "anyOf": [{ "type": "string" }, { "type": "null" }],
+            "title": "Model Size"
+          },
+          "gpu_available": { "type": "boolean", "title": "Gpu Available" },
+          "vram_used_mb": {
+            "anyOf": [{ "type": "number" }, { "type": "null" }],
+            "title": "Vram Used Mb"
+          }
+        },
+        "type": "object",
+        "required": ["status", "model_loaded", "gpu_available"],
+        "title": "HealthResponse",
+        "description": "Response model for health check."
+      },
+      "HistoryListResponse": {
+        "properties": {
+          "items": {
+            "items": { "$ref": "#/components/schemas/HistoryResponse" },
+            "type": "array",
+            "title": "Items"
+          },
+          "total": { "type": "integer", "title": "Total" }
+        },
+        "type": "object",
+        "required": ["items", "total"],
+        "title": "HistoryListResponse",
+        "description": "Response model for history list."
+      },
+      "HistoryResponse": {
+        "properties": {
+          "id": { "type": "string", "title": "Id" },
+          "profile_id": { "type": "string", "title": "Profile Id" },
+          "profile_name": { "type": "string", "title": "Profile Name" },
+          "text": { "type": "string", "title": "Text" },
+          "language": { "type": "string", "title": "Language" },
+          "audio_path": { "type": "string", "title": "Audio Path" },
+          "duration": { "type": "number", "title": "Duration" },
+          "seed": { "anyOf": [{ "type": "integer" }, { "type": "null" }], "title": "Seed" },
+          "created_at": { "type": "string", "format": "date-time", "title": "Created At" }
+        },
+        "type": "object",
+        "required": [
+          "id",
+          "profile_id",
+          "profile_name",
+          "text",
+          "language",
+          "audio_path",
+          "duration",
+          "seed",
+          "created_at"
+        ],
+        "title": "HistoryResponse",
+        "description": "Response model for history entry (includes profile name)."
+      },
+      "ModelDownloadRequest": {
+        "properties": { "model_name": { "type": "string", "title": "Model Name" } },
+        "type": "object",
+        "required": ["model_name"],
+        "title": "ModelDownloadRequest",
+        "description": "Request model for triggering model download."
+      },
+      "ModelStatus": {
+        "properties": {
+          "model_name": { "type": "string", "title": "Model Name" },
+          "display_name": { "type": "string", "title": "Display Name" },
+          "downloaded": { "type": "boolean", "title": "Downloaded" },
+          "size_mb": { "anyOf": [{ "type": "number" }, { "type": "null" }], "title": "Size Mb" },
+          "loaded": { "type": "boolean", "title": "Loaded", "default": false }
+        },
+        "type": "object",
+        "required": ["model_name", "display_name", "downloaded"],
+        "title": "ModelStatus",
+        "description": "Response model for model status."
+      },
+      "ModelStatusListResponse": {
+        "properties": {
+          "models": {
+            "items": { "$ref": "#/components/schemas/ModelStatus" },
+            "type": "array",
+            "title": "Models"
+          }
+        },
+        "type": "object",
+        "required": ["models"],
+        "title": "ModelStatusListResponse",
+        "description": "Response model for model status list."
+      },
+      "ProfileSampleResponse": {
+        "properties": {
+          "id": { "type": "string", "title": "Id" },
+          "profile_id": { "type": "string", "title": "Profile Id" },
+          "audio_path": { "type": "string", "title": "Audio Path" },
+          "reference_text": { "type": "string", "title": "Reference Text" }
+        },
+        "type": "object",
+        "required": ["id", "profile_id", "audio_path", "reference_text"],
+        "title": "ProfileSampleResponse",
+        "description": "Response model for profile sample."
+      },
+      "TranscriptionResponse": {
+        "properties": {
+          "text": { "type": "string", "title": "Text" },
+          "duration": { "type": "number", "title": "Duration" }
+        },
+        "type": "object",
+        "required": ["text", "duration"],
+        "title": "TranscriptionResponse",
+        "description": "Response model for transcription."
+      },
+      "ValidationError": {
+        "properties": {
+          "loc": {
+            "items": { "anyOf": [{ "type": "string" }, { "type": "integer" }] },
+            "type": "array",
+            "title": "Location"
+          },
+          "msg": { "type": "string", "title": "Message" },
+          "type": { "type": "string", "title": "Error Type" }
+        },
+        "type": "object",
+        "required": ["loc", "msg", "type"],
+        "title": "ValidationError"
+      },
+      "VoiceProfileCreate": {
+        "properties": {
+          "name": { "type": "string", "maxLength": 100, "minLength": 1, "title": "Name" },
+          "description": {
+            "anyOf": [{ "type": "string", "maxLength": 500 }, { "type": "null" }],
+            "title": "Description"
+          },
+          "language": {
+            "type": "string",
+            "pattern": "^(en|zh)$",
+            "title": "Language",
+            "default": "en"
+          }
+        },
+        "type": "object",
+        "required": ["name"],
+        "title": "VoiceProfileCreate",
+        "description": "Request model for creating a voice profile."
+      },
+      "VoiceProfileResponse": {
+        "properties": {
+          "id": { "type": "string", "title": "Id" },
+          "name": { "type": "string", "title": "Name" },
+          "description": {
+            "anyOf": [{ "type": "string" }, { "type": "null" }],
+            "title": "Description"
+          },
+          "language": { "type": "string", "title": "Language" },
+          "created_at": { "type": "string", "format": "date-time", "title": "Created At" },
+          "updated_at": { "type": "string", "format": "date-time", "title": "Updated At" }
+        },
+        "type": "object",
+        "required": ["id", "name", "description", "language", "created_at", "updated_at"],
+        "title": "VoiceProfileResponse",
+        "description": "Response model for voice profile."
+      }
+    }
+  }
+}
diff --git a/docs2/package.json b/docs2/package.json
new file mode 100644
index 00000000..1d14cd8f
--- /dev/null
+++ b/docs2/package.json
@@ -0,0 +1,32 @@
+{
+  "name": "example-next-mdx",
+  "version": "0.0.0",
+  "private": true,
+  "scripts": {
+    "build": "fumadocs-mdx && next build",
+    "dev": "fumadocs-mdx && next dev",
+    "start": "next start",
+    "postinstall": "fumadocs-mdx"
+  },
+  "dependencies": {
+    "fumadocs-core": "^16.4.11",
+    "fumadocs-mdx": "13",
+    "fumadocs-openapi": "^10.2.7",
+    "fumadocs-ui": "^16.4.11",
+    "lucide-react": "^0.546.0",
+    "next": "^16.1.6",
+    "react": "^19.2.0",
+    "react-dom": "^19.2.0",
+    "shiki": "^3.22.0"
+  },
+  "devDependencies": {
+    "@tailwindcss/postcss": "^4.1.15",
+    "@types/mdx": "^2.0.13",
+    "@types/node": "^24.9.1",
+    "@types/react": "^19.2.2",
+    "@types/react-dom": "^19.2.2",
+    "postcss": "^8.5.6",
+    "tailwindcss": "^4.1.15",
+    "typescript": "^5.9.3"
+  }
+}
diff --git a/landing/package.json b/landing/package.json
index 655e57a6..8af4d00e 100644
--- a/landing/package.json
+++ b/landing/package.json
@@ -1,6 +1,6 @@
 {
   "name": "@voicebox/landing",
-  "version": "0.1.12",
+  "version": "0.1.13",
   "description": "Landing page for voicebox.sh",
   "scripts": {
     "dev": "bun --bun next dev --turbo",
diff --git a/package.json b/package.json
index c0f3c21e..fd5b78ed 100644
--- a/package.json
+++ b/package.json
@@ -1,6 +1,6 @@
 {
   "name": "voicebox",
-  "version": "0.1.12",
+  "version": "0.1.13",
   "private": true,
   "workspaces": [
     "app",
@@ -18,6 +18,7 @@
     "build:web": "cd web && bun run build",
     "build:landing": "cd landing && bun run build",
     "build:release": "./scripts/prepare-release.sh",
+    "build:providers": "python scripts/build-providers-local.py",
     "generate:api": "./scripts/generate-api.sh",
     "generate:keys": "cd tauri && bun tauri signer generate -w ~/.tauri/voicebox.key",
     "build:server": "./scripts/build-server.sh",
diff --git a/providers/README.md b/providers/README.md
new file mode 100644
index 00000000..6f4a6f42
--- /dev/null
+++ b/providers/README.md
@@ -0,0 +1,312 @@
+# TTS Provider Architecture
+
+This document explains how Voicebox's modular TTS provider system works.
+
+## Overview
+
+Voicebox uses a **pluggable provider architecture** that separates the main application from TTS inference. This solves several problems:
+
+- **GitHub's 2GB release limit** - CUDA builds are ~2.4GB, too large for GitHub releases
+- **Faster app updates** - UI/feature updates don't require re-downloading heavy ML binaries
+- **User choice** - Users can pick CPU, CUDA, or external providers based on their hardware
+
+## Architecture Diagram
+
+```
+┌─────────────────────────────────────────────────────────────┐
+│  Voicebox App                                               │
+│  ├─ UI (React)                                              │
+│  ├─ Backend (FastAPI)                                       │
+│  │   ├─ Voice Profiles                                      │
+│  │   ├─ Generation History                                  │
+│  │   ├─ Whisper STT (bundled)                               │
+│  │   └─ Provider Manager ◄────────────────┐                 │
+│  │                                         │                │
+│  └─ providers/                             │                │
+│      ├─ bundled.py (wraps backends/)       │                │
+│      └─ local.py (HTTP client)─────────────┼───┐            │
+│                                            │   │            │
+└────────────────────────────────────────────┼───┼────────────┘
+                                             │   │
+                        ┌────────────────────┘   │
+                        │                        │ HTTP
+                        ▼                        ▼
+              ┌──────────────────┐    ┌──────────────────────┐
+              │ backends/        │    │ Standalone Provider  │
+              │ (bundled on Mac) │    │ (subprocess)         │
+              │                  │    │                      │
+              │ - mlx_backend    │    │ - FastAPI server     │
+              │ - pytorch_backend│    │ - PyTorch + Qwen-TTS │
+              └──────────────────┘    │ - Runs on localhost  │
+                                      └──────────────────────┘
+```
+
+## Platform Behavior
+
+| Platform              | App Size | TTS Backend     | Provider Download |
+| --------------------- | -------- | --------------- | ----------------- |
+| macOS (Apple Silicon) | ~300MB   | MLX bundled     | Not needed        |
+| macOS (Intel)         | ~300MB   | PyTorch bundled | Not needed        |
+| Windows               | ~150MB   | None bundled    | Required          |
+| Linux                 | ~150MB   | None bundled    | Required          |
+
+### macOS (Apple Silicon)
+
+- MLX backend is **bundled** in the app
+- Works immediately after install
+- Uses Metal for GPU acceleration
+
+### macOS (Intel)
+
+- PyTorch backend is **bundled** in the app
+- Works immediately after install
+- Uses CPU inference
+
+### Windows / Linux
+
+- **No TTS bundled** - keeps app small (~150MB)
+- On first use, prompts to download a provider
+- Provider options:
+  - **PyTorch CPU** (~300MB) - Works on any system
+  - **PyTorch CUDA** (~2.4GB) - Fast inference on NVIDIA GPUs
+
+## Directory Structure
+
+```
+voicebox/
+├── backend/
+│   ├── backends/                 # Actual TTS implementations
+│   │   ├── __init__.py          # TTSBackend Protocol
+│   │   ├── mlx_backend.py       # MLX implementation (macOS)
+│   │   └── pytorch_backend.py   # PyTorch implementation
+│   │
+│   └── providers/               # Provider abstraction layer
+│       ├── __init__.py          # ProviderManager
+│       ├── base.py              # TTSProvider Protocol
+│       ├── bundled.py           # Wraps backends/ for bundled use
+│       ├── local.py             # HTTP client for subprocess providers
+│       ├── installer.py         # Downloads providers from R2
+│       └── types.py             # Shared types
+│
+└── providers/                   # Standalone provider builds
+    ├── pytorch-cpu/
+    │   ├── main.py              # FastAPI server
+    │   ├── build.py             # PyInstaller build script
+    │   └── requirements.txt
+    │
+    └── pytorch-cuda/
+        ├── main.py              # FastAPI server
+        ├── build.py             # PyInstaller build script
+        └── requirements.txt
+```
+
+## How Providers Work
+
+### 1. BundledProvider (macOS)
+
+On macOS, the `BundledProvider` directly calls the bundled `backends/` code:
+
+```python
+# backend/providers/bundled.py
+class BundledProvider:
+    def __init__(self):
+        self._backend = get_tts_backend()  # MLX or PyTorch
+
+    async def generate(self, text, voice_prompt, ...):
+        return await self._backend.generate(text, voice_prompt, ...)
+```
+
+### 2. LocalProvider (Windows/Linux)
+
+On Windows/Linux, the `LocalProvider` communicates with a standalone provider via HTTP:
+
+```python
+# backend/providers/local.py
+class LocalProvider:
+    def __init__(self, base_url: str):
+        self.base_url = base_url  # e.g., "http://127.0.0.1:8765"
+
+    async def generate(self, text, voice_prompt, ...):
+        response = await self.client.post(
+            f"{self.base_url}/tts/generate",
+            json={"text": text, "voice_prompt": voice_prompt, ...}
+        )
+        # Decode audio from response
+        return audio, sample_rate
+```
+
+### 3. Standalone Provider Server
+
+The standalone providers are self-contained FastAPI servers:
+
+```python
+# providers/pytorch-cpu/main.py
+@app.post("/tts/generate")
+async def generate(text: str, voice_prompt: dict, ...):
+    audio, sr = await backend.generate(text, voice_prompt, ...)
+    return {"audio": base64_encode(audio), "sample_rate": sr}
+```
+
+## Provider API Specification
+
+All providers (local or remote) must implement these HTTP endpoints:
+
+### POST /tts/generate
+
+Generate speech from text.
+
+**Request:**
+
+```jsonc
+{
+	"text": "Hello world!",
+	"voice_prompt": {
+		/* voice embedding */
+	},
+	"language": "en",
+	"seed": 12345,
+	"model_size": "1.7B"
+}
+```
+
+**Response:**
+
+```json
+{
+	"audio": "base64-encoded-wav",
+	"sample_rate": 24000,
+	"duration": 2.5
+}
+```
+
+### POST /tts/create_voice_prompt
+
+Create voice embedding from reference audio.
+
+**Request:** `multipart/form-data`
+
+- `audio`: Audio file
+- `reference_text`: Transcript
+
+**Response:**
+
+```jsonc
+{
+	"voice_prompt": {
+		/* voice embedding */
+	},
+	"was_cached": false
+}
+```
+
+### GET /tts/health
+
+Health check.
+
+**Response:**
+
+```json
+{
+	"status": "healthy",
+	"provider": "pytorch-cuda",
+	"version": "1.0.0",
+	"model": "1.7B",
+	"device": "cuda:0"
+}
+```
+
+### GET /tts/status
+
+Model status.
+
+**Response:**
+
+```json
+{
+	"model_loaded": true,
+	"model_size": "1.7B",
+	"available_sizes": ["0.6B", "1.7B"],
+	"gpu_available": true,
+	"vram_used_mb": 1234
+}
+```
+
+## Provider Lifecycle
+
+### Startup Flow (Windows/Linux)
+
+```
+1. App launches
+2. ProviderManager checks for installed providers
+3. If none installed:
+   └─ Show setup wizard, prompt download
+4. If installed:
+   ├─ Start provider subprocess on random port
+   ├─ Wait for /tts/health to return 200
+   └─ Create LocalProvider with that URL
+5. Generation requests go through LocalProvider → subprocess
+```
+
+### Download Flow
+
+```
+1. User clicks "Download PyTorch CUDA"
+2. Installer downloads from Cloudflare R2:
+   https://downloads.voicebox.sh/providers/v1.0.0/tts-provider-pytorch-cuda-windows.exe
+3. Saved to:
+   - Windows: %APPDATA%/voicebox/providers/
+   - Linux: ~/.local/share/voicebox/providers/
+4. Provider is now available to start
+```
+
+## Building Providers
+
+### Prerequisites
+
+- Python 3.12
+- PyInstaller
+
+### Build PyTorch CPU Provider
+
+```bash
+cd providers/pytorch-cpu
+pip install -r requirements.txt
+python build.py
+# Output: dist/tts-provider-pytorch-cpu/ (one-folder bundle; contains tts-provider-pytorch-cpu.exe on Windows)
+```
+
+### Build PyTorch CUDA Provider
+
+```bash
+cd providers/pytorch-cuda
+pip install torch --index-url https://download.pytorch.org/whl/cu121
+pip install -r requirements.txt
+python build.py
+# Output: dist/tts-provider-pytorch-cuda.exe (~2.4GB)
+```
+
+## Provider Versioning
+
+Providers have **independent versions** from the app:
+
+- **App version:** `v0.2.0` (frequent updates)
+- **Provider version:** `v1.0.0` (rare updates)
+
+Providers only need updates when:
+
+- TTS model changes (new Qwen3-TTS version)
+- API spec changes
+- Bug fixes in inference code
+
+The app checks provider compatibility on startup.
+
+## Future Providers
+
+The architecture supports additional providers:
+
+- **Remote Server** - Connect to your own TTS server
+- **OpenAI API** - Use OpenAI's TTS (requires API key)
+- **ElevenLabs** - Cloud TTS service
+- **Docker** - Run providers in containers
+
+These would implement the same HTTP API spec.
diff --git a/providers/pytorch-cpu/build.py b/providers/pytorch-cpu/build.py
new file mode 100644
index 00000000..a443f343
--- /dev/null
+++ b/providers/pytorch-cpu/build.py
@@ -0,0 +1,90 @@
+"""
+PyInstaller build script for PyTorch CPU provider.
+"""
+
+import PyInstaller.__main__
+import os
+import platform
+from pathlib import Path
+
+
+def build_provider():
+    """Build PyTorch CPU provider as standalone binary."""
+    provider_dir = Path(__file__).parent
+    backend_dir = provider_dir.parent.parent / "backend"
+    
+    # PyInstaller arguments
+    args = [
+        'main.py',
+        '--onedir',  # Changed from --onefile to work around Windows extraction issues
+        '--name', 'tts-provider-pytorch-cpu',
+    ]
+    
+    # Add backend to path
+    args.extend([
+        '--paths', str(backend_dir.parent),
+    ])
+    
+    # Add hidden imports
+    args.extend([
+        '--hidden-import', 'backend',
+        '--hidden-import', 'backend.backends',
+        '--hidden-import', 'backend.backends.pytorch_backend',
+        '--hidden-import', 'backend.config',
+        '--hidden-import', 'backend.utils.audio',
+        '--hidden-import', 'backend.utils.cache',
+        '--hidden-import', 'backend.utils.progress',
+        '--hidden-import', 'backend.utils.hf_progress',
+        '--hidden-import', 'backend.utils.tasks',
+        '--hidden-import', 'torch',
+        '--hidden-import', 'transformers',
+        '--hidden-import', 'qwen_tts',
+        '--hidden-import', 'qwen_tts.inference',
+        '--hidden-import', 'qwen_tts.inference.qwen3_tts_model',
+        '--hidden-import', 'qwen_tts.inference.qwen3_tts_tokenizer',
+        '--hidden-import', 'qwen_tts.core',
+        '--hidden-import', 'qwen_tts.cli',
+        '--copy-metadata', 'qwen-tts',
+        '--collect-submodules', 'qwen_tts',
+        '--collect-data', 'qwen_tts',
+        '--hidden-import', 'pkg_resources.extern',
+        '--collect-submodules', 'jaraco',
+        '--hidden-import', 'fastapi',
+        '--hidden-import', 'uvicorn',
+        # Critical uvicorn imports for PyInstaller
+        '--hidden-import', 'uvicorn.logging',
+        '--hidden-import', 'uvicorn.loops',
+        '--hidden-import', 'uvicorn.loops.auto',
+        '--hidden-import', 'uvicorn.protocols',
+        '--hidden-import', 'uvicorn.protocols.http',
+        '--hidden-import', 'uvicorn.protocols.http.auto',
+        '--hidden-import', 'uvicorn.protocols.websockets',
+        '--hidden-import', 'uvicorn.protocols.websockets.auto',
+        '--hidden-import', 'uvicorn.lifespan',
+        '--hidden-import', 'uvicorn.lifespan.on',
+        '--collect-submodules', 'uvicorn',
+        '--hidden-import', 'soundfile',
+        '--hidden-import', 'numpy',
+        '--hidden-import', 'librosa',
+    ])
+
+    args.extend([
+        '--noconfirm',
+        '--clean',
+    ])
+    
+    # Change to provider directory
+    os.chdir(provider_dir)
+    
+    # Run PyInstaller
+    PyInstaller.__main__.run(args)
+    
+    binary_name = 'tts-provider-pytorch-cpu'
+    if platform.system() == "Windows":
+        binary_name += '.exe'
+    
+    print(f"Binary built in {provider_dir / 'dist' / binary_name}")
+
+
+if __name__ == '__main__':
+    build_provider()
diff --git a/providers/pytorch-cpu/build_and_install.py b/providers/pytorch-cpu/build_and_install.py
new file mode 100644
index 00000000..7a63e091
--- /dev/null
+++ b/providers/pytorch-cpu/build_and_install.py
@@ -0,0 +1,57 @@
+"""
+Build PyTorch CPU provider and install to local provider directory.
+"""
+
+import platform
+import shutil
+from pathlib import Path
+
+from build import build_provider
+
+
+def get_providers_dir() -> Path:
+    """Get the directory where providers are stored."""
+    system = platform.system()
+
+    if system == "Windows":
+        appdata = Path.home() / "AppData" / "Roaming"
+    elif system == "Darwin":
+        appdata = Path.home() / "Library" / "Application Support"
+    else:  # Linux
+        appdata = Path.home() / ".local" / "share"
+
+    providers_dir = appdata / "voicebox" / "providers"
+    providers_dir.mkdir(parents=True, exist_ok=True)
+    return providers_dir
+
+
+def main():
+    """Build and install provider."""
+    provider_dir = Path(__file__).parent
+
+    # Build the provider
+    print("Building PyTorch CPU provider...")
+    build_provider()
+
+    # Determine binary name
+    binary_name = "tts-provider-pytorch-cpu"
+    if platform.system() == "Windows":
+        binary_name += ".exe"
+
+    # Source and destination paths
+    source = provider_dir / "dist" / binary_name
+    destination = get_providers_dir() / binary_name
+
+    # Copy to provider directory
+    print(f"Installing to {destination}...")
+    shutil.copy2(source, destination)
+
+    # Make executable on Unix systems
+    if platform.system() != "Windows":
+        destination.chmod(0o755)
+
+    print(f"✓ Provider installed successfully to {destination}")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/providers/pytorch-cpu/main.py b/providers/pytorch-cpu/main.py
new file mode 100644
index 00000000..e295e08b
--- /dev/null
+++ b/providers/pytorch-cpu/main.py
@@ -0,0 +1,238 @@
+"""
+Standalone TTS provider server for PyTorch CPU.
+"""
+
+import argparse
+import asyncio
+import base64
+import io
+import sys
+from pathlib import Path
+from typing import Optional
+
+import numpy as np
+import soundfile as sf
+from fastapi import FastAPI, File, Form, HTTPException, UploadFile
+from fastapi.middleware.cors import CORSMiddleware
+import uvicorn
+
+# Add parent directory to path to import backend modules
+sys.path.insert(0, str(Path(__file__).parent.parent.parent / "backend"))
+
+from backend.backends.pytorch_backend import PyTorchTTSBackend
+
+
+app = FastAPI(title="Voicebox TTS Provider - PyTorch CPU")
+
+# CORS middleware
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+
+# Global backend instance
+_backend: Optional[PyTorchTTSBackend] = None
+
+
+def get_backend() -> PyTorchTTSBackend:
+    """Get or create backend instance."""
+    global _backend
+    if _backend is None:
+        _backend = PyTorchTTSBackend()
+    return _backend
+
+
+@app.get("/tts/health")
+async def health():
+    """Health check endpoint."""
+    backend = get_backend()
+    backend_type = "pytorch-cpu"
+    
+    model_size = None
+    if backend.is_loaded():
+        if hasattr(backend, '_current_model_size') and backend._current_model_size:
+            model_size = backend._current_model_size
+    
+    device = backend.device if hasattr(backend, 'device') else "cpu"
+    
+    return {
+        "status": "healthy",
+        "provider": backend_type,
+        "version": "1.0.0",  # TODO: Get from version file
+        "model": model_size,
+        "device": device,
+    }
+
+
+@app.get("/tts/status")
+async def status():
+    """Model status endpoint."""
+    backend = get_backend()
+    
+    model_size = None
+    if backend.is_loaded():
+        if hasattr(backend, '_current_model_size') and backend._current_model_size:
+            model_size = backend._current_model_size
+    
+    available_sizes = ["1.7B", "0.6B"]
+    
+    gpu_available = False
+    vram_used_mb = None
+    
+    try:
+        import torch
+        gpu_available = torch.cuda.is_available()
+        if gpu_available:
+            vram_used_mb = int(torch.cuda.memory_allocated() / 1024 / 1024)
+    except ImportError:
+        pass
+    
+    return {
+        "model_loaded": backend.is_loaded(),
+        "model_size": model_size,
+        "available_sizes": available_sizes,
+        "gpu_available": gpu_available,
+        "vram_used_mb": vram_used_mb,
+    }
+
+
+@app.post("/tts/generate")
+async def generate(
+    text: str,
+    voice_prompt: dict,
+    language: str = "en",
+    seed: Optional[int] = None,
+    model_size: str = "1.7B",
+):
+    """
+    Generate speech from text.
+    
+    Request body (JSON):
+    {
+        "text": "Hello world!",
+        "voice_prompt": {...},
+        "language": "en",
+        "seed": 12345,
+        "model_size": "1.7B"
+    }
+    """
+    backend = get_backend()
+    
+    # Load model if not loaded or different size
+    if not backend.is_loaded() or (
+        hasattr(backend, '_current_model_size') and 
+        backend._current_model_size != model_size
+    ):
+        await backend.load_model_async(model_size)
+    
+    # Generate audio
+    audio, sample_rate = await backend.generate(
+        text=text,
+        voice_prompt=voice_prompt,
+        language=language,
+        seed=seed,
+        instruct=None,  # TODO: Add instruct support
+    )
+    
+    # Convert to base64
+    buffer = io.BytesIO()
+    sf.write(buffer, audio, sample_rate, format="WAV")
+    buffer.seek(0)
+    audio_bytes = buffer.read()
+    audio_b64 = base64.b64encode(audio_bytes).decode('utf-8')
+    
+    # Calculate duration
+    duration = len(audio) / sample_rate
+    
+    return {
+        "audio": audio_b64,
+        "sample_rate": sample_rate,
+        "duration": duration,
+    }
+
+
+@app.post("/tts/create_voice_prompt")
+async def create_voice_prompt(
+    audio: UploadFile = File(...),
+    reference_text: str = Form(...),
+    use_cache: bool = Form(True),
+):
+    """
+    Create voice prompt from reference audio.
+    
+    Request (multipart/form-data):
+    - audio: Audio file
+    - reference_text: Transcript
+    - use_cache: Whether to use cached prompts (default: true)
+    """
+    backend = get_backend()
+    
+    # Save uploaded file temporarily
+    import tempfile
+    with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
+        tmp_path = tmp_file.name
+        content = await audio.read()
+        tmp_file.write(content)
+    
+    try:
+        # Create voice prompt
+        voice_prompt, was_cached = await backend.create_voice_prompt(
+            audio_path=tmp_path,
+            reference_text=reference_text,
+            use_cache=use_cache,
+        )
+        
+        return {
+            "voice_prompt": voice_prompt,
+            "was_cached": was_cached,
+        }
+    finally:
+        # Clean up temp file
+        Path(tmp_path).unlink(missing_ok=True)
+
+
+def main():
+    """Main entry point."""
+    parser = argparse.ArgumentParser(description="Voicebox TTS Provider - PyTorch CPU")
+    parser.add_argument(
+        "--port",
+        type=int,
+        default=0,  # 0 means random port
+        help="Port to bind to",
+    )
+    parser.add_argument(
+        "--data-dir",
+        type=str,
+        default=None,
+        help="Data directory for models and cache",
+    )
+    args = parser.parse_args()
+    
+    # Set data directory if provided
+    if args.data_dir:
+        from backend import config
+        config.set_data_dir(args.data_dir)
+    
+    # Determine port
+    port = args.port
+    if port == 0:
+        import socket
+        with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as s:
+            s.bind(('', 0))
+            port = s.getsockname()[1]
+    
+    print(f"Starting TTS Provider (PyTorch CPU) on port {port}")
+    
+    uvicorn.run(
+        app,
+        host="127.0.0.1",
+        port=port,
+        log_level="info",
+    )
+
+
+if __name__ == "__main__":
+    main()
diff --git a/providers/pytorch-cpu/requirements.txt b/providers/pytorch-cpu/requirements.txt
new file mode 100644
index 00000000..3f4144e3
--- /dev/null
+++ b/providers/pytorch-cpu/requirements.txt
@@ -0,0 +1,8 @@
+torch>=2.0.0
+transformers>=4.30.0
+qwen-tts>=0.0.5
+fastapi>=0.100.0
+uvicorn>=0.23.0
+soundfile>=0.12.0
+numpy>=1.24.0
+librosa>=0.10.0
diff --git a/providers/pytorch-cpu/tts-provider-pytorch-cpu.spec b/providers/pytorch-cpu/tts-provider-pytorch-cpu.spec
new file mode 100644
index 00000000..8ab78036
--- /dev/null
+++ b/providers/pytorch-cpu/tts-provider-pytorch-cpu.spec
@@ -0,0 +1,48 @@
+# -*- mode: python ; coding: utf-8 -*-
+from PyInstaller.utils.hooks import collect_data_files
+from PyInstaller.utils.hooks import collect_submodules
+from PyInstaller.utils.hooks import copy_metadata
+
+datas = []
+hiddenimports = ['backend', 'backend.backends', 'backend.backends.pytorch_backend', 'backend.config', 'backend.utils.audio', 'backend.utils.cache', 'backend.utils.progress', 'backend.utils.hf_progress', 'backend.utils.tasks', 'torch', 'transformers', 'qwen_tts', 'qwen_tts.inference', 'qwen_tts.inference.qwen3_tts_model', 'qwen_tts.inference.qwen3_tts_tokenizer', 'qwen_tts.core', 'qwen_tts.cli', 'pkg_resources.extern', 'fastapi', 'uvicorn', 'soundfile', 'numpy', 'librosa']
+datas += collect_data_files('qwen_tts')
+datas += copy_metadata('qwen-tts')
+hiddenimports += collect_submodules('qwen_tts')
+hiddenimports += collect_submodules('jaraco')
+
+
+a = Analysis(
+    ['main.py'],
+    pathex=['/Users/jamespine/Projects/voicebox'],
+    binaries=[],
+    datas=datas,
+    hiddenimports=hiddenimports,
+    hookspath=[],
+    hooksconfig={},
+    runtime_hooks=[],
+    excludes=['torch.utils.tensorboard', 'tensorboard', 'triton', 'torch._dynamo', 'torch._inductor', 'torch.utils.benchmark', 'IPython', 'matplotlib', 'PIL', 'cv2', 'torchvision', 'torchaudio'],
+    noarchive=False,
+    optimize=0,
+)
+pyz = PYZ(a.pure)
+
+exe = EXE(
+    pyz,
+    a.scripts,
+    a.binaries,
+    a.datas,
+    [],
+    name='tts-provider-pytorch-cpu',
+    debug=False,
+    bootloader_ignore_signals=False,
+    strip=False,
+    upx=True,
+    upx_exclude=[],
+    runtime_tmpdir=None,
+    console=True,
+    disable_windowed_traceback=False,
+    argv_emulation=False,
+    target_arch=None,
+    codesign_identity=None,
+    entitlements_file=None,
+)
diff --git a/providers/pytorch-cuda/build.py b/providers/pytorch-cuda/build.py
new file mode 100644
index 00000000..c45f1196
--- /dev/null
+++ b/providers/pytorch-cuda/build.py
@@ -0,0 +1,92 @@
+"""
+PyInstaller build script for PyTorch CUDA provider.
+"""
+
+import PyInstaller.__main__
+import os
+import platform
+from pathlib import Path
+
+
+def build_provider():
+    """Build PyTorch CUDA provider as standalone binary."""
+    provider_dir = Path(__file__).parent
+    backend_dir = provider_dir.parent.parent / "backend"
+    
+    # PyInstaller arguments
+    args = [
+        'main.py',
+        '--onedir',  # Changed from --onefile to work around Windows extraction issues
+        '--name', 'tts-provider-pytorch-cuda',
+    ]
+    
+    # Add backend to path
+    args.extend([
+        '--paths', str(backend_dir.parent),
+    ])
+    
+    # Add hidden imports
+    args.extend([
+        '--hidden-import', 'backend',
+        '--hidden-import', 'backend.backends',
+        '--hidden-import', 'backend.backends.pytorch_backend',
+        '--hidden-import', 'backend.config',
+        '--hidden-import', 'backend.utils.audio',
+        '--hidden-import', 'backend.utils.cache',
+        '--hidden-import', 'backend.utils.progress',
+        '--hidden-import', 'backend.utils.hf_progress',
+        '--hidden-import', 'backend.utils.tasks',
+        '--hidden-import', 'torch',
+        '--hidden-import', 'torch.cuda',
+        '--hidden-import', 'torch.backends.cudnn',
+        '--hidden-import', 'transformers',
+        '--hidden-import', 'qwen_tts',
+        '--hidden-import', 'qwen_tts.inference',
+        '--hidden-import', 'qwen_tts.inference.qwen3_tts_model',
+        '--hidden-import', 'qwen_tts.inference.qwen3_tts_tokenizer',
+        '--hidden-import', 'qwen_tts.core',
+        '--hidden-import', 'qwen_tts.cli',
+        '--copy-metadata', 'qwen-tts',
+        '--collect-submodules', 'qwen_tts',
+        '--collect-data', 'qwen_tts',
+        '--hidden-import', 'pkg_resources.extern',
+        '--collect-submodules', 'jaraco',
+        '--hidden-import', 'fastapi',
+        '--hidden-import', 'uvicorn',
+        # Critical uvicorn imports for PyInstaller
+        '--hidden-import', 'uvicorn.logging',
+        '--hidden-import', 'uvicorn.loops',
+        '--hidden-import', 'uvicorn.loops.auto',
+        '--hidden-import', 'uvicorn.protocols',
+        '--hidden-import', 'uvicorn.protocols.http',
+        '--hidden-import', 'uvicorn.protocols.http.auto',
+        '--hidden-import', 'uvicorn.protocols.websockets',
+        '--hidden-import', 'uvicorn.protocols.websockets.auto',
+        '--hidden-import', 'uvicorn.lifespan',
+        '--hidden-import', 'uvicorn.lifespan.on',
+        '--collect-submodules', 'uvicorn',
+        '--hidden-import', 'soundfile',
+        '--hidden-import', 'numpy',
+        '--hidden-import', 'librosa',
+    ])
+
+    args.extend([
+        '--noconfirm',
+        '--clean',
+    ])
+    
+    # Change to provider directory
+    os.chdir(provider_dir)
+    
+    # Run PyInstaller
+    PyInstaller.__main__.run(args)
+    
+    binary_name = 'tts-provider-pytorch-cuda'
+    if platform.system() == "Windows":
+        binary_name += '.exe'
+    
+    print(f"Binary built in {provider_dir / 'dist' / binary_name}")
+
+
+if __name__ == '__main__':
+    build_provider()
diff --git a/providers/pytorch-cuda/build_and_install.py b/providers/pytorch-cuda/build_and_install.py
new file mode 100644
index 00000000..227dca0e
--- /dev/null
+++ b/providers/pytorch-cuda/build_and_install.py
@@ -0,0 +1,57 @@
+"""
+Build PyTorch CUDA provider and install to local provider directory.
+"""
+
+import platform
+import shutil
+from pathlib import Path
+
+from build import build_provider
+
+
+def get_providers_dir() -> Path:
+    """Get the directory where providers are stored."""
+    system = platform.system()
+
+    if system == "Windows":
+        appdata = Path.home() / "AppData" / "Roaming"
+    elif system == "Darwin":
+        appdata = Path.home() / "Library" / "Application Support"
+    else:  # Linux
+        appdata = Path.home() / ".local" / "share"
+
+    providers_dir = appdata / "voicebox" / "providers"
+    providers_dir.mkdir(parents=True, exist_ok=True)
+    return providers_dir
+
+
+def main():
+    """Build and install provider."""
+    provider_dir = Path(__file__).parent
+
+    # Build the provider
+    print("Building PyTorch CUDA provider...")
+    build_provider()
+
+    # Determine binary name
+    binary_name = "tts-provider-pytorch-cuda"
+    if platform.system() == "Windows":
+        binary_name += ".exe"
+
+    # Source and destination paths
+    source = provider_dir / "dist" / binary_name
+    destination = get_providers_dir() / binary_name
+
+    # Copy to provider directory
+    print(f"Installing to {destination}...")
+    shutil.copy2(source, destination)
+
+    # Make executable on Unix systems
+    if platform.system() != "Windows":
+        destination.chmod(0o755)
+
+    print(f"✓ Provider installed successfully to {destination}")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/providers/pytorch-cuda/main.py b/providers/pytorch-cuda/main.py
new file mode 100644
index 00000000..a89782ff
--- /dev/null
+++ b/providers/pytorch-cuda/main.py
@@ -0,0 +1,238 @@
+"""
+Standalone TTS provider server for PyTorch CUDA.
+"""
+
+import argparse
+import asyncio
+import base64
+import io
+import sys
+from pathlib import Path
+from typing import Optional
+
+import numpy as np
+import soundfile as sf
+from fastapi import FastAPI, File, Form, HTTPException, UploadFile
+from fastapi.middleware.cors import CORSMiddleware
+import uvicorn
+
+# Add parent directory to path to import backend modules
+sys.path.insert(0, str(Path(__file__).parent.parent.parent / "backend"))
+
+from backend.backends.pytorch_backend import PyTorchTTSBackend
+
+
+app = FastAPI(title="Voicebox TTS Provider - PyTorch CUDA")
+
+# CORS middleware
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+
+# Global backend instance
+_backend: Optional[PyTorchTTSBackend] = None
+
+
+def get_backend() -> PyTorchTTSBackend:
+    """Get or create backend instance."""
+    global _backend
+    if _backend is None:
+        _backend = PyTorchTTSBackend()
+    return _backend
+
+
+@app.get("/tts/health")
+async def health():
+    """Health check endpoint."""
+    backend = get_backend()
+    backend_type = "pytorch-cuda"
+    
+    model_size = None
+    if backend.is_loaded():
+        if hasattr(backend, '_current_model_size') and backend._current_model_size:
+            model_size = backend._current_model_size
+    
+    device = backend.device if hasattr(backend, 'device') else "cpu"
+    
+    return {
+        "status": "healthy",
+        "provider": backend_type,
+        "version": "1.0.0",  # TODO: Get from version file
+        "model": model_size,
+        "device": device,
+    }
+
+
+@app.get("/tts/status")
+async def status():
+    """Model status endpoint."""
+    backend = get_backend()
+    
+    model_size = None
+    if backend.is_loaded():
+        if hasattr(backend, '_current_model_size') and backend._current_model_size:
+            model_size = backend._current_model_size
+    
+    available_sizes = ["1.7B", "0.6B"]
+    
+    gpu_available = False
+    vram_used_mb = None
+    
+    try:
+        import torch
+        gpu_available = torch.cuda.is_available()
+        if gpu_available:
+            vram_used_mb = int(torch.cuda.memory_allocated() / 1024 / 1024)
+    except ImportError:
+        pass
+    
+    return {
+        "model_loaded": backend.is_loaded(),
+        "model_size": model_size,
+        "available_sizes": available_sizes,
+        "gpu_available": gpu_available,
+        "vram_used_mb": vram_used_mb,
+    }
+
+
+@app.post("/tts/generate")
+async def generate(
+    text: str,
+    voice_prompt: dict,
+    language: str = "en",
+    seed: Optional[int] = None,
+    model_size: str = "1.7B",
+):
+    """
+    Generate speech from text.
+    
+    Request body (JSON):
+    {
+        "text": "Hello world!",
+        "voice_prompt": {...},
+        "language": "en",
+        "seed": 12345,
+        "model_size": "1.7B"
+    }
+    """
+    backend = get_backend()
+    
+    # Load model if not loaded or different size
+    if not backend.is_loaded() or (
+        hasattr(backend, '_current_model_size') and 
+        backend._current_model_size != model_size
+    ):
+        await backend.load_model_async(model_size)
+    
+    # Generate audio
+    audio, sample_rate = await backend.generate(
+        text=text,
+        voice_prompt=voice_prompt,
+        language=language,
+        seed=seed,
+        instruct=None,  # TODO: Add instruct support
+    )
+    
+    # Convert to base64
+    buffer = io.BytesIO()
+    sf.write(buffer, audio, sample_rate, format="WAV")
+    buffer.seek(0)
+    audio_bytes = buffer.read()
+    audio_b64 = base64.b64encode(audio_bytes).decode('utf-8')
+    
+    # Calculate duration
+    duration = len(audio) / sample_rate
+    
+    return {
+        "audio": audio_b64,
+        "sample_rate": sample_rate,
+        "duration": duration,
+    }
+
+
+@app.post("/tts/create_voice_prompt")
+async def create_voice_prompt(
+    audio: UploadFile = File(...),
+    reference_text: str = Form(...),
+    use_cache: bool = Form(True),
+):
+    """
+    Create voice prompt from reference audio.
+    
+    Request (multipart/form-data):
+    - audio: Audio file
+    - reference_text: Transcript
+    - use_cache: Whether to use cached prompts (default: true)
+    """
+    backend = get_backend()
+    
+    # Save uploaded file temporarily
+    import tempfile
+    with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file:
+        tmp_path = tmp_file.name
+        content = await audio.read()
+        tmp_file.write(content)
+    
+    try:
+        # Create voice prompt
+        voice_prompt, was_cached = await backend.create_voice_prompt(
+            audio_path=tmp_path,
+            reference_text=reference_text,
+            use_cache=use_cache,
+        )
+        
+        return {
+            "voice_prompt": voice_prompt,
+            "was_cached": was_cached,
+        }
+    finally:
+        # Clean up temp file
+        Path(tmp_path).unlink(missing_ok=True)
+
+
+def main():
+    """Main entry point."""
+    parser = argparse.ArgumentParser(description="Voicebox TTS Provider - PyTorch CUDA")
+    parser.add_argument(
+        "--port",
+        type=int,
+        default=0,  # 0 means random port
+        help="Port to bind to",
+    )
+    parser.add_argument(
+        "--data-dir",
+        type=str,
+        default=None,
+        help="Data directory for models and cache",
+    )
+    args = parser.parse_args()
+    
+    # Set data directory if provided
+    if args.data_dir:
+        from backend import config
+        config.set_data_dir(args.data_dir)
+    
+    # Determine port
+    port = args.port
+    if port == 0:
+        import socket
+        with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as s:
+            s.bind(('', 0))
+            port = s.getsockname()[1]
+    
+    print(f"Starting TTS Provider (PyTorch CUDA) on port {port}")
+    
+    uvicorn.run(
+        app,
+        host="127.0.0.1",
+        port=port,
+        log_level="info",
+    )
+
+
+if __name__ == "__main__":
+    main()
diff --git a/providers/pytorch-cuda/requirements.txt b/providers/pytorch-cuda/requirements.txt
new file mode 100644
index 00000000..5a106503
--- /dev/null
+++ b/providers/pytorch-cuda/requirements.txt
@@ -0,0 +1,10 @@
+torch>=2.0.0 --index-url https://download.pytorch.org/whl/cu121
+torchvision>=0.15.0 --index-url https://download.pytorch.org/whl/cu121
+torchaudio>=2.0.0 --index-url https://download.pytorch.org/whl/cu121
+transformers>=4.30.0
+qwen-tts>=0.0.5
+fastapi>=0.100.0
+uvicorn>=0.23.0
+soundfile>=0.12.0
+numpy>=1.24.0
+librosa>=0.10.0
diff --git a/providers/pytorch-cuda/tts-provider-pytorch-cuda.spec b/providers/pytorch-cuda/tts-provider-pytorch-cuda.spec
new file mode 100644
index 00000000..01230506
--- /dev/null
+++ b/providers/pytorch-cuda/tts-provider-pytorch-cuda.spec
@@ -0,0 +1,48 @@
+# -*- mode: python ; coding: utf-8 -*-
+from PyInstaller.utils.hooks import collect_data_files
+from PyInstaller.utils.hooks import collect_submodules
+from PyInstaller.utils.hooks import copy_metadata
+
+datas = []
+hiddenimports = ['backend', 'backend.backends', 'backend.backends.pytorch_backend', 'backend.config', 'backend.utils.audio', 'backend.utils.cache', 'backend.utils.progress', 'backend.utils.hf_progress', 'backend.utils.tasks', 'torch', 'torch.cuda', 'torch.backends.cudnn', 'transformers', 'qwen_tts', 'qwen_tts.inference', 'qwen_tts.inference.qwen3_tts_model', 'qwen_tts.inference.qwen3_tts_tokenizer', 'qwen_tts.core', 'qwen_tts.cli', 'pkg_resources.extern', 'fastapi', 'uvicorn', 'soundfile', 'numpy', 'librosa']
+datas += collect_data_files('qwen_tts')
+datas += copy_metadata('qwen-tts')
+hiddenimports += collect_submodules('qwen_tts')
+hiddenimports += collect_submodules('jaraco')
+
+
+a = Analysis(
+    ['main.py'],
+    pathex=['/Users/jamespine/Projects/voicebox'],
+    binaries=[],
+    datas=datas,
+    hiddenimports=hiddenimports,
+    hookspath=[],
+    hooksconfig={},
+    runtime_hooks=[],
+    excludes=['torch.utils.tensorboard', 'tensorboard', 'triton', 'torch._dynamo', 'torch._inductor', 'torch.utils.benchmark', 'IPython', 'matplotlib', 'PIL', 'cv2', 'torchvision', 'torchaudio'],
+    noarchive=False,
+    optimize=0,
+)
+pyz = PYZ(a.pure)
+
+exe = EXE(
+    pyz,
+    a.scripts,
+    a.binaries,
+    a.datas,
+    [],
+    name='tts-provider-pytorch-cuda',
+    debug=False,
+    bootloader_ignore_signals=False,
+    strip=False,
+    upx=True,
+    upx_exclude=[],
+    runtime_tmpdir=None,
+    console=True,
+    disable_windowed_traceback=False,
+    argv_emulation=False,
+    target_arch=None,
+    codesign_identity=None,
+    entitlements_file=None,
+)
diff --git a/scripts/build-providers-local.py b/scripts/build-providers-local.py
new file mode 100755
index 00000000..05edde2c
--- /dev/null
+++ b/scripts/build-providers-local.py
@@ -0,0 +1,46 @@
+#!/usr/bin/env python3
+"""
+Build and install all TTS providers locally for development.
+"""
+
+import subprocess
+import sys
+from pathlib import Path
+
+
+def main():
+    """Build and install all providers."""
+    project_root = Path(__file__).parent.parent
+    providers_dir = project_root / "providers"
+
+    providers = ["pytorch-cpu", "pytorch-cuda"]
+
+    for provider in providers:
+        provider_path = providers_dir / provider
+        script_path = provider_path / "build_and_install.py"
+
+        if not script_path.exists():
+            print(f"⚠ Skipping {provider}: build_and_install.py not found")
+            continue
+
+        print(f"\n{'=' * 60}")
+        print(f"Building and installing {provider}...")
+        print(f"{'=' * 60}\n")
+
+        try:
+            subprocess.run(
+                [sys.executable, str(script_path)],
+                cwd=provider_path,
+                check=True,
+            )
+        except subprocess.CalledProcessError as e:
+            print(f"✗ Failed to build {provider}: {e}")
+            sys.exit(1)
+
+    print(f"\n{'=' * 60}")
+    print("✓ All providers built and installed successfully!")
+    print(f"{'=' * 60}\n")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/tauri/package.json b/tauri/package.json
index 163f56c8..f7ec77ec 100644
--- a/tauri/package.json
+++ b/tauri/package.json
@@ -1,7 +1,7 @@
 {
   "name": "@voicebox/tauri",
   "private": true,
-  "version": "0.1.12",
+  "version": "0.1.13",
   "type": "module",
   "scripts": {
     "dev": "vite",
diff --git a/tauri/src-tauri/Cargo.lock b/tauri/src-tauri/Cargo.lock
index 4528097c..450b9a35 100644
--- a/tauri/src-tauri/Cargo.lock
+++ b/tauri/src-tauri/Cargo.lock
@@ -5041,7 +5041,7 @@ checksum = "0b928f33d975fc6ad9f86c8f283853ad26bdd5b10b7f1542aa2fa15e2289105a"
 
 [[package]]
 name = "voicebox"
-version = "0.1.11"
+version = "0.1.13"
 dependencies = [
  "base64 0.22.1",
  "core-foundation-sys",
diff --git a/tauri/src-tauri/Cargo.toml b/tauri/src-tauri/Cargo.toml
index 739dd34d..aa3b1a9c 100644
--- a/tauri/src-tauri/Cargo.toml
+++ b/tauri/src-tauri/Cargo.toml
@@ -1,6 +1,6 @@
 [package]
 name = "voicebox"
-version = "0.1.12"
+version = "0.1.13"
 description = "A production-quality desktop app for Qwen3-TTS voice cloning and generation"
 authors = ["you"]
 license = ""
diff --git a/tauri/src-tauri/gen/Assets.car b/tauri/src-tauri/gen/Assets.car
index de0e9a08..a67539b6 100644
Binary files a/tauri/src-tauri/gen/Assets.car and b/tauri/src-tauri/gen/Assets.car differ
diff --git a/tauri/src-tauri/src/audio_capture/linux.rs b/tauri/src-tauri/src/audio_capture/linux.rs
index 8af26e97..7550e086 100644
--- a/tauri/src-tauri/src/audio_capture/linux.rs
+++ b/tauri/src-tauri/src/audio_capture/linux.rs
@@ -1,14 +1,14 @@
 use crate::audio_capture::AudioCaptureState;
 
 pub async fn start_capture(
-    state: &AudioCaptureState,
-    max_duration_secs: u32,
+    _state: &AudioCaptureState,
+    _max_duration_secs: u32,
 ) -> Result<(), String> {
-    todo!("implement Linux audio capture")
+    Err("Audio capture is not supported on Linux, YET. Use the built-in recording features instead.".to_string())
 }
 
-pub async fn stop_capture(state: &AudioCaptureState) -> Result<String, String> {
-    todo!("implement Linux audio capture stop")
+pub async fn stop_capture(_state: &AudioCaptureState) -> Result<String, String> {
+    Err("Audio capture is not supported on Linux.".to_string())
 }
 
 pub fn is_supported() -> bool {
diff --git a/tauri/src-tauri/src/main.rs b/tauri/src-tauri/src/main.rs
index 255655aa..25251169 100644
--- a/tauri/src-tauri/src/main.rs
+++ b/tauri/src-tauri/src/main.rs
@@ -423,43 +423,30 @@ fn is_process_running(pid: u32) -> bool {
     false
 }
 
-/// Kill entire Windows process tree by enumerating children
+/// Kill an entire Windows process tree with `taskkill /PID <pid> /T /F` (WMIC is deprecated on Windows 11).
+/// Returns `Ok(())` even when taskkill exits non-zero (its stderr is only logged); `Err` only if it cannot be run.
 #[cfg(windows)]
 fn kill_windows_process_tree(parent_pid: u32) -> Result<(), String> {
     use std::process::Command;
 
-    // Find all child processes using WMIC
-    let output = Command::new("wmic")
-        .args([
-            "process",
-            "where",
-            &format!("ParentProcessId={}", parent_pid),
-            "get",
-            "ProcessId"
-        ])
+    // taskkill with /T kills the entire process tree
+    // /F = force, /T = tree (kill child processes)
+    let result = Command::new("taskkill")
+        .args(["/PID", &parent_pid.to_string(), "/T", "/F"])
         .output();
 
-    if let Ok(output) = output {
-        let output_str = String::from_utf8_lossy(&output.stdout);
-        for line in output_str.lines().skip(1) { // Skip header
-            if let Ok(child_pid) = line.trim().parse::<u32>() {
-                println!("Found child process: {}", child_pid);
-                // Recursively kill child's children
-                let _ = kill_windows_process_tree(child_pid);
-                // Kill the child
-                let _ = Command::new("taskkill")
-                    .args(["/PID", &child_pid.to_string(), "/F"])
-                    .output();
+    match result {
+        Ok(output) => {
+            if output.status.success() {
+                println!("Successfully killed process tree for PID {}", parent_pid);
+            } else {
+                let stderr = String::from_utf8_lossy(&output.stderr);
+                eprintln!("taskkill stderr: {}", stderr);
             }
+            Ok(())
         }
+        Err(e) => Err(format!("Failed to run taskkill: {}", e))
     }
-
-    // Kill the parent process
-    let _ = Command::new("taskkill")
-        .args(["/PID", &parent_pid.to_string(), "/F"])
-        .output();
-
-    Ok(())
 }
 
 #[command]
diff --git a/tauri/src-tauri/tauri.conf.json b/tauri/src-tauri/tauri.conf.json
index 53b95d18..202d22e0 100644
--- a/tauri/src-tauri/tauri.conf.json
+++ b/tauri/src-tauri/tauri.conf.json
@@ -1,7 +1,7 @@
 {
   "$schema": "https://schema.tauri.app/config/2",
   "productName": "Voicebox",
-  "version": "0.1.12",
+  "version": "0.1.13",
   "identifier": "sh.voicebox.app",
   "build": {
     "beforeDevCommand": "bun run dev",
@@ -56,7 +56,7 @@
   },
   "plugins": {
     "shell": {
-      "open": true
+      "open": "^((mailto:\\w+)|(tel:\\w+)|(https?://\\w+)|(/[^\\s]+)|([a-zA-Z]:\\\\[^\\s]*)).*"
     },
     "updater": {
       "pubkey": "dW50cnVzdGVkIGNvbW1lbnQ6IG1pbmlzaWduIHB1YmxpYyBrZXk6IEUxRENBQkRBQjdBNTM1OTIKUldTU05hVzMycXZjNGJGcUxmcVVocll2QjdSaTJNdlFxR2M3VDJsMnVvbDdyZGRPMmRlOW9aWTcK",
diff --git a/tauri/src/platform/filesystem.ts b/tauri/src/platform/filesystem.ts
index 2292a99a..226a2cba 100644
--- a/tauri/src/platform/filesystem.ts
+++ b/tauri/src/platform/filesystem.ts
@@ -1,4 +1,4 @@
-import type { PlatformFilesystem, FileFilter } from '@/platform/types';
+import type { FileFilter, PlatformFilesystem } from '@/platform/types';
 
 export const tauriFilesystem: PlatformFilesystem = {
   async saveFile(filename: string, blob: Blob, filters?: FileFilter[]) {
@@ -38,4 +38,15 @@ export const tauriFilesystem: PlatformFilesystem = {
       document.body.removeChild(a);
     }
   },
+
+  async openFolder(path: string): Promise<boolean> {
+    try {
+      const shell = await import('@tauri-apps/plugin-shell'); // loaded on demand
+      await shell.open(path); // any rejection is handled below
+    } catch (err) {
+      console.error('Failed to open folder:', err); // failure is reported to the caller as `false`
+      return false;
+    }
+    return true;
+  },
 };
diff --git a/web/index.html b/web/index.html
index 1ae976ad..c7a4be9f 100644
--- a/web/index.html
+++ b/web/index.html
@@ -1,5 +1,5 @@
 <!doctype html>
-<html lang="en">
+<html lang="en" class="dark">
   <head>
     <meta charset="UTF-8" />
     <link rel="icon" type="image/svg+xml" href="/vite.svg" />
diff --git a/web/package.json b/web/package.json
index 99d82c56..0fa0534d 100644
--- a/web/package.json
+++ b/web/package.json
@@ -1,7 +1,7 @@
 {
   "name": "@voicebox/web",
   "private": true,
-  "version": "0.1.12",
+  "version": "0.1.13",
   "type": "module",
   "scripts": {
     "dev": "vite",
@@ -17,6 +17,7 @@
     "wavesurfer.js": "^7.0.0"
   },
   "devDependencies": {
+    "@tailwindcss/vite": "^4.1.18",
     "@types/react": "^18.3.0",
     "@types/react-dom": "^18.3.0",
     "@typescript-eslint/eslint-plugin": "^7.0.0",
@@ -25,6 +26,7 @@
     "eslint": "^8.57.0",
     "eslint-plugin-react-hooks": "^4.6.0",
     "eslint-plugin-react-refresh": "^0.4.0",
+    "tailwindcss": "^4.1.0",
     "typescript": "^5.6.0",
     "vite": "^5.4.0"
   }
diff --git a/web/src/assets.d.ts b/web/src/assets.d.ts
new file mode 100644
index 00000000..1c592325
--- /dev/null
+++ b/web/src/assets.d.ts
@@ -0,0 +1,4 @@
+declare module '*.png' { // ambient typing so that importing a .png file type-checks
+  const value: string; // the default import is typed as a plain string
+  export default value;
+}
diff --git a/web/src/platform/filesystem.ts b/web/src/platform/filesystem.ts
index 1f45a49c..d2717bd2 100644
--- a/web/src/platform/filesystem.ts
+++ b/web/src/platform/filesystem.ts
@@ -1,4 +1,4 @@
-import type { PlatformFilesystem, FileFilter } from '@/platform/types';
+import type { FileFilter, PlatformFilesystem } from '@/platform/types';
 
 export const webFilesystem: PlatformFilesystem = {
   async saveFile(filename: string, blob: Blob, _filters?: FileFilter[]) {
@@ -12,4 +12,10 @@ export const webFilesystem: PlatformFilesystem = {
     window.URL.revokeObjectURL(url);
     document.body.removeChild(a);
   },
+
+  async openFolder(_path: string): Promise<boolean> {
+    // Browsers cannot open local folders for security reasons, so this always
+    // returns false; the UI is expected to show the path as read-only text instead.
+    return false;
+  },
 };
diff --git a/web/src/platform/updater.ts b/web/src/platform/updater.ts
index 32ed0148..2f8be445 100644
--- a/web/src/platform/updater.ts
+++ b/web/src/platform/updater.ts
@@ -11,10 +11,6 @@ class WebUpdater implements PlatformUpdater {
 
   private subscribers: Set<(status: UpdateStatus) => void> = new Set();
 
-  private notifySubscribers() {
-    this.subscribers.forEach((callback) => callback(this.status));
-  }
-
   subscribe(callback: (status: UpdateStatus) => void): () => void {
     this.subscribers.add(callback);
     callback(this.status);
diff --git a/web/src/vite-env.d.ts b/web/src/vite-env.d.ts
new file mode 100644
index 00000000..31a365f5
--- /dev/null
+++ b/web/src/vite-env.d.ts
@@ -0,0 +1,12 @@
+/// <reference types="vite/client" />
+
+interface ImportMetaEnv {
+  readonly VITE_SERVER_URL?: string;
+  readonly VITE_APP_VERSION?: string;
+  // PROD and DEV are intentionally not redeclared: vite/client already declares
+  // them as required booleans, and an optional redeclaration conflicts (TS2687).
+}
+
+interface ImportMeta {
+  readonly env: ImportMetaEnv;
+}
diff --git a/web/tsconfig.json b/web/tsconfig.json
index 629bcb7f..1c148061 100644
--- a/web/tsconfig.json
+++ b/web/tsconfig.json
@@ -15,6 +15,7 @@
     "noUnusedLocals": true,
     "noUnusedParameters": true,
     "noFallthroughCasesInSwitch": true,
+    "types": ["vite/client"],
     "baseUrl": ".",
     "paths": {
       "@/*": ["../app/src/*"]
diff --git a/web/vite.config.ts b/web/vite.config.ts
index 27a79a73..e418b3ef 100644
--- a/web/vite.config.ts
+++ b/web/vite.config.ts
@@ -1,9 +1,10 @@
 import path from 'node:path';
+import tailwindcss from '@tailwindcss/vite';
 import react from '@vitejs/plugin-react';
 import { defineConfig } from 'vite';
 
 export default defineConfig({
-  plugins: [react()],
+  plugins: [tailwindcss(), react()],
   resolve: {
     alias: {
       '@': path.resolve(__dirname, '../app/src'),