From 80689ad8ce53b0c7b440a8b1dc0b95239eeacaad Mon Sep 17 00:00:00 2001 From: Jamie Pine Date: Sat, 31 Jan 2026 03:05:50 -0800 Subject: [PATCH 01/33] Implement TTS provider management system and update release workflow - Added support for TTS providers in the backend, including endpoints for listing, starting, stopping, and downloading providers. - Enhanced the release workflow to build and upload TTS provider binaries for both Windows and Linux platforms. - Updated the architecture documentation to reflect the new provider system and its benefits for modularity and user experience. - Introduced a new `ProviderSettings` component in the frontend for managing provider configurations. --- .github/workflows/release.yml | 144 ++++++- .../ServerSettings/ProviderSettings.tsx | 395 ++++++++++++++++++ app/src/components/ServerTab/ServerTab.tsx | 2 + app/src/lib/api/client.ts | 71 ++++ backend/build_binary.py | 32 +- backend/main.py | 215 +++++++++- backend/providers/__init__.py | 220 ++++++++++ backend/providers/base.py | 97 +++++ backend/providers/bundled.py | 139 ++++++ backend/providers/installer.py | 211 ++++++++++ backend/providers/local.py | 187 +++++++++ backend/providers/types.py | 34 ++ backend/tts.py | 52 ++- docs/plans/TTS_PROVIDER_ARCHITECTURE.md | 232 +++++----- providers/README.md | 291 +++++++++++++ providers/pytorch-cpu/build.py | 82 ++++ providers/pytorch-cpu/main.py | 238 +++++++++++ providers/pytorch-cpu/requirements.txt | 8 + providers/pytorch-cuda/build.py | 84 ++++ providers/pytorch-cuda/main.py | 238 +++++++++++ providers/pytorch-cuda/requirements.txt | 10 + 21 files changed, 2811 insertions(+), 171 deletions(-) create mode 100644 app/src/components/ServerSettings/ProviderSettings.tsx create mode 100644 backend/providers/__init__.py create mode 100644 backend/providers/base.py create mode 100644 backend/providers/bundled.py create mode 100644 backend/providers/installer.py create mode 100644 backend/providers/local.py create mode 100644 
backend/providers/types.py create mode 100644 providers/README.md create mode 100644 providers/pytorch-cpu/build.py create mode 100644 providers/pytorch-cpu/main.py create mode 100644 providers/pytorch-cpu/requirements.txt create mode 100644 providers/pytorch-cuda/build.py create mode 100644 providers/pytorch-cuda/main.py create mode 100644 providers/pytorch-cuda/requirements.txt diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index 9e65f520..de067112 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -6,7 +6,114 @@ on: tags: - "v*" +env: + PROVIDER_VERSION: "1.0.0" + jobs: + # ============================================ + # Build TTS Providers (uploaded to R2, not GitHub) + # ============================================ + build-providers: + runs-on: ${{ matrix.platform }} + strategy: + fail-fast: false + matrix: + include: + # PyTorch CPU provider (Windows) + - platform: "windows-latest" + provider: "pytorch-cpu" + python-version: "3.12" + # PyTorch CUDA provider (Windows) - large binary, uploaded to R2 + - platform: "windows-latest" + provider: "pytorch-cuda" + python-version: "3.12" + # PyTorch CPU provider (Linux) + - platform: "ubuntu-22.04" + provider: "pytorch-cpu" + python-version: "3.12" + # PyTorch CUDA provider (Linux) - large binary, uploaded to R2 + - platform: "ubuntu-22.04" + provider: "pytorch-cuda" + python-version: "3.12" + + steps: + - uses: actions/checkout@v4 + + - name: Install dependencies (ubuntu only) + if: matrix.platform == 'ubuntu-22.04' + run: | + sudo apt-get update + sudo apt-get install -y llvm-dev + + - name: Setup Python + uses: actions/setup-python@v5 + with: + python-version: ${{ matrix.python-version }} + cache: "pip" + + - name: Install Python dependencies (CPU) + if: matrix.provider == 'pytorch-cpu' + run: | + python -m pip install --upgrade pip + pip install pyinstaller + pip install -r providers/pytorch-cpu/requirements.txt + pip install -r backend/requirements.txt + 
+ - name: Install Python dependencies (CUDA) + if: matrix.provider == 'pytorch-cuda' + run: | + python -m pip install --upgrade pip + pip install pyinstaller + pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121 + pip install -r providers/pytorch-cuda/requirements.txt + pip install -r backend/requirements.txt + + - name: Build provider binary + shell: bash + run: | + cd providers/${{ matrix.provider }} + python build.py + + - name: Upload provider to R2 + shell: bash + env: + R2_ACCESS_KEY_ID: ${{ secrets.R2_ACCESS_KEY_ID }} + R2_SECRET_ACCESS_KEY: ${{ secrets.R2_SECRET_ACCESS_KEY }} + R2_ENDPOINT: ${{ secrets.R2_ENDPOINT }} + run: | + # Install AWS CLI (compatible with R2) + pip install awscli + + # Configure AWS CLI for R2 + aws configure set aws_access_key_id $R2_ACCESS_KEY_ID + aws configure set aws_secret_access_key $R2_SECRET_ACCESS_KEY + aws configure set region auto + + # Determine binary name based on platform + if [ "${{ matrix.platform }}" == "windows-latest" ]; then + BINARY_NAME="tts-provider-${{ matrix.provider }}.exe" + BINARY_PATH="providers/${{ matrix.provider }}/dist/tts-provider-${{ matrix.provider }}.exe" + else + BINARY_NAME="tts-provider-${{ matrix.provider }}" + BINARY_PATH="providers/${{ matrix.provider }}/dist/tts-provider-${{ matrix.provider }}" + fi + + # Add platform suffix for clarity + if [ "${{ matrix.platform }}" == "windows-latest" ]; then + UPLOAD_NAME="tts-provider-${{ matrix.provider }}-windows.exe" + else + UPLOAD_NAME="tts-provider-${{ matrix.provider }}-linux" + fi + + # Upload to R2 (bucket: voicebox) + aws s3 cp "$BINARY_PATH" "s3://voicebox/providers/v${{ env.PROVIDER_VERSION }}/$UPLOAD_NAME" \ + --endpoint-url "$R2_ENDPOINT" + + echo "Uploaded $UPLOAD_NAME to R2" + + # ============================================ + # Build Main App (without bundled TTS on Win/Linux) + # ============================================ release: permissions: contents: write @@ -14,22 +121,26 @@ jobs: 
fail-fast: false matrix: include: + # macOS Apple Silicon - MLX bundled (works out of the box) - platform: "macos-latest" args: "--target aarch64-apple-darwin" python-version: "3.12" backend: "mlx" + # macOS Intel - PyTorch bundled (smaller user base, keep simple) - platform: "macos-15-intel" args: "--target x86_64-apple-darwin" python-version: "3.12" backend: "pytorch" + # Linux - No TTS bundled, providers downloaded separately # - platform: 'ubuntu-22.04' # args: '' # python-version: '3.12' - # backend: 'pytorch' + # backend: 'none' + # Windows - No TTS bundled, providers downloaded separately - platform: "windows-latest" args: "" python-version: "3.12" - backend: "pytorch" + backend: "none" runs-on: ${{ matrix.platform }} @@ -55,23 +166,27 @@ jobs: python-version: ${{ matrix.python-version }} cache: "pip" - - name: Install Python dependencies + - name: Install Python dependencies (with TTS) + if: matrix.backend != 'none' run: | python -m pip install --upgrade pip pip install pyinstaller pip install -r backend/requirements.txt + - name: Install Python dependencies (without TTS) + if: matrix.backend == 'none' + run: | + python -m pip install --upgrade pip + pip install pyinstaller + # Install base requirements without PyTorch/Qwen-TTS + pip install fastapi uvicorn sqlalchemy librosa soundfile numpy httpx + pip install huggingface_hub # For Whisper downloads + - name: Install MLX dependencies (Apple Silicon only) if: matrix.backend == 'mlx' run: | pip install -r backend/requirements-mlx.txt - # - name: Install PyTorch with CUDA (Windows only) - # if: matrix.platform == 'windows-latest' - # run: | - # pip install torch --index-url https://download.pytorch.org/whl/cu121 --force-reinstall --no-deps - # pip install torchvision torchaudio --index-url https://download.pytorch.org/whl/cu121 - - name: Build Python server (Linux/macOS) if: matrix.platform != 'windows-latest' run: | @@ -148,10 +263,15 @@ jobs: See the assets below to download and install this version. 
### Installation - - **macOS (Apple Silicon)**: Download the `aarch64.dmg` file - uses MLX for fast native inference + - **macOS (Apple Silicon)**: Download the `aarch64.dmg` file - uses MLX for fast native inference (works out of the box) - **macOS (Intel)**: Download the `x64.dmg` file - uses PyTorch - - **Windows**: Download the `.msi` installer - - **Linux**: Download the `.AppImage` or `.deb` package + - **Windows**: Download the `.msi` installer - requires downloading a TTS provider on first use + - **Linux**: Download the `.AppImage` or `.deb` package - requires downloading a TTS provider on first use + + ### TTS Providers (Windows/Linux) + Windows and Linux users will be prompted to download a TTS provider on first launch: + - **PyTorch CPU** (~300MB) - Works on any system + - **PyTorch CUDA** (~2.4GB) - 4-5x faster on NVIDIA GPUs The app includes automatic updates - future updates will be installed automatically. releaseDraft: true diff --git a/app/src/components/ServerSettings/ProviderSettings.tsx b/app/src/components/ServerSettings/ProviderSettings.tsx new file mode 100644 index 00000000..c18874a9 --- /dev/null +++ b/app/src/components/ServerSettings/ProviderSettings.tsx @@ -0,0 +1,395 @@ +import { useMutation, useQuery, useQueryClient } from '@tanstack/react-query'; +import { Download, Loader2, Trash2 } from 'lucide-react'; +import { useCallback, useState } from 'react'; +import { + AlertDialog, + AlertDialogAction, + AlertDialogCancel, + AlertDialogContent, + AlertDialogDescription, + AlertDialogFooter, + AlertDialogHeader, + AlertDialogTitle, +} from '@/components/ui/alert-dialog'; +import { Badge } from '@/components/ui/badge'; +import { Button } from '@/components/ui/button'; +import { Card, CardContent, CardDescription, CardHeader, CardTitle } from '@/components/ui/card'; +import { Label } from '@/components/ui/label'; +import { RadioGroup, RadioGroupItem } from '@/components/ui/radio-group'; +import { useToast } from '@/components/ui/use-toast'; 
+import { apiClient } from '@/lib/api/client'; +import { useModelDownloadToast } from '@/lib/hooks/useModelDownloadToast'; + +const isMacOS = () => navigator.platform.toLowerCase().includes('mac'); + +type ProviderType = 'auto' | 'bundled-mlx' | 'bundled-pytorch' | 'pytorch-cpu' | 'pytorch-cuda' | 'remote' | 'openai'; + +export function ProviderSettings() { + const { toast } = useToast(); + const queryClient = useQueryClient(); + const [selectedProvider, setSelectedProvider] = useState('auto'); + const [downloadingProvider, setDownloadingProvider] = useState(null); + + const { data: providersData, isLoading } = useQuery({ + queryKey: ['providers'], + queryFn: async () => { + return await apiClient.listProviders(); + }, + refetchInterval: 5000, + }); + + const { data: activeProvider } = useQuery({ + queryKey: ['activeProvider'], + queryFn: async () => { + return await apiClient.getActiveProvider(); + }, + refetchInterval: 5000, + }); + + // Callbacks for download completion + const handleDownloadComplete = useCallback(() => { + setDownloadingProvider(null); + queryClient.invalidateQueries({ queryKey: ['providers'] }); + }, [queryClient]); + + const handleDownloadError = useCallback(() => { + setDownloadingProvider(null); + }, []); + + // Use progress toast hook for the downloading provider + useModelDownloadToast({ + modelName: downloadingProvider || '', + displayName: downloadingProvider || '', + enabled: !!downloadingProvider, + onComplete: handleDownloadComplete, + onError: handleDownloadError, + }); + + const [deleteDialogOpen, setDeleteDialogOpen] = useState(false); + const [providerToDelete, setProviderToDelete] = useState(null); + + const downloadMutation = useMutation({ + mutationFn: async (providerType: string) => { + return await apiClient.downloadProvider(providerType); + }, + onSuccess: (_, providerType) => { + setDownloadingProvider(providerType); + queryClient.invalidateQueries({ queryKey: ['providers'] }); + }, + onError: (error: Error) => { + toast({ 
+ title: 'Download failed', + description: error.message, + variant: 'destructive', + }); + }, + }); + + const startMutation = useMutation({ + mutationFn: async (providerType: string) => { + return await apiClient.startProvider(providerType); + }, + onSuccess: () => { + queryClient.invalidateQueries({ queryKey: ['activeProvider'] }); + toast({ + title: 'Provider started', + description: 'The provider has been started successfully', + }); + }, + onError: (error: Error) => { + toast({ + title: 'Failed to start provider', + description: error.message, + variant: 'destructive', + }); + }, + }); + + const deleteMutation = useMutation({ + mutationFn: async (providerType: string) => { + return await apiClient.deleteProvider(providerType); + }, + onSuccess: () => { + queryClient.invalidateQueries({ queryKey: ['providers'] }); + toast({ + title: 'Provider deleted', + description: 'The provider has been deleted successfully', + }); + }, + onError: (error: Error) => { + toast({ + title: 'Failed to delete provider', + description: error.message, + variant: 'destructive', + }); + }, + }); + + const handleDownload = async (providerType: string) => { + downloadMutation.mutate(providerType); + }; + + const handleStart = async (providerType: string) => { + startMutation.mutate(providerType); + }; + + const handleDelete = (providerType: string) => { + setProviderToDelete(providerType); + setDeleteDialogOpen(true); + }; + + const confirmDelete = () => { + if (providerToDelete) { + deleteMutation.mutate(providerToDelete); + setDeleteDialogOpen(false); + setProviderToDelete(null); + } + }; + + if (isLoading) { + return ( + + + TTS Provider + Choose how Voicebox generates speech + + +
+ +
+
+
+ ); + } + + const installedProviders = providersData?.installed || []; + + // Determine current active provider + const currentProvider = activeProvider?.provider || 'auto'; + + return ( + <> + + + TTS Provider + Choose how Voicebox generates speech + + + setSelectedProvider(value as ProviderType)} + > + {/* Auto-detect */} +
+ + + {currentProvider === 'auto' && ( + + Active + + )} +
+ + {/* PyTorch CUDA */} +
+
+ + +
+
+ {currentProvider === 'pytorch-cuda' && ( + Active + )} + {!installedProviders.includes('pytorch-cuda') && ( + + )} + {installedProviders.includes('pytorch-cuda') && selectedProvider !== 'pytorch-cuda' && ( + + )} + {installedProviders.includes('pytorch-cuda') && ( + + )} +
+
+ + {/* PyTorch CPU (Windows/Linux only) */} + {!isMacOS() && ( +
+
+ + +
+
+ {currentProvider === 'pytorch-cpu' && ( + Active + )} + {!installedProviders.includes('pytorch-cpu') && ( + + )} + {installedProviders.includes('pytorch-cpu') && selectedProvider !== 'pytorch-cpu' && ( + + )} + {installedProviders.includes('pytorch-cpu') && ( + + )} +
+
+ )} + + {/* MLX bundled (macOS only) */} + {isMacOS() && ( +
+
+
+ MLX (Apple Silicon) + {currentProvider === 'bundled-mlx' && ( + Active + )} +
+
+ Bundled with the app - optimized for M1/M2/M3 chips +
+
+
+ )} + + {/* Remote */} +
+
+ + +
+ {selectedProvider === 'remote' && ( +
+ +
+ Remote provider support coming soon +
+
+ )} +
+ + {/* OpenAI */} +
+
+ + +
+ {selectedProvider === 'openai' && ( +
+ +
+ OpenAI provider support coming soon +
+
+ )} +
+
+
+
+ + + + + Delete Provider + + Are you sure you want to delete {providerToDelete}? This will remove the provider + binary from your system. You can download it again later if needed. + + + + Cancel + + Delete + + + + + + ); +} diff --git a/app/src/components/ServerTab/ServerTab.tsx b/app/src/components/ServerTab/ServerTab.tsx index abf91ac2..5a512027 100644 --- a/app/src/components/ServerTab/ServerTab.tsx +++ b/app/src/components/ServerTab/ServerTab.tsx @@ -1,6 +1,7 @@ import { ConnectionForm } from '@/components/ServerSettings/ConnectionForm'; import { ServerStatus } from '@/components/ServerSettings/ServerStatus'; import { UpdateStatus } from '@/components/ServerSettings/UpdateStatus'; +import { ProviderSettings } from '@/components/ServerSettings/ProviderSettings'; import { usePlatform } from '@/platform/PlatformContext'; export function ServerTab() { @@ -11,6 +12,7 @@ export function ServerTab() { + {platform.metadata.isTauri && }
Created by{' '} diff --git a/app/src/lib/api/client.ts b/app/src/lib/api/client.ts index c5b079b2..b5da41a6 100644 --- a/app/src/lib/api/client.ts +++ b/app/src/lib/api/client.ts @@ -199,6 +199,77 @@ class ApiClient { }); } + // Providers + async listProviders(): Promise<{ + providers: Array<{ + type: string; + name: string; + installed: boolean; + size_mb: number | null; + }>; + installed: string[]; + }> { + return this.request('/providers'); + } + + async getActiveProvider(): Promise<{ + provider: string; + health: { + status: string; + provider: string; + version: string | null; + model: string | null; + device: string | null; + }; + status: { + model_loaded: boolean; + model_size: string | null; + available_sizes: string[]; + gpu_available: boolean | null; + vram_used_mb: number | null; + }; + }> { + return this.request('/providers/active'); + } + + async startProvider(providerType: string): Promise<{ + message: string; + provider: { + status: string; + provider: string; + version: string | null; + model: string | null; + device: string | null; + }; + }> { + return this.request('/providers/start', { + method: 'POST', + body: JSON.stringify({ provider_type: providerType }), + }); + } + + async stopProvider(): Promise<{ message: string }> { + return this.request('/providers/stop', { + method: 'POST', + }); + } + + async downloadProvider(providerType: string): Promise<{ + message: string; + provider_type: string; + }> { + return this.request('/providers/download', { + method: 'POST', + body: JSON.stringify({ provider_type: providerType }), + }); + } + + async deleteProvider(providerType: string): Promise<{ message: string }> { + return this.request(`/providers/${providerType}`, { + method: 'DELETE', + }); + } + // History async listHistory(query?: HistoryQuery): Promise { const params = new URLSearchParams(); diff --git a/backend/build_binary.py b/backend/build_binary.py index a2973cd4..fb65863e 100644 --- a/backend/build_binary.py +++ b/backend/build_binary.py @@ 
-30,7 +30,7 @@ def build_server(): args.extend(['--paths', str(qwen_tts_path)]) print(f"Using local qwen_tts source from: {qwen_tts_path}") - # Add common hidden imports + # Add common hidden imports (always included) args.extend([ '--hidden-import', 'backend', '--hidden-import', 'backend.main', @@ -42,38 +42,30 @@ def build_server(): '--hidden-import', 'backend.tts', '--hidden-import', 'backend.transcribe', '--hidden-import', 'backend.platform_detect', - '--hidden-import', 'backend.backends', - '--hidden-import', 'backend.backends.pytorch_backend', + '--hidden-import', 'backend.providers', + '--hidden-import', 'backend.providers.base', + '--hidden-import', 'backend.providers.bundled', + '--hidden-import', 'backend.providers.types', '--hidden-import', 'backend.utils.audio', '--hidden-import', 'backend.utils.cache', '--hidden-import', 'backend.utils.progress', '--hidden-import', 'backend.utils.hf_progress', '--hidden-import', 'backend.utils.validation', - '--hidden-import', 'torch', - '--hidden-import', 'transformers', '--hidden-import', 'fastapi', '--hidden-import', 'uvicorn', '--hidden-import', 'sqlalchemy', '--hidden-import', 'librosa', '--hidden-import', 'soundfile', - '--hidden-import', 'qwen_tts', - '--hidden-import', 'qwen_tts.inference', - '--hidden-import', 'qwen_tts.inference.qwen3_tts_model', - '--hidden-import', 'qwen_tts.inference.qwen3_tts_tokenizer', - '--hidden-import', 'qwen_tts.core', - '--hidden-import', 'qwen_tts.cli', - '--copy-metadata', 'qwen-tts', - '--collect-submodules', 'qwen_tts', - '--collect-data', 'qwen_tts', # Fix for pkg_resources and jaraco namespace packages '--hidden-import', 'pkg_resources.extern', '--collect-submodules', 'jaraco', ]) - # Add MLX-specific imports if building on Apple Silicon + # Platform-specific TTS backend handling if is_apple_silicon(): - print("Building for Apple Silicon - including MLX dependencies") + print("Building for Apple Silicon - including MLX dependencies (bundled)") args.extend([ + 
'--hidden-import', 'backend.backends', '--hidden-import', 'backend.backends.mlx_backend', '--hidden-import', 'mlx', '--hidden-import', 'mlx.core', @@ -88,7 +80,13 @@ def build_server(): '--collect-data', 'mlx_audio', ]) else: - print("Building for non-Apple Silicon platform - PyTorch only") + print("Building for Windows/Linux - excluding PyTorch/Qwen-TTS (providers downloaded separately)") + # Note: PyTorch and Qwen-TTS are NOT included - users will download providers separately + # Only include backend abstraction (no actual TTS implementation) + args.extend([ + '--hidden-import', 'backend.backends', + '--hidden-import', 'backend.backends.pytorch_backend', # Keep for reference, but won't work without PyTorch + ]) args.extend([ '--noconfirm', diff --git a/backend/main.py b/backend/main.py index 59fb9e18..3bd4b7e6 100644 --- a/backend/main.py +++ b/backend/main.py @@ -29,6 +29,8 @@ from .utils.tasks import get_task_manager from .utils.cache import clear_voice_prompt_cache from .platform_detect import get_backend_type +from .providers import get_provider_manager +from .providers.types import ProviderType app = FastAPI( title="voicebox API", @@ -74,7 +76,7 @@ async def health(): from pathlib import Path import os - tts_model = tts.get_tts_model() + tts_model = await tts.get_tts_model_async() backend_type = get_backend_type() # Check for GPU availability (CUDA or MPS) @@ -549,7 +551,7 @@ async def generate_speech( ) # Generate audio - tts_model = tts.get_tts_model() + tts_model = await tts.get_tts_model_async() # Load the requested model size if different from current (async to not block) model_size = data.model_size or "1.7B" @@ -1113,8 +1115,8 @@ async def get_sample_audio(sample_id: str, db: Session = Depends(get_db)): async def load_model(model_size: str = "1.7B"): """Manually load TTS model.""" try: - tts_model = tts.get_tts_model() - await tts_model.load_model_async(model_size) + tts_model = await tts.get_tts_model_async() + await tts_model.load_model(model_size) 
return {"message": f"Model {model_size} loaded successfully"} except Exception as e: raise HTTPException(status_code=500, detail=str(e)) @@ -1172,10 +1174,10 @@ async def get_model_status(): except ImportError: use_scan_cache = False - def check_tts_loaded(model_size: str): + async def check_tts_loaded(model_size: str): """Check if TTS model is loaded with specific size.""" try: - tts_model = tts.get_tts_model() + tts_model = await tts.get_tts_model_async() return tts_model.is_loaded() and getattr(tts_model, 'model_size', None) == model_size except Exception: return False @@ -1211,14 +1213,14 @@ def check_whisper_loaded(model_size: str): "display_name": "Qwen TTS 1.7B", "hf_repo_id": tts_1_7b_id, "model_size": "1.7B", - "check_loaded": lambda: check_tts_loaded("1.7B"), + "check_loaded": lambda: check_tts_loaded("1.7B"), # Async function }, { "model_name": "qwen-tts-0.6B", "display_name": "Qwen TTS 0.6B", "hf_repo_id": tts_0_6b_id, "model_size": "0.6B", - "check_loaded": lambda: check_tts_loaded("0.6B"), + "check_loaded": lambda: check_tts_loaded("0.6B"), # Async function }, { "model_name": "whisper-base", @@ -1356,7 +1358,11 @@ def check_whisper_loaded(model_size: str): # Check if loaded in memory try: - loaded = config["check_loaded"]() + check_func = config["check_loaded"] + if asyncio.iscoroutinefunction(check_func): + loaded = await check_func() + else: + loaded = check_func() except Exception: loaded = False @@ -1379,7 +1385,11 @@ def check_whisper_loaded(model_size: str): except Exception as e: # If check fails, try to at least check if loaded try: - loaded = config["check_loaded"]() + check_func = config["check_loaded"] + if asyncio.iscoroutinefunction(check_func): + loaded = await check_func() + else: + loaded = check_func() except Exception: loaded = False @@ -1406,14 +1416,24 @@ async def trigger_model_download(request: models.ModelDownloadRequest): task_manager = get_task_manager() progress_manager = get_progress_manager() + async def 
load_tts_model_1_7b(): + """Load 1.7B TTS model.""" + tts_model = await tts.get_tts_model_async() + await tts_model.load_model("1.7B") + + async def load_tts_model_0_6b(): + """Load 0.6B TTS model.""" + tts_model = await tts.get_tts_model_async() + await tts_model.load_model("0.6B") + model_configs = { "qwen-tts-1.7B": { "model_size": "1.7B", - "load_func": lambda: tts.get_tts_model().load_model("1.7B"), + "load_func": load_tts_model_1_7b, }, "qwen-tts-0.6B": { "model_size": "0.6B", - "load_func": lambda: tts.get_tts_model().load_model("0.6B"), + "load_func": load_tts_model_0_6b, }, "whisper-base": { "model_size": "base", @@ -1472,6 +1492,171 @@ async def download_in_background(): return {"message": f"Model {request.model_name} download started"} +# ============================================ +# PROVIDER ENDPOINTS +# ============================================ + +@app.get("/providers") +async def list_providers(): + """List all available provider types.""" + manager = get_provider_manager() + installed = await manager.list_installed() + + # Get info for all known provider types + all_providers = [ + "bundled-mlx", + "bundled-pytorch", + "pytorch-cpu", + "pytorch-cuda", + "remote", + "openai", + ] + + providers_info = [] + for provider_type in all_providers: + info = await manager.get_provider_info(provider_type) + providers_info.append(info) + + return { + "providers": providers_info, + "installed": installed, + } + + +@app.get("/providers/installed") +async def list_installed_providers(): + """List installed provider types.""" + manager = get_provider_manager() + installed = await manager.list_installed() + return {"installed": installed} + + +@app.get("/providers/active") +async def get_active_provider(): + """Get information about the currently active provider.""" + manager = get_provider_manager() + provider = await manager.get_active_provider() + + health = await provider.health() + status = await provider.status() + + return { + "provider": 
health["provider"], + "health": health, + "status": status, + } + + +@app.post("/providers/start") +async def start_provider(data: dict): + """Start a specific provider.""" + provider_type = data.get("provider_type") + if not provider_type: + raise HTTPException(status_code=400, detail="provider_type is required") + + manager = get_provider_manager() + try: + await manager.start_provider(provider_type) + provider = await manager.get_active_provider() + health = await provider.health() + return { + "message": f"Provider {provider_type} started", + "provider": health, + } + except NotImplementedError as e: + raise HTTPException(status_code=501, detail=str(e)) + except ValueError as e: + raise HTTPException(status_code=400, detail=str(e)) + except Exception as e: + raise HTTPException(status_code=500, detail=str(e)) + + +@app.post("/providers/stop") +async def stop_provider(): + """Stop the currently active provider.""" + manager = get_provider_manager() + await manager.stop_provider() + return {"message": "Provider stopped"} + + +@app.post("/providers/download") +async def download_provider_endpoint(data: dict): + """Download a provider binary.""" + from .providers.installer import download_provider + + provider_type = data.get("provider_type") + if not provider_type: + raise HTTPException(status_code=400, detail="provider_type is required") + + if provider_type not in ["pytorch-cpu", "pytorch-cuda"]: + raise HTTPException( + status_code=400, + detail=f"Provider type {provider_type} cannot be downloaded" + ) + + try: + # Start download in background + asyncio.create_task(download_provider(provider_type)) + return { + "message": f"Provider {provider_type} download started", + "provider_type": provider_type, + } + except Exception as e: + raise HTTPException(status_code=500, detail=str(e)) + + +@app.get("/providers/download/progress/{provider_type}") +async def get_provider_download_progress(provider_type: str): + """Get provider download progress via Server-Sent 
Events.""" + from fastapi.responses import StreamingResponse + from .utils.progress import get_progress_manager + + progress_manager = get_progress_manager() + + async def event_generator(): + """Generate SSE events for provider download progress.""" + import asyncio + import json + + last_progress = None + + while True: + progress = progress_manager.get_progress(provider_type) + + if progress and progress != last_progress: + yield f"data: {json.dumps(progress)}\n\n" + last_progress = progress + + if progress.get("status") in ["complete", "error"]: + break + + await asyncio.sleep(0.5) + + return StreamingResponse(event_generator(), media_type="text/event-stream") + + +@app.delete("/providers/{provider_type}") +async def delete_provider_endpoint(provider_type: str): + """Delete an installed provider.""" + from .providers.installer import delete_provider + + if provider_type not in ["pytorch-cpu", "pytorch-cuda"]: + raise HTTPException( + status_code=400, + detail=f"Provider type {provider_type} cannot be deleted" + ) + + deleted = delete_provider(provider_type) + + if deleted: + return {"message": f"Provider {provider_type} deleted successfully"} + else: + raise HTTPException( + status_code=404, + detail=f"Provider {provider_type} not found" + ) + + @app.delete("/models/{model_name}") async def delete_model(model_name: str): """Delete a downloaded model from the HuggingFace cache.""" @@ -1522,9 +1707,9 @@ async def delete_model(model_name: str): try: # Check if model is loaded and unload it first if config["model_type"] == "tts": - tts_model = tts.get_tts_model() - if tts_model.is_loaded() and tts_model.model_size == config["model_size"]: - tts.unload_tts_model() + tts_model = await tts.get_tts_model_async() + if tts_model.is_loaded() and getattr(tts_model, 'model_size', None) == config["model_size"]: + tts_model.unload_model() elif config["model_type"] == "whisper": whisper_model = transcribe.get_whisper_model() if whisper_model.is_loaded() and 
whisper_model.model_size == config["model_size"]: diff --git a/backend/providers/__init__.py b/backend/providers/__init__.py new file mode 100644 index 00000000..09854d77 --- /dev/null +++ b/backend/providers/__init__.py @@ -0,0 +1,220 @@ +""" +Provider management system for TTS providers. +""" + +from typing import Optional +import platform +from pathlib import Path + +from .base import TTSProvider +from .types import ProviderType +from .bundled import BundledProvider +from .local import LocalProvider +from .installer import get_provider_binary_path +from ..config import get_data_dir +import subprocess +import socket + + +class ProviderManager: + """Manages TTS provider lifecycle.""" + + def __init__(self): + self.active_provider: Optional[TTSProvider] = None + self._default_provider: Optional[TTSProvider] = None + self._provider_process: Optional[subprocess.Popen] = None + self._provider_port: Optional[int] = None + + def _get_default_provider(self) -> TTSProvider: + """Get the default bundled provider.""" + if self._default_provider is None: + self._default_provider = BundledProvider() + return self._default_provider + + async def get_active_provider(self) -> TTSProvider: + """ + Get the currently active provider. + + Returns: + Active TTS provider instance + """ + if self.active_provider is None: + # Default to bundled provider + self.active_provider = self._get_default_provider() + return self.active_provider + + async def start_provider(self, provider_type: str) -> None: + """ + Start a TTS provider. + + Args: + provider_type: Type of provider to start + """ + if provider_type in ["bundled-mlx", "bundled-pytorch"]: + # Use bundled provider + self.active_provider = self._get_default_provider() + elif provider_type in ["pytorch-cpu", "pytorch-cuda"]: + # Start local provider subprocess + provider_path = get_provider_binary_path(provider_type) + if not provider_path or not provider_path.exists(): + raise ValueError(f"Provider {provider_type} is not installed. 
Please download it first.") + + # Find a free port + port = self._get_free_port() + + # Start provider subprocess + from ..config import get_data_dir + process = subprocess.Popen( + [ + str(provider_path), + "--port", str(port), + "--data-dir", str(get_data_dir()), + ], + stdout=subprocess.PIPE, + stderr=subprocess.PIPE, + ) + + # Wait for provider to be ready + base_url = f"http://127.0.0.1:{port}" + await self._wait_for_provider_health(base_url, timeout=30) + + # Create LocalProvider instance + self.active_provider = LocalProvider(base_url) + self._provider_process = process + self._provider_port = port + elif provider_type == "remote": + # Remote provider - will be implemented in Phase 5 + raise NotImplementedError("Remote provider not yet implemented") + elif provider_type == "openai": + # OpenAI provider - will be implemented in Phase 5 + raise NotImplementedError("OpenAI provider not yet implemented") + else: + raise ValueError(f"Unknown provider type: {provider_type}") + + async def stop_provider(self) -> None: + """Stop the active provider.""" + if self.active_provider: + # Only stop if it's not the default bundled provider + if self.active_provider is not self._default_provider: + if hasattr(self.active_provider, 'stop'): + await self.active_provider.stop() + self.active_provider = None + + # Stop subprocess if running + if self._provider_process: + self._provider_process.terminate() + try: + self._provider_process.wait(timeout=5) + except subprocess.TimeoutExpired: + self._provider_process.kill() + self._provider_process = None + self._provider_port = None + + async def list_installed(self) -> list[str]: + """ + List installed provider types. 
+ + Returns: + List of installed provider type strings + """ + installed = [] + + # Bundled providers are always available + system = platform.system() + machine = platform.machine() + + if system == "Darwin" and machine == "arm64": + installed.append("bundled-mlx") + else: + installed.append("bundled-pytorch") + + # Check for downloaded providers (Phase 2) + providers_dir = _get_providers_dir() + if providers_dir.exists(): + for provider_file in providers_dir.glob("tts-provider-*"): + if provider_file.is_file() and provider_file.stat().st_size > 0: + name = provider_file.name + if "pytorch-cpu" in name: + installed.append("pytorch-cpu") + elif "pytorch-cuda" in name: + installed.append("pytorch-cuda") + + return installed + + async def get_provider_info(self, provider_type: str) -> dict: + """ + Get information about a provider. + + Args: + provider_type: Type of provider + + Returns: + Provider information dictionary + """ + if provider_type in ["bundled-mlx", "bundled-pytorch"]: + return { + "type": provider_type, + "name": "Bundled Provider", + "installed": True, + "size_mb": None, # Bundled, no separate size + } + elif provider_type == "pytorch-cpu": + return { + "type": provider_type, + "name": "PyTorch CPU", + "installed": provider_type in await self.list_installed(), + "size_mb": 300, + } + elif provider_type == "pytorch-cuda": + return { + "type": provider_type, + "name": "PyTorch CUDA", + "installed": provider_type in await self.list_installed(), + "size_mb": 2400, + } + else: + return { + "type": provider_type, + "name": provider_type, + "installed": False, + "size_mb": None, + } + + + def _get_free_port(self) -> int: + """Get a free port for the provider server.""" + with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as s: + s.bind(('', 0)) + return s.getsockname()[1] + + async def _wait_for_provider_health(self, base_url: str, timeout: int = 30) -> None: + """Wait for provider to become healthy.""" + import httpx + import asyncio + + start_time = 
asyncio.get_event_loop().time() + while True: + try: + async with httpx.AsyncClient(timeout=2.0) as client: + response = await client.get(f"{base_url}/tts/health") + if response.status_code == 200: + return + except Exception: + pass + + if asyncio.get_event_loop().time() - start_time > timeout: + raise TimeoutError(f"Provider did not become healthy within {timeout} seconds") + + await asyncio.sleep(0.5) + + +# Global provider manager instance +_provider_manager: Optional[ProviderManager] = None + + +def get_provider_manager() -> ProviderManager: + """Get the global provider manager instance.""" + global _provider_manager + if _provider_manager is None: + _provider_manager = ProviderManager() + return _provider_manager diff --git a/backend/providers/base.py b/backend/providers/base.py new file mode 100644 index 00000000..f3a6b4c2 --- /dev/null +++ b/backend/providers/base.py @@ -0,0 +1,97 @@ +""" +Base protocol for TTS providers. +""" + +from typing import Protocol, Optional, Tuple +from typing_extensions import runtime_checkable +import numpy as np + +from .types import ProviderHealth, ProviderStatus + + +@runtime_checkable +class TTSProvider(Protocol): + """Protocol for TTS provider implementations.""" + + async def generate( + self, + text: str, + voice_prompt: dict, + language: str = "en", + seed: Optional[int] = None, + instruct: Optional[str] = None, + ) -> Tuple[np.ndarray, int]: + """ + Generate speech audio from text. + + Args: + text: Text to synthesize + voice_prompt: Voice prompt dictionary + language: Language code + seed: Random seed for reproducibility + instruct: Delivery instructions + + Returns: + Tuple of (audio_array, sample_rate) + """ + ... + + async def create_voice_prompt( + self, + audio_path: str, + reference_text: str, + use_cache: bool = True, + ) -> Tuple[dict, bool]: + """ + Create voice prompt from reference audio. 
+ + Args: + audio_path: Path to reference audio file + reference_text: Transcript of the audio + use_cache: Whether to use cached prompts + + Returns: + Tuple of (voice_prompt_dict, was_cached) + """ + ... + + async def combine_voice_prompts( + self, + audio_paths: list[str], + reference_texts: list[str], + ) -> Tuple[np.ndarray, str]: + """ + Combine multiple voice prompts. + + Args: + audio_paths: List of audio file paths + reference_texts: List of reference texts + + Returns: + Tuple of (combined_audio_array, combined_text) + """ + ... + + async def load_model(self, model_size: str) -> None: + """Load TTS model.""" + ... + + def unload_model(self) -> None: + """Unload model to free memory.""" + ... + + def is_loaded(self) -> bool: + """Check if model is loaded.""" + ... + + def _get_model_path(self, model_size: str) -> str: + """Get model path for a given size.""" + ... + + async def health(self) -> ProviderHealth: + """Get provider health status.""" + ... + + async def status(self) -> ProviderStatus: + """Get provider model status.""" + ... diff --git a/backend/providers/bundled.py b/backend/providers/bundled.py new file mode 100644 index 00000000..b4a5e2ca --- /dev/null +++ b/backend/providers/bundled.py @@ -0,0 +1,139 @@ +""" +Bundled provider that wraps existing MLX/PyTorch backends. 
+""" + +from typing import Optional, Tuple +import numpy as np +import platform + +from .base import TTSProvider +from .types import ProviderHealth, ProviderStatus +from ..backends import get_tts_backend, TTSBackend +from ..platform_detect import get_backend_type + + +class BundledProvider: + """Provider that wraps the existing bundled TTS backend.""" + + def __init__(self): + self._backend: Optional[TTSBackend] = None + + def _get_backend(self) -> TTSBackend: + """Get or create backend instance.""" + if self._backend is None: + self._backend = get_tts_backend() + return self._backend + + async def generate( + self, + text: str, + voice_prompt: dict, + language: str = "en", + seed: Optional[int] = None, + instruct: Optional[str] = None, + ) -> Tuple[np.ndarray, int]: + """Generate speech audio.""" + backend = self._get_backend() + return await backend.generate(text, voice_prompt, language, seed, instruct) + + async def create_voice_prompt( + self, + audio_path: str, + reference_text: str, + use_cache: bool = True, + ) -> Tuple[dict, bool]: + """Create voice prompt from reference audio.""" + backend = self._get_backend() + return await backend.create_voice_prompt(audio_path, reference_text, use_cache) + + async def combine_voice_prompts( + self, + audio_paths: list[str], + reference_texts: list[str], + ) -> Tuple[np.ndarray, str]: + """Combine multiple voice prompts.""" + backend = self._get_backend() + return await backend.combine_voice_prompts(audio_paths, reference_texts) + + async def load_model(self, model_size: str) -> None: + """Load TTS model.""" + backend = self._get_backend() + # Backends use load_model_async, but Protocol defines load_model + if hasattr(backend, 'load_model_async'): + await backend.load_model_async(model_size) + else: + await backend.load_model(model_size) + + def unload_model(self) -> None: + """Unload model to free memory.""" + backend = self._get_backend() + backend.unload_model() + + def is_loaded(self) -> bool: + """Check if model is 
loaded.""" + backend = self._get_backend() + return backend.is_loaded() + + def _get_model_path(self, model_size: str) -> str: + """Get model path for a given size.""" + backend = self._get_backend() + return backend._get_model_path(model_size) + + async def health(self) -> ProviderHealth: + """Get provider health status.""" + backend = self._get_backend() + backend_type = get_backend_type() + + model_size = None + if backend.is_loaded(): + # Try to get current model size from backend + if hasattr(backend, '_current_model_size') and backend._current_model_size: + model_size = backend._current_model_size + + device = None + if backend_type == "mlx": + device = "metal" + elif hasattr(backend, 'device'): + device = backend.device + + return ProviderHealth( + status="healthy", + provider=f"bundled-{backend_type}", + version=None, # Provider versioning not implemented yet + model=model_size, + device=device, + ) + + async def status(self) -> ProviderStatus: + """Get provider model status.""" + backend = self._get_backend() + backend_type = get_backend_type() + + model_size = None + if backend.is_loaded(): + if hasattr(backend, '_current_model_size') and backend._current_model_size: + model_size = backend._current_model_size + + available_sizes = ["1.7B"] + if backend_type == "pytorch": + available_sizes.append("0.6B") + + gpu_available = None + vram_used_mb = None + + if backend_type == "pytorch": + try: + import torch + gpu_available = torch.cuda.is_available() + if gpu_available: + vram_used_mb = torch.cuda.memory_allocated() / 1024 / 1024 + except ImportError: + pass + + return ProviderStatus( + model_loaded=backend.is_loaded(), + model_size=model_size, + available_sizes=available_sizes, + gpu_available=gpu_available, + vram_used_mb=int(vram_used_mb) if vram_used_mb else None, + ) diff --git a/backend/providers/installer.py b/backend/providers/installer.py new file mode 100644 index 00000000..08297b9d --- /dev/null +++ b/backend/providers/installer.py @@ -0,0 +1,211 
@@ +""" +Provider download and installation manager. +""" + +import asyncio +import httpx +import platform +from pathlib import Path +from typing import Optional + +from .types import ProviderType +from ..utils.progress import get_progress_manager +from ..utils.tasks import get_task_manager + + +# Provider version (independent of app version) +PROVIDER_VERSION = "1.0.0" + +# Base URL for provider downloads (Cloudflare R2) +PROVIDER_DOWNLOAD_BASE_URL = "https://downloads.voicebox.sh/providers" + + +def _get_providers_dir() -> Path: + """Get the directory where providers are stored.""" + system = platform.system() + + if system == "Windows": + appdata = Path.home() / "AppData" / "Roaming" + elif system == "Darwin": + appdata = Path.home() / "Library" / "Application Support" + else: # Linux + appdata = Path.home() / ".local" / "share" + + providers_dir = appdata / "voicebox" / "providers" + providers_dir.mkdir(parents=True, exist_ok=True) + return providers_dir + + +def _get_provider_binary_name(provider_type: str) -> str: + """Get the local binary filename for a provider type.""" + system = platform.system() + ext = ".exe" if system == "Windows" else "" + + binary_map = { + "pytorch-cpu": f"tts-provider-pytorch-cpu{ext}", + "pytorch-cuda": f"tts-provider-pytorch-cuda{ext}", + } + + if provider_type not in binary_map: + raise ValueError(f"Unknown provider type: {provider_type}") + + return binary_map[provider_type] + + +def _get_provider_download_name(provider_type: str) -> str: + """Get the remote download filename for a provider type (includes platform suffix).""" + system = platform.system() + + if system == "Windows": + platform_suffix = "windows" + ext = ".exe" + elif system == "Linux": + platform_suffix = "linux" + ext = "" + else: + raise ValueError(f"Provider downloads not supported on {system}") + + return f"tts-provider-{provider_type}-{platform_suffix}{ext}" + + +def _get_provider_download_url(provider_type: str) -> str: + """Get the download URL for a 
provider.""" + download_name = _get_provider_download_name(provider_type) + return f"{PROVIDER_DOWNLOAD_BASE_URL}/v{PROVIDER_VERSION}/{download_name}" + + +async def download_provider(provider_type: str) -> Path: + """ + Download a provider binary from Cloudflare R2. + + Args: + provider_type: Type of provider to download (e.g., "pytorch-cpu") + + Returns: + Path to the downloaded provider binary + + Raises: + ValueError: If provider_type is invalid + httpx.HTTPError: If download fails + """ + if provider_type not in ["pytorch-cpu", "pytorch-cuda"]: + raise ValueError(f"Provider type {provider_type} cannot be downloaded") + + progress_manager = get_progress_manager() + task_manager = get_task_manager() + + binary_name = _get_provider_binary_name(provider_type) + download_url = _get_provider_download_url(provider_type) + destination = _get_providers_dir() / binary_name + + # Start tracking download + task_manager.start_download(provider_type) + + # Initialize progress state + progress_manager.update_progress( + model_name=provider_type, + current=0, + total=0, # Will be updated once we get Content-Length + filename=binary_name, + status="downloading", + ) + + try: + async with httpx.AsyncClient(timeout=300.0) as client: + # First, get the file size + async with client.stream("GET", download_url) as response: + response.raise_for_status() + + # Get total size from Content-Length header + total_size = int(response.headers.get("Content-Length", 0)) + + if total_size > 0: + progress_manager.update_progress( + model_name=provider_type, + current=0, + total=total_size, + filename=binary_name, + status="downloading", + ) + + # Download with progress tracking + downloaded = 0 + with open(destination, "wb") as f: + async for chunk in response.aiter_bytes(chunk_size=8192): + f.write(chunk) + downloaded += len(chunk) + + # Update progress + progress_manager.update_progress( + model_name=provider_type, + current=downloaded, + total=total_size if total_size > 0 else downloaded, 
+ filename=binary_name, + status="downloading", + ) + + # Mark as complete + progress_manager.update_progress( + model_name=provider_type, + current=downloaded, + total=downloaded, + filename=binary_name, + status="complete", + ) + task_manager.complete_download(provider_type) + + # Make executable on Unix systems + if platform.system() != "Windows": + destination.chmod(0o755) + + return destination + + except Exception as e: + # Mark as error + progress_manager.update_progress( + model_name=provider_type, + current=0, + total=0, + filename=binary_name, + status="error", + ) + task_manager.error_download(provider_type, str(e)) + raise + + +def get_provider_binary_path(provider_type: str) -> Optional[Path]: + """ + Get the path to an installed provider binary. + + Args: + provider_type: Type of provider + + Returns: + Path to provider binary, or None if not installed + """ + binary_name = _get_provider_binary_name(provider_type) + provider_path = _get_providers_dir() / binary_name + + if provider_path.exists() and provider_path.is_file(): + return provider_path + + return None + + +def delete_provider(provider_type: str) -> bool: + """ + Delete an installed provider binary. + + Args: + provider_type: Type of provider to delete + + Returns: + True if deleted, False if not found + """ + provider_path = get_provider_binary_path(provider_type) + + if provider_path and provider_path.exists(): + provider_path.unlink() + return True + + return False diff --git a/backend/providers/local.py b/backend/providers/local.py new file mode 100644 index 00000000..1bde7bfe --- /dev/null +++ b/backend/providers/local.py @@ -0,0 +1,187 @@ +""" +Local provider that communicates with standalone provider servers via HTTP. 
+""" + +from typing import Optional, Tuple +import base64 +import io +import numpy as np +import httpx +import soundfile as sf + +from .base import TTSProvider +from .types import ProviderHealth, ProviderStatus + + +class LocalProvider: + """Provider that communicates with local subprocess via HTTP.""" + + def __init__(self, base_url: str): + """ + Initialize local provider. + + Args: + base_url: Base URL of the provider server (e.g., "http://localhost:8000") + """ + self.base_url = base_url.rstrip('/') + self.client = httpx.AsyncClient(timeout=300.0) # 5 minute timeout for generation + + async def generate( + self, + text: str, + voice_prompt: dict, + language: str = "en", + seed: Optional[int] = None, + instruct: Optional[str] = None, + ) -> Tuple[np.ndarray, int]: + """Generate speech audio.""" + response = await self.client.post( + f"{self.base_url}/tts/generate", + json={ + "text": text, + "voice_prompt": voice_prompt, + "language": language, + "seed": seed, + "model_size": "1.7B", # TODO: Make configurable + } + ) + response.raise_for_status() + data = response.json() + + # Decode base64 audio + audio_bytes = base64.b64decode(data["audio"]) + audio_buffer = io.BytesIO(audio_bytes) + audio, sample_rate = sf.read(audio_buffer) + + return audio, data["sample_rate"] + + async def create_voice_prompt( + self, + audio_path: str, + reference_text: str, + use_cache: bool = True, + ) -> Tuple[dict, bool]: + """Create voice prompt from reference audio.""" + # Read audio file + with open(audio_path, 'rb') as f: + audio_data = f.read() + + # Send multipart form data + files = { + "audio": ("audio.wav", audio_data, "audio/wav") + } + data = { + "reference_text": reference_text, + "use_cache": str(use_cache).lower(), + } + + response = await self.client.post( + f"{self.base_url}/tts/create_voice_prompt", + files=files, + data=data, + ) + response.raise_for_status() + result = response.json() + + return result["voice_prompt"], result.get("was_cached", False) + + async def 
combine_voice_prompts( + self, + audio_paths: list[str], + reference_texts: list[str], + ) -> Tuple[np.ndarray, str]: + """ + Combine multiple voice prompts. + + Note: This is not implemented in the provider API yet. + For now, we'll combine locally by concatenating audio. + """ + import numpy as np + from ..utils.audio import load_audio, normalize_audio + + combined_audio = [] + for audio_path in audio_paths: + audio, sr = load_audio(audio_path) + audio = normalize_audio(audio) + combined_audio.append(audio) + + # Concatenate audio + mixed = np.concatenate(combined_audio) + mixed = normalize_audio(mixed) + + # Combine texts + combined_text = " ".join(reference_texts) + + return mixed, combined_text + + async def load_model(self, model_size: str) -> None: + """Load TTS model.""" + # Model loading is handled automatically by the provider server + # when generate() is called, so this is a no-op + pass + + def unload_model(self) -> None: + """Unload model to free memory.""" + # Model unloading is handled by the provider server + # This is a no-op for local providers + pass + + def is_loaded(self) -> bool: + """Check if model is loaded.""" + # We can't know this without querying the provider + # Return True optimistically + return True + + def _get_model_path(self, model_size: str) -> str: + """Get model path for a given size.""" + # For local providers, model paths are handled by the provider server + # Return a placeholder + return f"Qwen/Qwen3-TTS-12Hz-{model_size}-Base" + + async def health(self) -> ProviderHealth: + """Get provider health status.""" + try: + response = await self.client.get(f"{self.base_url}/tts/health") + response.raise_for_status() + data = response.json() + return ProviderHealth( + status=data["status"], + provider=data["provider"], + version=data.get("version"), + model=data.get("model"), + device=data.get("device"), + ) + except Exception as e: + return ProviderHealth( + status="unhealthy", + provider="local", + version=None, + model=None, + 
device=None, + ) + + async def status(self) -> ProviderStatus: + """Get provider model status.""" + try: + response = await self.client.get(f"{self.base_url}/tts/status") + response.raise_for_status() + data = response.json() + return ProviderStatus( + model_loaded=data["model_loaded"], + model_size=data.get("model_size"), + available_sizes=data.get("available_sizes", []), + gpu_available=data.get("gpu_available"), + vram_used_mb=data.get("vram_used_mb"), + ) + except Exception as e: + return ProviderStatus( + model_loaded=False, + model_size=None, + available_sizes=[], + gpu_available=None, + vram_used_mb=None, + ) + + async def stop(self) -> None: + """Stop the provider (close HTTP client).""" + await self.client.aclose() diff --git a/backend/providers/types.py b/backend/providers/types.py new file mode 100644 index 00000000..8229cb74 --- /dev/null +++ b/backend/providers/types.py @@ -0,0 +1,34 @@ +""" +Shared types for TTS providers. +""" + +from typing import Optional, TypedDict +from enum import Enum + + +class ProviderType(str, Enum): + """Available provider types.""" + BUNDLED_MLX = "bundled-mlx" + BUNDLED_PYTORCH = "bundled-pytorch" + PYTORCH_CPU = "pytorch-cpu" + PYTORCH_CUDA = "pytorch-cuda" + REMOTE = "remote" + OPENAI = "openai" + + +class ProviderHealth(TypedDict): + """Provider health status.""" + status: str # "healthy", "unhealthy", "starting" + provider: str + version: Optional[str] + model: Optional[str] + device: Optional[str] + + +class ProviderStatus(TypedDict): + """Provider model status.""" + model_loaded: bool + model_size: Optional[str] + available_sizes: list[str] + gpu_available: Optional[bool] + vram_used_mb: Optional[int] diff --git a/backend/tts.py b/backend/tts.py index 98db3412..0f9cfd5f 100644 --- a/backend/tts.py +++ b/backend/tts.py @@ -1,5 +1,5 @@ """ -TTS inference module - delegates to backend abstraction layer. +TTS inference module - delegates to provider abstraction layer. 
""" from typing import Optional @@ -7,31 +7,51 @@ import io import soundfile as sf -from .backends import get_tts_backend, TTSBackend +from .backends import TTSBackend +from .providers import get_provider_manager +from .providers.base import TTSProvider -def get_tts_model() -> TTSBackend: +def get_tts_model() -> TTSProvider: """ - Get TTS backend instance (MLX or PyTorch based on platform). + Get TTS provider instance (via ProviderManager). Returns: - TTS backend instance + TTS provider instance """ - return get_tts_backend() + manager = get_provider_manager() + # Note: This is async but we need sync interface for backward compatibility + # In practice, this will be called from async contexts + import asyncio + try: + loop = asyncio.get_event_loop() + if loop.is_running(): + # We're in an async context, but can't await here + # Return a wrapper that will use the provider manager + return manager._get_default_provider() + else: + return loop.run_until_complete(manager.get_active_provider()) + except RuntimeError: + # No event loop, return default + return manager._get_default_provider() + + +async def get_tts_model_async() -> TTSProvider: + """ + Get TTS provider instance asynchronously. 
+ + Returns: + TTS provider instance + """ + manager = get_provider_manager() + return await manager.get_active_provider() def unload_tts_model(): """Unload TTS model to free memory.""" - backend = get_tts_backend() - backend.unload_model() - - -def audio_to_wav_bytes(audio: np.ndarray, sample_rate: int) -> bytes: - """Convert audio array to WAV bytes.""" - buffer = io.BytesIO() - sf.write(buffer, audio, sample_rate, format="WAV") - buffer.seek(0) - return buffer.read() + manager = get_provider_manager() + provider = manager._get_default_provider() + provider.unload_model() def audio_to_wav_bytes(audio: np.ndarray, sample_rate: int) -> bytes: diff --git a/docs/plans/TTS_PROVIDER_ARCHITECTURE.md b/docs/plans/TTS_PROVIDER_ARCHITECTURE.md index 8d35a7e5..14d87317 100644 --- a/docs/plans/TTS_PROVIDER_ARCHITECTURE.md +++ b/docs/plans/TTS_PROVIDER_ARCHITECTURE.md @@ -10,14 +10,17 @@ Split the monolithic backend into modular components: -1. **Main App** (~150-200MB): Tauri + FastAPI backend + Whisper + UI/profiles/history -2. **TTS Providers** (downloadable plugins): Separate executables for model inference +1. **Main App**: + - Windows/Linux (~150MB): Tauri + FastAPI backend + Whisper + UI/profiles/history + - macOS (~300MB): Same + MLX bundled for simplicity +2. 
**TTS Providers** (Windows/Linux only): Downloadable executables for PyTorch CPU/CUDA inference This architecture solves: - ✅ GitHub 2GB release artifact limit -- ✅ Frequent app updates without re-downloading large python binaries -- ✅ User choice of compute backend (CPU/GPU/Cloud) +- ✅ Frequent app updates without re-downloading large python binaries (Windows/Linux) +- ✅ User choice of compute backend (CPU/GPU/Cloud) on Windows/Linux +- ✅ Simplified out-of-the-box experience on macOS - ✅ External provider support (OpenAI, custom servers) - ✅ Future extensibility @@ -25,6 +28,7 @@ This architecture solves: ## Architecture Diagram +### Windows / Linux ``` ┌─────────────────────────────────────────────────────────┐ │ Voicebox App (Tauri + Backend) ~150MB │ @@ -39,27 +43,43 @@ This architecture solves: │ HTTP/IPC │ │ - ┌────────────────────────────────┼─────────────────┐ - │ │ │ - ▼ ▼ ▼ -┌─────────────────┐ ┌─────────────────┐ ┌──────────────────┐ -│ TTS Provider: │ │ TTS Provider: │ │ TTS Provider: │ -│ PyTorch CPU │ │ PyTorch CUDA │ │ MLX (Apple) │ -│ │ │ │ │ │ -│ ~300MB │ │ ~2.4GB │ │ ~800MB │ -│ │ │ │ │ │ -│ Local inference │ │ GPU inference │ │ Metal inference │ -└─────────────────┘ └─────────────────┘ └──────────────────┘ - │ │ │ - └────────────────────────┴─────────────────────┘ - │ - ┌─────────────▼──────────────┐ - │ Future Providers: │ - │ • Remote Server │ - │ • OpenAI API │ - │ • ElevenLabs │ - │ • Custom Docker Container │ - └────────────────────────────┘ + ┌─────────────────────┴─────────────────┐ + │ │ + ▼ ▼ + ┌─────────────────────┐ ┌─────────────────────┐ + │ TTS Provider: │ │ TTS Provider: │ + │ PyTorch CPU │ │ PyTorch CUDA │ + │ │ │ │ + │ ~300MB │ │ ~2.4GB │ + │ │ │ │ + │ Local inference │ │ GPU inference │ + └─────────────────────┘ └─────────────────────┘ + │ │ + └───────────────┬───────────────────────┘ + │ + ┌─────────────▼──────────────┐ + │ Future Providers: │ + │ • Remote Server │ + │ • OpenAI API │ + │ • ElevenLabs │ + │ • Custom Docker 
Container │ + └────────────────────────────┘ +``` + +### macOS +``` +┌─────────────────────────────────────────────────────────┐ +│ Voicebox App (Tauri + Backend) ~300MB │ +│ ├─ UI Layer (React) │ +│ ├─ Backend (FastAPI) │ +│ │ ├─ Voice Profiles │ +│ │ ├─ Generation History │ +│ │ ├─ Audio Editing / Stories │ +│ │ └─ MLX Backend (bundled) │ +│ └─ Whisper (bundled, tiny ~50MB) │ +│ │ +│ No provider downloads needed - works out of the box │ +└─────────────────────────────────────────────────────────┘ ``` --- @@ -91,18 +111,20 @@ This architecture solves: #### 1. Main App (voicebox.exe / .app / .AppImage) -**Size:** ~100-150MB +**Windows/Linux Size:** ~100-150MB +**macOS Size:** ~300-350MB (includes MLX) **Includes:** - Tauri runtime + React UI -- FastAPI backend (pure Python, no PyTorch) +- FastAPI backend (pure Python, no PyTorch on Windows/Linux) - Whisper model (tiny, ~50MB) - SQLite database - Profile/history/audio editing logic -- Provider management system +- Provider management system (Windows/Linux only) +- **MLX backend (macOS only, bundled)** -**Does NOT include:** +**Does NOT include (Windows/Linux only):** - PyTorch (CPU or CUDA) - TTS models (Qwen3-TTS) @@ -147,23 +169,7 @@ This architecture solves: --- -#### 4. TTS Provider: MLX - -**Binary:** `tts-provider-mlx` -**Size:** ~150MB - -**Includes:** - -- MLX framework -- MLX-optimized Qwen3-TTS -- Metal acceleration - -**Platform:** macOS only (Apple Silicon) -**Download source:** Cloudflare R2 - ---- - -#### 5. TTS Provider: Remote +#### 4. TTS Provider: Remote **Binary:** None (built-in config) **Size:** 0MB @@ -182,7 +188,7 @@ This architecture solves: --- -#### 6. TTS Provider: OpenAI +#### 5. TTS Provider: OpenAI **Binary:** None (API wrapper) **Size:** 0MB @@ -296,7 +302,10 @@ Model status. ```python class ProviderManager: - """Manages TTS provider lifecycle.""" + """Manages TTS provider lifecycle (Windows/Linux only). + + Note: macOS uses bundled MLX backend directly, no provider management needed. 
+ """ def __init__(self): self.active_provider: Optional[Provider] = None @@ -308,8 +317,6 @@ class ProviderManager: return await self._start_local_provider("tts-provider-pytorch-cpu.exe") elif provider_type == "pytorch-cuda": return await self._start_local_provider("tts-provider-pytorch-cuda.exe") - elif provider_type == "mlx": - return await self._start_local_provider("tts-provider-mlx") elif provider_type == "remote": return self.config["remote_url"] elif provider_type == "openai": @@ -434,15 +441,14 @@ class OpenAIProvider(TTSProvider): ```python class ProviderInstaller: - """Handles provider download and installation.""" + """Handles provider download and installation (Windows/Linux only).""" async def download_provider(self, provider_type: str): """Download provider binary from R2.""" binary_name = { "pytorch-cpu": "tts-provider-pytorch-cpu.exe", - "pytorch-cuda": "tts-provider-pytorch-cuda.exe", - "mlx": "tts-provider-mlx" + "pytorch-cuda": "tts-provider-pytorch-cuda.exe" }[provider_type] download_url = f"https://downloads.voicebox.sh/providers/v{PROVIDER_VERSION}/{binary_name}" @@ -525,44 +531,38 @@ export function ProviderSettings() { )}
- {/* PyTorch CPU */} -
-
- - -
- {!installedProviders?.includes("pytorch-cpu") && ( - - )} -
- - {/* MLX (macOS only) */} - {isMacOS && ( + {/* PyTorch CPU (Windows/Linux only) */} + {!isMacOS && (
- -
- {!installedProviders?.includes("mlx") && ( - )}
)} + {/* MLX bundled (macOS only) */} + {isMacOS && ( +
+
+
MLX (Apple Silicon)
+
+ Bundled with the app - optimized for M1/M2/M3 chips +
+
+
+ )} + {/* Remote */}
@@ -608,14 +608,18 @@ export function ProviderSettings() { ``` voicebox/ ├── backend/ -│ ├── main.py # Main FastAPI app (no TTS code) +│ ├── main.py # Main FastAPI app (no TTS on Win/Linux) +│ ├── backends/ +│ │ ├── __init__.py # Backend abstraction (existing) +│ │ ├── pytorch_backend.py # PyTorch backend (existing, for reference) +│ │ └── mlx_backend.py # MLX backend (bundled in macOS build only) │ ├── providers/ -│ │ ├── __init__.py # ProviderManager -│ │ ├── base.py # TTSProvider ABC +│ │ ├── __init__.py # ProviderManager (Windows/Linux) +│ │ ├── base.py # TTSProvider Protocol │ │ ├── local.py # LocalProvider (subprocess) │ │ ├── remote.py # RemoteProvider (HTTP) │ │ ├── openai.py # OpenAIProvider (API wrapper) -│ │ └── installer.py # Provider download logic +│ │ └── installer.py # Provider download logic (Windows/Linux) │ ├── profiles.py # Voice profile management │ ├── history.py # Generation history │ ├── transcribe.py # Whisper (still bundled) @@ -628,27 +632,22 @@ voicebox/ │ │ ├── requirements.txt # torch (CPU), qwen-tts, transformers │ │ └── build.spec # PyInstaller spec │ │ -│ ├── pytorch-cuda/ -│ │ ├── main.py # FastAPI server for TTS -│ │ ├── tts_backend.py # PyTorch TTS logic -│ │ ├── requirements.txt # torch+cu121, qwen-tts, transformers -│ │ └── build.spec # PyInstaller spec -│ │ -│ └── mlx/ +│ └── pytorch-cuda/ │ ├── main.py # FastAPI server for TTS -│ ├── mlx_backend.py # MLX TTS logic -│ ├── requirements.txt # mlx, qwen-tts-mlx +│ ├── tts_backend.py # PyTorch TTS logic +│ ├── requirements.txt # torch+cu121, qwen-tts, transformers │ └── build.spec # PyInstaller spec │ ├── app/ # Frontend (Tauri + React) │ └── src/ │ └── components/ │ └── ServerSettings/ -│ └── ProviderSettings.tsx +│ └── ProviderSettings.tsx # Only shown on Windows/Linux │ └── tauri/ └── src-tauri/ - └── tauri.conf.json # No externalBin for providers + └── tauri.conf.json # No externalBin for providers (Windows/Linux) + # MLX bundled in macOS build ``` --- @@ -671,33 +670,35 @@ 
voicebox/ ### Phase 2: Build Provider Binaries -**Goal:** Create standalone TTS provider executables +**Goal:** Create standalone TTS provider executables (Windows/Linux only) 1. Create separate PyInstaller specs for each provider 2. Build provider executables: - `tts-provider-pytorch-cpu.exe` (~300MB) - `tts-provider-pytorch-cuda.exe` (~2.4GB) - - `tts-provider-mlx` (~800MB, macOS) 3. Test subprocess communication 4. Upload providers to Cloudflare R2 **Result:** Provider binaries exist but aren't used yet +**Note:** macOS keeps MLX bundled in main app - no separate provider needed + --- ### Phase 3: Remove PyTorch from Main App -**Goal:** Split main app from providers +**Goal:** Split main app from providers (Windows/Linux only) -1. Exclude PyTorch/Qwen3-TTS from main app PyInstaller spec -2. Main app now requires provider download +1. Exclude PyTorch/Qwen3-TTS from Windows/Linux main app PyInstaller spec +2. Windows/Linux app now requires provider download 3. Update GitHub CI to build multiple artifacts: - - `voicebox-{version}-{platform}.exe` (~150MB) + - `voicebox-{version}-windows.exe` (~150MB, no TTS) + - `voicebox-{version}-linux.AppImage` (~150MB, no TTS) + - `voicebox-{version}-macos.app` (~300MB, MLX bundled) - `tts-provider-pytorch-cpu-{version}.exe` - `tts-provider-pytorch-cuda-{version}.exe` - - `tts-provider-mlx-{version}` (macOS) -**Result:** Main app is small, providers downloaded separately +**Result:** Windows/Linux apps are small with downloadable providers, macOS app is self-contained --- @@ -767,7 +768,7 @@ async def check_provider_compatibility(provider_version: str) -> bool: ## User Flows -### First-Time Setup +### First-Time Setup (Windows/Linux) 1. User downloads and installs Voicebox (~150MB) 2. 
App launches → detects no TTS provider installed @@ -784,10 +785,6 @@ async def check_provider_compatibility(provider_version: str) -> bool: ✓ Works on any system ✗ Slower inference - [ ] MLX (800MB) [Download] - ✓ Fast on Apple Silicon - ✗ macOS only (M1/M2/M3) - [ ] Remote Server URL: ___________________ @@ -799,19 +796,31 @@ async def check_provider_compatibility(provider_version: str) -> bool: 5. Provider installs to AppData/Application Support 6. App starts provider → ready to use +### First-Time Setup (macOS) + +1. User downloads and installs Voicebox (~300MB with MLX bundled) +2. App launches → MLX backend is ready immediately +3. No provider setup needed - works out of the box + --- ### App Update Flow (No Provider Change) **Scenario:** Bug fix in UI, no backend changes +**Windows/Linux:** 1. User gets update notification: "Voicebox v0.2.1 available" 2. Downloads update (~150MB, not 2.4GB!) 3. Installs and restarts 4. **Provider stays the same** (no re-download needed) 5. App starts using existing provider -**User experience:** Fast updates, no multi-GB downloads +**macOS:** +1. User gets update notification: "Voicebox v0.2.1 available" +2. Downloads update (~300MB with MLX bundled) +3. 
Installs and restarts - ready to use + +**User experience:** Fast updates, no multi-GB downloads (especially for CUDA users) --- @@ -846,9 +855,10 @@ async def check_provider_compatibility(provider_version: str) -> bool: | Benefit | Details | | ----------------------------- | --------------------------------------------------------- | -| **GitHub Releases Work** | Main app ~150MB << 2GB limit | +| **GitHub Releases Work** | Main app ~150MB (Win/Linux), ~300MB (macOS) << 2GB limit | | **Fast Updates** | UI/feature updates don't require re-downloading providers | -| **User Choice** | CPU, CUDA, MLX, OpenAI, remote server | +| **User Choice** | CPU, CUDA, OpenAI, remote server (Win/Linux) | +| **macOS Simplicity** | MLX bundled - works immediately, no provider setup needed | | **External Provider Support** | Users can run their own TTS servers | | **Bandwidth Savings** | Only download provider once, app updates are small | | **Future-Proof** | Easy to add new providers (ElevenLabs, custom models) | diff --git a/providers/README.md b/providers/README.md new file mode 100644 index 00000000..9ca3e03b --- /dev/null +++ b/providers/README.md @@ -0,0 +1,291 @@ +# TTS Provider Architecture + +This document explains how Voicebox's modular TTS provider system works. + +## Overview + +Voicebox uses a **pluggable provider architecture** that separates the main application from TTS inference. 
This solves several problems: + +- **GitHub's 2GB release limit** - CUDA builds are ~2.4GB, too large for GitHub releases +- **Faster app updates** - UI/feature updates don't require re-downloading heavy ML binaries +- **User choice** - Users can pick CPU, CUDA, or external providers based on their hardware + +## Architecture Diagram + +``` +┌─────────────────────────────────────────────────────────────┐ +│ Voicebox App │ +│ ├─ UI (React) │ +│ ├─ Backend (FastAPI) │ +│ │ ├─ Voice Profiles │ +│ │ ├─ Generation History │ +│ │ ├─ Whisper STT (bundled) │ +│ │ └─ Provider Manager ◄────────────────┐ │ +│ │ │ │ +│ └─ providers/ │ │ +│ ├─ bundled.py (wraps backends/) │ │ +│ └─ local.py (HTTP client)─────────────┼───┐ │ +│ │ │ │ +└────────────────────────────────────────────┼───┼────────────┘ + │ │ + ┌────────────────────┘ │ + │ │ HTTP + ▼ ▼ + ┌──────────────────┐ ┌──────────────────────┐ + │ backends/ │ │ Standalone Provider │ + │ (bundled on Mac) │ │ (subprocess) │ + │ │ │ │ + │ - mlx_backend │ │ - FastAPI server │ + │ - pytorch_backend│ │ - PyTorch + Qwen-TTS │ + └──────────────────┘ │ - Runs on localhost │ + └──────────────────────┘ +``` + +## Platform Behavior + +| Platform | App Size | TTS Backend | Provider Download | +|----------|----------|-------------|-------------------| +| macOS (Apple Silicon) | ~300MB | MLX bundled | Not needed | +| macOS (Intel) | ~300MB | PyTorch bundled | Not needed | +| Windows | ~150MB | None bundled | Required | +| Linux | ~150MB | None bundled | Required | + +### macOS (Apple Silicon) +- MLX backend is **bundled** in the app +- Works immediately after install +- Uses Metal for GPU acceleration + +### macOS (Intel) +- PyTorch backend is **bundled** in the app +- Works immediately after install +- Uses CPU inference + +### Windows / Linux +- **No TTS bundled** - keeps app small (~150MB) +- On first use, prompts to download a provider +- Provider options: + - **PyTorch CPU** (~300MB) - Works on any system + - **PyTorch CUDA** (~2.4GB) - 
Fast inference on NVIDIA GPUs
+
+## Directory Structure
+
+```
+voicebox/
+├── backend/
+│   ├── backends/              # Actual TTS implementations
+│   │   ├── __init__.py        # TTSBackend Protocol
+│   │   ├── mlx_backend.py     # MLX implementation (macOS)
+│   │   └── pytorch_backend.py # PyTorch implementation
+│   │
+│   └── providers/             # Provider abstraction layer
+│       ├── __init__.py        # ProviderManager
+│       ├── base.py            # TTSProvider Protocol
+│       ├── bundled.py         # Wraps backends/ for bundled use
+│       ├── local.py           # HTTP client for subprocess providers
+│       ├── installer.py       # Downloads providers from R2
+│       └── types.py           # Shared types
+│
+└── providers/                 # Standalone provider builds
+    ├── pytorch-cpu/
+    │   ├── main.py            # FastAPI server
+    │   ├── build.py           # PyInstaller build script
+    │   └── requirements.txt
+    │
+    └── pytorch-cuda/
+        ├── main.py            # FastAPI server
+        ├── build.py           # PyInstaller build script
+        └── requirements.txt
+```
+
+## How Providers Work
+
+### 1. BundledProvider (macOS)
+
+On macOS, the `BundledProvider` directly calls the bundled `backends/` code:
+
+```python
+# backend/providers/bundled.py
+class BundledProvider:
+    def __init__(self):
+        self._backend = get_tts_backend()  # MLX or PyTorch
+
+    async def generate(self, text, voice_prompt, ...):
+        return await self._backend.generate(text, voice_prompt, ...)
+```
+
+### 2. LocalProvider (Windows/Linux)
+
+On Windows/Linux, the `LocalProvider` communicates with a standalone provider via HTTP:
+
+```python
+# backend/providers/local.py
+class LocalProvider:
+    def __init__(self, base_url: str):
+        self.base_url = base_url  # e.g., "http://127.0.0.1:8765"
+
+    async def generate(self, text, voice_prompt, ...):
+        response = await self.client.post(
+            f"{self.base_url}/tts/generate",
+            json={"text": text, "voice_prompt": voice_prompt, ...}
+        )
+        # Decode audio from response
+        return audio, sample_rate
+```
+
+### 3. 
Standalone Provider Server + +The standalone providers are self-contained FastAPI servers: + +```python +# providers/pytorch-cpu/main.py +@app.post("/tts/generate") +async def generate(text: str, voice_prompt: dict, ...): + audio, sr = await backend.generate(text, voice_prompt, ...) + return {"audio": base64_encode(audio), "sample_rate": sr} +``` + +## Provider API Specification + +All providers (local or remote) must implement these HTTP endpoints: + +### POST /tts/generate +Generate speech from text. + +**Request:** +```json +{ + "text": "Hello world!", + "voice_prompt": { /* voice embedding */ }, + "language": "en", + "seed": 12345, + "model_size": "1.7B" +} +``` + +**Response:** +```json +{ + "audio": "base64-encoded-wav", + "sample_rate": 24000, + "duration": 2.5 +} +``` + +### POST /tts/create_voice_prompt +Create voice embedding from reference audio. + +**Request:** `multipart/form-data` +- `audio`: Audio file +- `reference_text`: Transcript + +**Response:** +```json +{ + "voice_prompt": { /* voice embedding */ }, + "was_cached": false +} +``` + +### GET /tts/health +Health check. + +**Response:** +```json +{ + "status": "healthy", + "provider": "pytorch-cuda", + "version": "1.0.0", + "model": "1.7B", + "device": "cuda:0" +} +``` + +### GET /tts/status +Model status. + +**Response:** +```json +{ + "model_loaded": true, + "model_size": "1.7B", + "available_sizes": ["0.6B", "1.7B"], + "gpu_available": true, + "vram_used_mb": 1234 +} +``` + +## Provider Lifecycle + +### Startup Flow (Windows/Linux) + +``` +1. App launches +2. ProviderManager checks for installed providers +3. If none installed: + └─ Show setup wizard, prompt download +4. If installed: + ├─ Start provider subprocess on random port + ├─ Wait for /tts/health to return 200 + └─ Create LocalProvider with that URL +5. Generation requests go through LocalProvider → subprocess +``` + +### Download Flow + +``` +1. User clicks "Download PyTorch CUDA" +2. 
Installer downloads from Cloudflare R2: + https://downloads.voicebox.sh/providers/v1.0.0/tts-provider-pytorch-cuda-windows.exe +3. Saved to: + - Windows: %APPDATA%/voicebox/providers/ + - Linux: ~/.local/share/voicebox/providers/ +4. Provider is now available to start +``` + +## Building Providers + +### Prerequisites +- Python 3.12 +- PyInstaller + +### Build PyTorch CPU Provider +```bash +cd providers/pytorch-cpu +pip install -r requirements.txt +python build.py +# Output: dist/tts-provider-pytorch-cpu.exe +``` + +### Build PyTorch CUDA Provider +```bash +cd providers/pytorch-cuda +pip install torch --index-url https://download.pytorch.org/whl/cu121 +pip install -r requirements.txt +python build.py +# Output: dist/tts-provider-pytorch-cuda.exe (~2.4GB) +``` + +## Provider Versioning + +Providers have **independent versions** from the app: + +- **App version:** `v0.2.0` (frequent updates) +- **Provider version:** `v1.0.0` (rare updates) + +Providers only need updates when: +- TTS model changes (new Qwen3-TTS version) +- API spec changes +- Bug fixes in inference code + +The app checks provider compatibility on startup. + +## Future Providers + +The architecture supports additional providers: + +- **Remote Server** - Connect to your own TTS server +- **OpenAI API** - Use OpenAI's TTS (requires API key) +- **ElevenLabs** - Cloud TTS service +- **Docker** - Run providers in containers + +These would implement the same HTTP API spec. diff --git a/providers/pytorch-cpu/build.py b/providers/pytorch-cpu/build.py new file mode 100644 index 00000000..2276b686 --- /dev/null +++ b/providers/pytorch-cpu/build.py @@ -0,0 +1,82 @@ +""" +PyInstaller build script for PyTorch CPU provider. 
+""" + +import PyInstaller.__main__ +import os +import platform +from pathlib import Path + + +def build_provider(): + """Build PyTorch CPU provider as standalone binary.""" + provider_dir = Path(__file__).parent + backend_dir = provider_dir.parent.parent / "backend" + + # PyInstaller arguments + args = [ + 'main.py', + '--onefile', + '--name', 'tts-provider-pytorch-cpu', + ] + + # Add backend to path + args.extend([ + '--paths', str(backend_dir.parent), + ]) + + # Add hidden imports + args.extend([ + '--hidden-import', 'backend', + '--hidden-import', 'backend.backends', + '--hidden-import', 'backend.backends.pytorch_backend', + '--hidden-import', 'backend.config', + '--hidden-import', 'backend.utils.audio', + '--hidden-import', 'backend.utils.cache', + '--hidden-import', 'backend.utils.progress', + '--hidden-import', 'backend.utils.hf_progress', + '--hidden-import', 'backend.utils.tasks', + '--hidden-import', 'torch', + '--hidden-import', 'transformers', + '--hidden-import', 'qwen_tts', + '--hidden-import', 'qwen_tts.inference', + '--hidden-import', 'qwen_tts.inference.qwen3_tts_model', + '--hidden-import', 'qwen_tts.inference.qwen3_tts_tokenizer', + '--hidden-import', 'qwen_tts.core', + '--hidden-import', 'qwen_tts.cli', + '--copy-metadata', 'qwen-tts', + '--collect-submodules', 'qwen_tts', + '--collect-data', 'qwen_tts', + '--hidden-import', 'pkg_resources.extern', + '--collect-submodules', 'jaraco', + '--hidden-import', 'fastapi', + '--hidden-import', 'uvicorn', + '--hidden-import', 'soundfile', + '--hidden-import', 'numpy', + '--hidden-import', 'librosa', + ]) + + # Platform-specific extensions + if platform.system() == "Windows": + args[2] = 'tts-provider-pytorch-cpu.exe' + + args.extend([ + '--noconfirm', + '--clean', + ]) + + # Change to provider directory + os.chdir(provider_dir) + + # Run PyInstaller + PyInstaller.__main__.run(args) + + binary_name = 'tts-provider-pytorch-cpu' + if platform.system() == "Windows": + binary_name += '.exe' + + print(f"Binary 
built in {provider_dir / 'dist' / binary_name}") + + +if __name__ == '__main__': + build_provider() diff --git a/providers/pytorch-cpu/main.py b/providers/pytorch-cpu/main.py new file mode 100644 index 00000000..e295e08b --- /dev/null +++ b/providers/pytorch-cpu/main.py @@ -0,0 +1,238 @@ +""" +Standalone TTS provider server for PyTorch CPU. +""" + +import argparse +import asyncio +import base64 +import io +import sys +from pathlib import Path +from typing import Optional + +import numpy as np +import soundfile as sf +from fastapi import FastAPI, File, Form, HTTPException, UploadFile +from fastapi.middleware.cors import CORSMiddleware +import uvicorn + +# Add parent directory to path to import backend modules +sys.path.insert(0, str(Path(__file__).parent.parent.parent / "backend")) + +from backend.backends.pytorch_backend import PyTorchTTSBackend + + +app = FastAPI(title="Voicebox TTS Provider - PyTorch CPU") + +# CORS middleware +app.add_middleware( + CORSMiddleware, + allow_origins=["*"], + allow_credentials=True, + allow_methods=["*"], + allow_headers=["*"], +) + +# Global backend instance +_backend: Optional[PyTorchTTSBackend] = None + + +def get_backend() -> PyTorchTTSBackend: + """Get or create backend instance.""" + global _backend + if _backend is None: + _backend = PyTorchTTSBackend() + return _backend + + +@app.get("/tts/health") +async def health(): + """Health check endpoint.""" + backend = get_backend() + backend_type = "pytorch-cpu" + + model_size = None + if backend.is_loaded(): + if hasattr(backend, '_current_model_size') and backend._current_model_size: + model_size = backend._current_model_size + + device = backend.device if hasattr(backend, 'device') else "cpu" + + return { + "status": "healthy", + "provider": backend_type, + "version": "1.0.0", # TODO: Get from version file + "model": model_size, + "device": device, + } + + +@app.get("/tts/status") +async def status(): + """Model status endpoint.""" + backend = get_backend() + + model_size = None 
+ if backend.is_loaded(): + if hasattr(backend, '_current_model_size') and backend._current_model_size: + model_size = backend._current_model_size + + available_sizes = ["1.7B", "0.6B"] + + gpu_available = False + vram_used_mb = None + + try: + import torch + gpu_available = torch.cuda.is_available() + if gpu_available: + vram_used_mb = int(torch.cuda.memory_allocated() / 1024 / 1024) + except ImportError: + pass + + return { + "model_loaded": backend.is_loaded(), + "model_size": model_size, + "available_sizes": available_sizes, + "gpu_available": gpu_available, + "vram_used_mb": vram_used_mb, + } + + +@app.post("/tts/generate") +async def generate( + text: str, + voice_prompt: dict, + language: str = "en", + seed: Optional[int] = None, + model_size: str = "1.7B", +): + """ + Generate speech from text. + + Request body (JSON): + { + "text": "Hello world!", + "voice_prompt": {...}, + "language": "en", + "seed": 12345, + "model_size": "1.7B" + } + """ + backend = get_backend() + + # Load model if not loaded or different size + if not backend.is_loaded() or ( + hasattr(backend, '_current_model_size') and + backend._current_model_size != model_size + ): + await backend.load_model_async(model_size) + + # Generate audio + audio, sample_rate = await backend.generate( + text=text, + voice_prompt=voice_prompt, + language=language, + seed=seed, + instruct=None, # TODO: Add instruct support + ) + + # Convert to base64 + buffer = io.BytesIO() + sf.write(buffer, audio, sample_rate, format="WAV") + buffer.seek(0) + audio_bytes = buffer.read() + audio_b64 = base64.b64encode(audio_bytes).decode('utf-8') + + # Calculate duration + duration = len(audio) / sample_rate + + return { + "audio": audio_b64, + "sample_rate": sample_rate, + "duration": duration, + } + + +@app.post("/tts/create_voice_prompt") +async def create_voice_prompt( + audio: UploadFile = File(...), + reference_text: str = Form(...), + use_cache: bool = Form(True), +): + """ + Create voice prompt from reference audio. 
+ + Request (multipart/form-data): + - audio: Audio file + - reference_text: Transcript + - use_cache: Whether to use cached prompts (default: true) + """ + backend = get_backend() + + # Save uploaded file temporarily + import tempfile + with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file: + tmp_path = tmp_file.name + content = await audio.read() + tmp_file.write(content) + + try: + # Create voice prompt + voice_prompt, was_cached = await backend.create_voice_prompt( + audio_path=tmp_path, + reference_text=reference_text, + use_cache=use_cache, + ) + + return { + "voice_prompt": voice_prompt, + "was_cached": was_cached, + } + finally: + # Clean up temp file + Path(tmp_path).unlink(missing_ok=True) + + +def main(): + """Main entry point.""" + parser = argparse.ArgumentParser(description="Voicebox TTS Provider - PyTorch CPU") + parser.add_argument( + "--port", + type=int, + default=0, # 0 means random port + help="Port to bind to", + ) + parser.add_argument( + "--data-dir", + type=str, + default=None, + help="Data directory for models and cache", + ) + args = parser.parse_args() + + # Set data directory if provided + if args.data_dir: + from backend import config + config.set_data_dir(args.data_dir) + + # Determine port + port = args.port + if port == 0: + import socket + with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as s: + s.bind(('', 0)) + port = s.getsockname()[1] + + print(f"Starting TTS Provider (PyTorch CPU) on port {port}") + + uvicorn.run( + app, + host="127.0.0.1", + port=port, + log_level="info", + ) + + +if __name__ == "__main__": + main() diff --git a/providers/pytorch-cpu/requirements.txt b/providers/pytorch-cpu/requirements.txt new file mode 100644 index 00000000..35593b57 --- /dev/null +++ b/providers/pytorch-cpu/requirements.txt @@ -0,0 +1,8 @@ +torch>=2.0.0 +transformers>=4.30.0 +qwen-tts>=0.1.0 +fastapi>=0.100.0 +uvicorn>=0.23.0 +soundfile>=0.12.0 +numpy>=1.24.0 +librosa>=0.10.0 diff --git 
a/providers/pytorch-cuda/build.py b/providers/pytorch-cuda/build.py new file mode 100644 index 00000000..c6e56e7b --- /dev/null +++ b/providers/pytorch-cuda/build.py @@ -0,0 +1,84 @@ +""" +PyInstaller build script for PyTorch CUDA provider. +""" + +import PyInstaller.__main__ +import os +import platform +from pathlib import Path + + +def build_provider(): + """Build PyTorch CUDA provider as standalone binary.""" + provider_dir = Path(__file__).parent + backend_dir = provider_dir.parent.parent / "backend" + + # PyInstaller arguments + args = [ + 'main.py', + '--onefile', + '--name', 'tts-provider-pytorch-cuda', + ] + + # Add backend to path + args.extend([ + '--paths', str(backend_dir.parent), + ]) + + # Add hidden imports + args.extend([ + '--hidden-import', 'backend', + '--hidden-import', 'backend.backends', + '--hidden-import', 'backend.backends.pytorch_backend', + '--hidden-import', 'backend.config', + '--hidden-import', 'backend.utils.audio', + '--hidden-import', 'backend.utils.cache', + '--hidden-import', 'backend.utils.progress', + '--hidden-import', 'backend.utils.hf_progress', + '--hidden-import', 'backend.utils.tasks', + '--hidden-import', 'torch', + '--hidden-import', 'torch.cuda', + '--hidden-import', 'torch.backends.cudnn', + '--hidden-import', 'transformers', + '--hidden-import', 'qwen_tts', + '--hidden-import', 'qwen_tts.inference', + '--hidden-import', 'qwen_tts.inference.qwen3_tts_model', + '--hidden-import', 'qwen_tts.inference.qwen3_tts_tokenizer', + '--hidden-import', 'qwen_tts.core', + '--hidden-import', 'qwen_tts.cli', + '--copy-metadata', 'qwen-tts', + '--collect-submodules', 'qwen_tts', + '--collect-data', 'qwen_tts', + '--hidden-import', 'pkg_resources.extern', + '--collect-submodules', 'jaraco', + '--hidden-import', 'fastapi', + '--hidden-import', 'uvicorn', + '--hidden-import', 'soundfile', + '--hidden-import', 'numpy', + '--hidden-import', 'librosa', + ]) + + # Platform-specific extensions + if platform.system() == "Windows": + args[2] = 
'tts-provider-pytorch-cuda.exe' + + args.extend([ + '--noconfirm', + '--clean', + ]) + + # Change to provider directory + os.chdir(provider_dir) + + # Run PyInstaller + PyInstaller.__main__.run(args) + + binary_name = 'tts-provider-pytorch-cuda' + if platform.system() == "Windows": + binary_name += '.exe' + + print(f"Binary built in {provider_dir / 'dist' / binary_name}") + + +if __name__ == '__main__': + build_provider() diff --git a/providers/pytorch-cuda/main.py b/providers/pytorch-cuda/main.py new file mode 100644 index 00000000..a89782ff --- /dev/null +++ b/providers/pytorch-cuda/main.py @@ -0,0 +1,238 @@ +""" +Standalone TTS provider server for PyTorch CUDA. +""" + +import argparse +import asyncio +import base64 +import io +import sys +from pathlib import Path +from typing import Optional + +import numpy as np +import soundfile as sf +from fastapi import FastAPI, File, Form, HTTPException, UploadFile +from fastapi.middleware.cors import CORSMiddleware +import uvicorn + +# Add parent directory to path to import backend modules +sys.path.insert(0, str(Path(__file__).parent.parent.parent / "backend")) + +from backend.backends.pytorch_backend import PyTorchTTSBackend + + +app = FastAPI(title="Voicebox TTS Provider - PyTorch CUDA") + +# CORS middleware +app.add_middleware( + CORSMiddleware, + allow_origins=["*"], + allow_credentials=True, + allow_methods=["*"], + allow_headers=["*"], +) + +# Global backend instance +_backend: Optional[PyTorchTTSBackend] = None + + +def get_backend() -> PyTorchTTSBackend: + """Get or create backend instance.""" + global _backend + if _backend is None: + _backend = PyTorchTTSBackend() + return _backend + + +@app.get("/tts/health") +async def health(): + """Health check endpoint.""" + backend = get_backend() + backend_type = "pytorch-cuda" + + model_size = None + if backend.is_loaded(): + if hasattr(backend, '_current_model_size') and backend._current_model_size: + model_size = backend._current_model_size + + device = backend.device 
if hasattr(backend, 'device') else "cpu" + + return { + "status": "healthy", + "provider": backend_type, + "version": "1.0.0", # TODO: Get from version file + "model": model_size, + "device": device, + } + + +@app.get("/tts/status") +async def status(): + """Model status endpoint.""" + backend = get_backend() + + model_size = None + if backend.is_loaded(): + if hasattr(backend, '_current_model_size') and backend._current_model_size: + model_size = backend._current_model_size + + available_sizes = ["1.7B", "0.6B"] + + gpu_available = False + vram_used_mb = None + + try: + import torch + gpu_available = torch.cuda.is_available() + if gpu_available: + vram_used_mb = int(torch.cuda.memory_allocated() / 1024 / 1024) + except ImportError: + pass + + return { + "model_loaded": backend.is_loaded(), + "model_size": model_size, + "available_sizes": available_sizes, + "gpu_available": gpu_available, + "vram_used_mb": vram_used_mb, + } + + +@app.post("/tts/generate") +async def generate( + text: str, + voice_prompt: dict, + language: str = "en", + seed: Optional[int] = None, + model_size: str = "1.7B", +): + """ + Generate speech from text. 
+ + Request body (JSON): + { + "text": "Hello world!", + "voice_prompt": {...}, + "language": "en", + "seed": 12345, + "model_size": "1.7B" + } + """ + backend = get_backend() + + # Load model if not loaded or different size + if not backend.is_loaded() or ( + hasattr(backend, '_current_model_size') and + backend._current_model_size != model_size + ): + await backend.load_model_async(model_size) + + # Generate audio + audio, sample_rate = await backend.generate( + text=text, + voice_prompt=voice_prompt, + language=language, + seed=seed, + instruct=None, # TODO: Add instruct support + ) + + # Convert to base64 + buffer = io.BytesIO() + sf.write(buffer, audio, sample_rate, format="WAV") + buffer.seek(0) + audio_bytes = buffer.read() + audio_b64 = base64.b64encode(audio_bytes).decode('utf-8') + + # Calculate duration + duration = len(audio) / sample_rate + + return { + "audio": audio_b64, + "sample_rate": sample_rate, + "duration": duration, + } + + +@app.post("/tts/create_voice_prompt") +async def create_voice_prompt( + audio: UploadFile = File(...), + reference_text: str = Form(...), + use_cache: bool = Form(True), +): + """ + Create voice prompt from reference audio. 
+ + Request (multipart/form-data): + - audio: Audio file + - reference_text: Transcript + - use_cache: Whether to use cached prompts (default: true) + """ + backend = get_backend() + + # Save uploaded file temporarily + import tempfile + with tempfile.NamedTemporaryFile(delete=False, suffix=".wav") as tmp_file: + tmp_path = tmp_file.name + content = await audio.read() + tmp_file.write(content) + + try: + # Create voice prompt + voice_prompt, was_cached = await backend.create_voice_prompt( + audio_path=tmp_path, + reference_text=reference_text, + use_cache=use_cache, + ) + + return { + "voice_prompt": voice_prompt, + "was_cached": was_cached, + } + finally: + # Clean up temp file + Path(tmp_path).unlink(missing_ok=True) + + +def main(): + """Main entry point.""" + parser = argparse.ArgumentParser(description="Voicebox TTS Provider - PyTorch CUDA") + parser.add_argument( + "--port", + type=int, + default=0, # 0 means random port + help="Port to bind to", + ) + parser.add_argument( + "--data-dir", + type=str, + default=None, + help="Data directory for models and cache", + ) + args = parser.parse_args() + + # Set data directory if provided + if args.data_dir: + from backend import config + config.set_data_dir(args.data_dir) + + # Determine port + port = args.port + if port == 0: + import socket + with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as s: + s.bind(('', 0)) + port = s.getsockname()[1] + + print(f"Starting TTS Provider (PyTorch CUDA) on port {port}") + + uvicorn.run( + app, + host="127.0.0.1", + port=port, + log_level="info", + ) + + +if __name__ == "__main__": + main() diff --git a/providers/pytorch-cuda/requirements.txt b/providers/pytorch-cuda/requirements.txt new file mode 100644 index 00000000..0f5eafd0 --- /dev/null +++ b/providers/pytorch-cuda/requirements.txt @@ -0,0 +1,10 @@ +torch>=2.0.0 --index-url https://download.pytorch.org/whl/cu121 +torchvision>=0.15.0 --index-url https://download.pytorch.org/whl/cu121 +torchaudio>=2.0.0 --index-url 
https://download.pytorch.org/whl/cu121 +transformers>=4.30.0 +qwen-tts>=0.1.0 +fastapi>=0.100.0 +uvicorn>=0.23.0 +soundfile>=0.12.0 +numpy>=1.24.0 +librosa>=0.10.0 From d89521559aa0bb9d3266ff3967eb0319ba9f74ca Mon Sep 17 00:00:00 2001 From: Jamie Pine Date: Sat, 31 Jan 2026 03:09:49 -0800 Subject: [PATCH 02/33] Update LocalProvider to manage model size dynamically and clean up build scripts - Introduced a new attribute `_current_model_size` in `LocalProvider` to store the current model size, allowing for dynamic configuration during generation. - Updated the `generate` method to use the current model size instead of a hardcoded value. - Modified the `load_model` method to track the requested model size. - Removed platform-specific extension handling from the build scripts for both CPU and CUDA providers to streamline the build process. --- backend/providers/local.py | 9 +++++---- providers/pytorch-cpu/build.py | 4 ---- providers/pytorch-cuda/build.py | 4 ---- 3 files changed, 5 insertions(+), 12 deletions(-) diff --git a/backend/providers/local.py b/backend/providers/local.py index 1bde7bfe..004e6fc3 100644 --- a/backend/providers/local.py +++ b/backend/providers/local.py @@ -25,6 +25,7 @@ def __init__(self, base_url: str): """ self.base_url = base_url.rstrip('/') self.client = httpx.AsyncClient(timeout=300.0) # 5 minute timeout for generation + self._current_model_size = "1.7B" # Default model size async def generate( self, @@ -42,7 +43,7 @@ async def generate( "voice_prompt": voice_prompt, "language": language, "seed": seed, - "model_size": "1.7B", # TODO: Make configurable + "model_size": self._current_model_size, } ) response.raise_for_status() @@ -116,9 +117,9 @@ async def combine_voice_prompts( async def load_model(self, model_size: str) -> None: """Load TTS model.""" - # Model loading is handled automatically by the provider server - # when generate() is called, so this is a no-op - pass + # Track the requested model size - the provider server will load it + 
# when generate() is called with this size + self._current_model_size = model_size def unload_model(self) -> None: """Unload model to free memory.""" diff --git a/providers/pytorch-cpu/build.py b/providers/pytorch-cpu/build.py index 2276b686..8894edcb 100644 --- a/providers/pytorch-cpu/build.py +++ b/providers/pytorch-cpu/build.py @@ -56,10 +56,6 @@ def build_provider(): '--hidden-import', 'librosa', ]) - # Platform-specific extensions - if platform.system() == "Windows": - args[2] = 'tts-provider-pytorch-cpu.exe' - args.extend([ '--noconfirm', '--clean', diff --git a/providers/pytorch-cuda/build.py b/providers/pytorch-cuda/build.py index c6e56e7b..8ff67334 100644 --- a/providers/pytorch-cuda/build.py +++ b/providers/pytorch-cuda/build.py @@ -58,10 +58,6 @@ def build_provider(): '--hidden-import', 'librosa', ]) - # Platform-specific extensions - if platform.system() == "Windows": - args[2] = 'tts-provider-pytorch-cuda.exe' - args.extend([ '--noconfirm', '--clean', From ec9402c568c3104cb55532721541c49bddd18ccd Mon Sep 17 00:00:00 2001 From: Jamie Pine Date: Sat, 31 Jan 2026 03:11:34 -0800 Subject: [PATCH 03/33] Update qwen-tts version in requirements for CPU and CUDA providers from 0.1.0 to 0.0.5 --- providers/pytorch-cpu/requirements.txt | 2 +- providers/pytorch-cuda/requirements.txt | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/providers/pytorch-cpu/requirements.txt b/providers/pytorch-cpu/requirements.txt index 35593b57..3f4144e3 100644 --- a/providers/pytorch-cpu/requirements.txt +++ b/providers/pytorch-cpu/requirements.txt @@ -1,6 +1,6 @@ torch>=2.0.0 transformers>=4.30.0 -qwen-tts>=0.1.0 +qwen-tts>=0.0.5 fastapi>=0.100.0 uvicorn>=0.23.0 soundfile>=0.12.0 diff --git a/providers/pytorch-cuda/requirements.txt b/providers/pytorch-cuda/requirements.txt index 0f5eafd0..5a106503 100644 --- a/providers/pytorch-cuda/requirements.txt +++ b/providers/pytorch-cuda/requirements.txt @@ -2,7 +2,7 @@ torch>=2.0.0 --index-url 
https://download.pytorch.org/whl/cu121 torchvision>=0.15.0 --index-url https://download.pytorch.org/whl/cu121 torchaudio>=2.0.0 --index-url https://download.pytorch.org/whl/cu121 transformers>=4.30.0 -qwen-tts>=0.1.0 +qwen-tts>=0.0.5 fastapi>=0.100.0 uvicorn>=0.23.0 soundfile>=0.12.0 From ec0fb601978d1983abc8eecf4ba88f30c395996c Mon Sep 17 00:00:00 2001 From: Jamie Pine Date: Sat, 31 Jan 2026 03:40:27 -0800 Subject: [PATCH 04/33] Enhance release workflow and add radio group component - Updated the release workflow to include a new configuration for the Ubuntu 22.04 platform without TTS bundled. - Added the @radix-ui/react-radio-group dependency to package.json. - Implemented a new RadioGroup component for better UI handling of radio inputs. --- .github/workflows/release.yml | 8 ++--- app/package.json | 1 + app/src/components/ui/radio-group.tsx | 44 +++++++++++++++++++++++++++ 3 files changed, 49 insertions(+), 4 deletions(-) create mode 100644 app/src/components/ui/radio-group.tsx diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index de067112..07f5c98d 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -132,10 +132,10 @@ jobs: python-version: "3.12" backend: "pytorch" # Linux - No TTS bundled, providers downloaded separately - # - platform: 'ubuntu-22.04' - # args: '' - # python-version: '3.12' - # backend: 'none' + - platform: "ubuntu-22.04" + args: "" + python-version: "3.12" + backend: "none" # Windows - No TTS bundled, providers downloaded separately - platform: "windows-latest" args: "" diff --git a/app/package.json b/app/package.json index 905dea23..00170cca 100644 --- a/app/package.json +++ b/app/package.json @@ -24,6 +24,7 @@ "@radix-ui/react-label": "^2.1.0", "@radix-ui/react-popover": "^1.1.1", "@radix-ui/react-progress": "^1.1.0", + "@radix-ui/react-radio-group": "^1.2.0", "@radix-ui/react-scroll-area": "^1.1.0", "@radix-ui/react-select": "^2.1.1", "@radix-ui/react-separator": "^1.1.0", diff --git 
a/app/src/components/ui/radio-group.tsx b/app/src/components/ui/radio-group.tsx new file mode 100644 index 00000000..fed418e6 --- /dev/null +++ b/app/src/components/ui/radio-group.tsx @@ -0,0 +1,44 @@ +"use client" + +import * as React from "react" +import * as RadioGroupPrimitive from "@radix-ui/react-radio-group" +import { Circle } from "lucide-react" + +import { cn } from "@/lib/utils/cn" + +const RadioGroup = React.forwardRef< + React.ElementRef, + React.ComponentPropsWithoutRef +>(({ className, ...props }, ref) => { + return ( + + ) +}) +RadioGroup.displayName = RadioGroupPrimitive.Root.displayName + +const RadioGroupItem = React.forwardRef< + React.ElementRef, + React.ComponentPropsWithoutRef +>(({ className, ...props }, ref) => { + return ( + + + + + + ) +}) +RadioGroupItem.displayName = RadioGroupPrimitive.Item.displayName + +export { RadioGroup, RadioGroupItem } From ce4269ffa545cd9b908cb9df916718fcd9784a7f Mon Sep 17 00:00:00 2001 From: Jamie Pine Date: Sat, 31 Jan 2026 03:45:41 -0800 Subject: [PATCH 05/33] Refactor build scripts and update release workflow - Commented out the PyTorch CPU configuration in the release workflow for Ubuntu 22.04. - Updated TTS provider documentation to clarify options for Windows and Linux users. - Enhanced build scripts for both CPU and CUDA providers by excluding large unused modules to reduce binary size. 
--- .github/workflows/release.yml | 12 ++++++------ providers/pytorch-cpu/build.py | 18 ++++++++++++++++++ providers/pytorch-cuda/build.py | 18 ++++++++++++++++++ 3 files changed, 42 insertions(+), 6 deletions(-) diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index 07f5c98d..ebf84c01 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -28,9 +28,9 @@ jobs: provider: "pytorch-cuda" python-version: "3.12" # PyTorch CPU provider (Linux) - - platform: "ubuntu-22.04" - provider: "pytorch-cpu" - python-version: "3.12" + # - platform: "ubuntu-22.04" + # provider: "pytorch-cpu" + # python-version: "3.12" # PyTorch CUDA provider (Linux) - large binary, uploaded to R2 - platform: "ubuntu-22.04" provider: "pytorch-cuda" @@ -268,10 +268,10 @@ jobs: - **Windows**: Download the `.msi` installer - requires downloading a TTS provider on first use - **Linux**: Download the `.AppImage` or `.deb` package - requires downloading a TTS provider on first use - ### TTS Providers (Windows/Linux) + ### TTS Providers Windows and Linux users will be prompted to download a TTS provider on first launch: - - **PyTorch CPU** (~300MB) - Works on any system - - **PyTorch CUDA** (~2.4GB) - 4-5x faster on NVIDIA GPUs + - **Windows**: PyTorch CPU (~300MB) or PyTorch CUDA (~2.4GB for NVIDIA GPUs) + - **Linux**: PyTorch CUDA (~2.4GB) - requires NVIDIA GPU The app includes automatic updates - future updates will be installed automatically. 
releaseDraft: true diff --git a/providers/pytorch-cpu/build.py b/providers/pytorch-cpu/build.py index 8894edcb..6596c266 100644 --- a/providers/pytorch-cpu/build.py +++ b/providers/pytorch-cpu/build.py @@ -56,6 +56,24 @@ def build_provider(): '--hidden-import', 'librosa', ]) + # Exclude large unused modules to reduce binary size + args.extend([ + '--exclude-module', 'torch.utils.tensorboard', + '--exclude-module', 'tensorboard', + '--exclude-module', 'triton', + '--exclude-module', 'torch.distributed', + '--exclude-module', 'torch._dynamo', + '--exclude-module', 'torch._inductor', + '--exclude-module', 'torch.testing', + '--exclude-module', 'torch.utils.benchmark', + '--exclude-module', 'IPython', + '--exclude-module', 'matplotlib', + '--exclude-module', 'PIL', + '--exclude-module', 'cv2', + '--exclude-module', 'torchvision', + '--exclude-module', 'torchaudio', + ]) + args.extend([ '--noconfirm', '--clean', diff --git a/providers/pytorch-cuda/build.py b/providers/pytorch-cuda/build.py index 8ff67334..565885b2 100644 --- a/providers/pytorch-cuda/build.py +++ b/providers/pytorch-cuda/build.py @@ -58,6 +58,24 @@ def build_provider(): '--hidden-import', 'librosa', ]) + # Exclude large unused modules to reduce binary size + args.extend([ + '--exclude-module', 'torch.utils.tensorboard', + '--exclude-module', 'tensorboard', + '--exclude-module', 'triton', + '--exclude-module', 'torch.distributed', + '--exclude-module', 'torch._dynamo', + '--exclude-module', 'torch._inductor', + '--exclude-module', 'torch.testing', + '--exclude-module', 'torch.utils.benchmark', + '--exclude-module', 'IPython', + '--exclude-module', 'matplotlib', + '--exclude-module', 'PIL', + '--exclude-module', 'cv2', + '--exclude-module', 'torchvision', + '--exclude-module', 'torchaudio', + ]) + args.extend([ '--noconfirm', '--clean', From ab10c26ce44a98692048c61b2fea293ff62a6931 Mon Sep 17 00:00:00 2001 From: Jamie Pine Date: Sat, 31 Jan 2026 04:11:30 -0800 Subject: [PATCH 06/33] Update release workflow 
to include libasound2-dev dependency for Ubuntu 22.04 --- .github/workflows/release.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml index ebf84c01..cce4670b 100644 --- a/.github/workflows/release.yml +++ b/.github/workflows/release.yml @@ -151,7 +151,7 @@ jobs: if: matrix.platform == 'ubuntu-22.04' run: | sudo apt-get update - sudo apt-get install -y libwebkit2gtk-4.1-dev libappindicator3-dev librsvg2-dev patchelf llvm-dev + sudo apt-get install -y libwebkit2gtk-4.1-dev libappindicator3-dev librsvg2-dev patchelf llvm-dev libasound2-dev - name: Install LLVM (macOS) if: matrix.platform == 'macos-latest' || matrix.platform == 'macos-15-intel' From a52ff7d9504a5fba5d446b34ebe49ec5fda90c33 Mon Sep 17 00:00:00 2001 From: Jamie Pine Date: Sat, 31 Jan 2026 05:10:27 -0800 Subject: [PATCH 07/33] Add Linux audio capture module with unsupported functionality - Introduced a new `linux.rs` module for audio capture, indicating that audio capture is not supported on Linux at this time. - Updated `mod.rs` to include the Linux module conditionally based on the target OS. --- tauri/src-tauri/src/audio_capture/linux.rs | 16 ++++++++++++++++ tauri/src-tauri/src/audio_capture/mod.rs | 4 ++++ 2 files changed, 20 insertions(+) create mode 100644 tauri/src-tauri/src/audio_capture/linux.rs diff --git a/tauri/src-tauri/src/audio_capture/linux.rs b/tauri/src-tauri/src/audio_capture/linux.rs new file mode 100644 index 00000000..7550e086 --- /dev/null +++ b/tauri/src-tauri/src/audio_capture/linux.rs @@ -0,0 +1,16 @@ +use crate::audio_capture::AudioCaptureState; + +pub async fn start_capture( + _state: &AudioCaptureState, + _max_duration_secs: u32, +) -> Result<(), String> { + Err("Audio capture is not supported on Linux, YET. 
Use the built-in recording features instead.".to_string()) +} + +pub async fn stop_capture(_state: &AudioCaptureState) -> Result { + Err("Audio capture is not supported on Linux.".to_string()) +} + +pub fn is_supported() -> bool { + false +} diff --git a/tauri/src-tauri/src/audio_capture/mod.rs b/tauri/src-tauri/src/audio_capture/mod.rs index 7a55c334..a67bf795 100644 --- a/tauri/src-tauri/src/audio_capture/mod.rs +++ b/tauri/src-tauri/src/audio_capture/mod.rs @@ -2,11 +2,15 @@ mod macos; #[cfg(target_os = "windows")] mod windows; +#[cfg(target_os = "linux")] +mod linux; #[cfg(target_os = "macos")] pub use macos::*; #[cfg(target_os = "windows")] pub use windows::*; +#[cfg(target_os = "linux")] +pub use linux::*; use std::sync::{Arc, Mutex}; From 942064912a3bdd6fec0e5517773b3bb88e51234a Mon Sep 17 00:00:00 2001 From: Jamie Pine Date: Sat, 31 Jan 2026 20:18:27 -0800 Subject: [PATCH 08/33] Update TTS provider methods and dependencies - Renamed `load_model` to `load_model_async` in TTS provider classes for clarity and consistency. - Added compatibility alias for `load_model` to maintain existing functionality. - Enhanced `get_model_status` to handle both synchronous and asynchronous check functions. - Updated version numbers in `bun.lock` and `Cargo.lock` to 0.1.12, reflecting recent changes. 
--- backend/main.py | 14 ++++++++++++-- backend/providers/base.py | 2 +- backend/providers/bundled.py | 6 ++++-- backend/providers/local.py | 5 ++++- bun.lock | 11 +++++++---- tauri/src-tauri/Cargo.lock | 2 +- 6 files changed, 29 insertions(+), 11 deletions(-) diff --git a/backend/main.py b/backend/main.py index 3bd4b7e6..f6d00a1f 100644 --- a/backend/main.py +++ b/backend/main.py @@ -1362,7 +1362,12 @@ def check_whisper_loaded(model_size: str): if asyncio.iscoroutinefunction(check_func): loaded = await check_func() else: - loaded = check_func() + result = check_func() + # Handle lambdas that return coroutines + if asyncio.iscoroutine(result): + loaded = await result + else: + loaded = result except Exception: loaded = False @@ -1389,7 +1394,12 @@ def check_whisper_loaded(model_size: str): if asyncio.iscoroutinefunction(check_func): loaded = await check_func() else: - loaded = check_func() + result = check_func() + # Handle lambdas that return coroutines + if asyncio.iscoroutine(result): + loaded = await result + else: + loaded = result except Exception: loaded = False diff --git a/backend/providers/base.py b/backend/providers/base.py index f3a6b4c2..50b05ce0 100644 --- a/backend/providers/base.py +++ b/backend/providers/base.py @@ -72,7 +72,7 @@ async def combine_voice_prompts( """ ... - async def load_model(self, model_size: str) -> None: + async def load_model_async(self, model_size: str) -> None: """Load TTS model.""" ... 
diff --git a/backend/providers/bundled.py b/backend/providers/bundled.py index b4a5e2ca..9c37e23c 100644 --- a/backend/providers/bundled.py +++ b/backend/providers/bundled.py @@ -55,14 +55,16 @@ async def combine_voice_prompts( backend = self._get_backend() return await backend.combine_voice_prompts(audio_paths, reference_texts) - async def load_model(self, model_size: str) -> None: + async def load_model_async(self, model_size: str) -> None: """Load TTS model.""" backend = self._get_backend() - # Backends use load_model_async, but Protocol defines load_model if hasattr(backend, 'load_model_async'): await backend.load_model_async(model_size) else: await backend.load_model(model_size) + + # Alias for compatibility + load_model = load_model_async def unload_model(self) -> None: """Unload model to free memory.""" diff --git a/backend/providers/local.py b/backend/providers/local.py index 004e6fc3..3ea4d75b 100644 --- a/backend/providers/local.py +++ b/backend/providers/local.py @@ -115,11 +115,14 @@ async def combine_voice_prompts( return mixed, combined_text - async def load_model(self, model_size: str) -> None: + async def load_model_async(self, model_size: str) -> None: """Load TTS model.""" # Track the requested model size - the provider server will load it # when generate() is called with this size self._current_model_size = model_size + + # Alias for compatibility + load_model = load_model_async def unload_model(self) -> None: """Unload model to free memory.""" diff --git a/bun.lock b/bun.lock index 9e08a825..3879020e 100644 --- a/bun.lock +++ b/bun.lock @@ -13,7 +13,7 @@ }, "app": { "name": "@voicebox/app", - "version": "0.1.11", + "version": "0.1.12", "dependencies": { "@dnd-kit/core": "^6.3.1", "@dnd-kit/sortable": "^10.0.0", @@ -26,6 +26,7 @@ "@radix-ui/react-label": "^2.1.0", "@radix-ui/react-popover": "^1.1.1", "@radix-ui/react-progress": "^1.1.0", + "@radix-ui/react-radio-group": "^1.2.0", "@radix-ui/react-scroll-area": "^1.1.0", "@radix-ui/react-select": 
"^2.1.1", "@radix-ui/react-separator": "^1.1.0", @@ -68,7 +69,7 @@ }, "landing": { "name": "@voicebox/landing", - "version": "0.1.11", + "version": "0.1.12", "dependencies": { "@radix-ui/react-separator": "^1.1.8", "@radix-ui/react-slot": "^1.2.4", @@ -93,7 +94,7 @@ }, "tauri": { "name": "@voicebox/tauri", - "version": "0.1.11", + "version": "0.1.12", "dependencies": { "@tauri-apps/api": "^2.0.0", "@tauri-apps/plugin-dialog": "^2.0.0", @@ -116,7 +117,7 @@ }, "web": { "name": "@voicebox/web", - "version": "0.1.11", + "version": "0.1.12", "dependencies": { "@tanstack/react-query": "^5.0.0", "react": "^18.3.0", @@ -407,6 +408,8 @@ "@radix-ui/react-progress": ["@radix-ui/react-progress@1.1.8", "", { "dependencies": { "@radix-ui/react-context": "1.1.3", "@radix-ui/react-primitive": "2.1.4" }, "peerDependencies": { "@types/react": "*", "@types/react-dom": "*", "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc", "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc" }, "optionalPeers": ["@types/react", "@types/react-dom"] }, "sha512-+gISHcSPUJ7ktBy9RnTqbdKW78bcGke3t6taawyZ71pio1JewwGSJizycs7rLhGTvMJYCQB1DBK4KQsxs7U8dA=="], + "@radix-ui/react-radio-group": ["@radix-ui/react-radio-group@1.3.8", "", { "dependencies": { "@radix-ui/primitive": "1.1.3", "@radix-ui/react-compose-refs": "1.1.2", "@radix-ui/react-context": "1.1.2", "@radix-ui/react-direction": "1.1.1", "@radix-ui/react-presence": "1.1.5", "@radix-ui/react-primitive": "2.1.3", "@radix-ui/react-roving-focus": "1.1.11", "@radix-ui/react-use-controllable-state": "1.2.2", "@radix-ui/react-use-previous": "1.1.1", "@radix-ui/react-use-size": "1.1.1" }, "peerDependencies": { "@types/react": "*", "@types/react-dom": "*", "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc", "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc" }, "optionalPeers": ["@types/react", "@types/react-dom"] }, "sha512-VBKYIYImA5zsxACdisNQ3BjCBfmbGH3kQlnFVqlWU4tXwjy7cGX8ta80BcrO+WJXIn5iBylEH3K6ZTlee//lgQ=="], + 
"@radix-ui/react-roving-focus": ["@radix-ui/react-roving-focus@1.1.11", "", { "dependencies": { "@radix-ui/primitive": "1.1.3", "@radix-ui/react-collection": "1.1.7", "@radix-ui/react-compose-refs": "1.1.2", "@radix-ui/react-context": "1.1.2", "@radix-ui/react-direction": "1.1.1", "@radix-ui/react-id": "1.1.1", "@radix-ui/react-primitive": "2.1.3", "@radix-ui/react-use-callback-ref": "1.1.1", "@radix-ui/react-use-controllable-state": "1.2.2" }, "peerDependencies": { "@types/react": "*", "@types/react-dom": "*", "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc", "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc" }, "optionalPeers": ["@types/react", "@types/react-dom"] }, "sha512-7A6S9jSgm/S+7MdtNDSb+IU859vQqJ/QAtcYQcfFC6W8RS4IxIZDldLR0xqCFZ6DCyrQLjLPsxtTNch5jVA4lA=="], "@radix-ui/react-scroll-area": ["@radix-ui/react-scroll-area@1.2.10", "", { "dependencies": { "@radix-ui/number": "1.1.1", "@radix-ui/primitive": "1.1.3", "@radix-ui/react-compose-refs": "1.1.2", "@radix-ui/react-context": "1.1.2", "@radix-ui/react-direction": "1.1.1", "@radix-ui/react-presence": "1.1.5", "@radix-ui/react-primitive": "2.1.3", "@radix-ui/react-use-callback-ref": "1.1.1", "@radix-ui/react-use-layout-effect": "1.1.1" }, "peerDependencies": { "@types/react": "*", "@types/react-dom": "*", "react": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc", "react-dom": "^16.8 || ^17.0 || ^18.0 || ^19.0 || ^19.0.0-rc" }, "optionalPeers": ["@types/react", "@types/react-dom"] }, "sha512-tAXIa1g3sM5CGpVT0uIbUx/U3Gs5N8T52IICuCtObaos1S8fzsrPXG5WObkQN3S6NVl6wKgPhAIiBGbWnvc97A=="], diff --git a/tauri/src-tauri/Cargo.lock b/tauri/src-tauri/Cargo.lock index 4528097c..35b15188 100644 --- a/tauri/src-tauri/Cargo.lock +++ b/tauri/src-tauri/Cargo.lock @@ -5041,7 +5041,7 @@ checksum = "0b928f33d975fc6ad9f86c8f283853ad26bdd5b10b7f1542aa2fa15e2289105a" [[package]] name = "voicebox" -version = "0.1.11" +version = "0.1.12" dependencies = [ "base64 0.22.1", "core-foundation-sys", From 
dcbdf3e89b01b6b5784ed3e75b548ba42ec7c928 Mon Sep 17 00:00:00 2001 From: Jamie Pine Date: Sat, 31 Jan 2026 20:18:32 -0800 Subject: [PATCH 09/33] =?UTF-8?q?Bump=20version:=200.1.12=20=E2=86=92=200.?= =?UTF-8?q?1.13?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .bumpversion.cfg | 2 +- app/package.json | 2 +- backend/__init__.py | 2 +- landing/package.json | 2 +- package.json | 2 +- tauri/package.json | 2 +- tauri/src-tauri/Cargo.toml | 2 +- tauri/src-tauri/tauri.conf.json | 2 +- web/package.json | 2 +- 9 files changed, 9 insertions(+), 9 deletions(-) diff --git a/.bumpversion.cfg b/.bumpversion.cfg index 37ef7924..151a8ac0 100644 --- a/.bumpversion.cfg +++ b/.bumpversion.cfg @@ -1,5 +1,5 @@ [bumpversion] -current_version = 0.1.12 +current_version = 0.1.13 commit = True tag = True tag_name = v{new_version} diff --git a/app/package.json b/app/package.json index 00170cca..0849a94b 100644 --- a/app/package.json +++ b/app/package.json @@ -1,6 +1,6 @@ { "name": "@voicebox/app", - "version": "0.1.12", + "version": "0.1.13", "private": true, "type": "module", "scripts": { diff --git a/backend/__init__.py b/backend/__init__.py index e75772bd..36b3fee7 100644 --- a/backend/__init__.py +++ b/backend/__init__.py @@ -1,3 +1,3 @@ # Backend package -__version__ = "0.1.12" +__version__ = "0.1.13" diff --git a/landing/package.json b/landing/package.json index 655e57a6..8af4d00e 100644 --- a/landing/package.json +++ b/landing/package.json @@ -1,6 +1,6 @@ { "name": "@voicebox/landing", - "version": "0.1.12", + "version": "0.1.13", "description": "Landing page for voicebox.sh", "scripts": { "dev": "bun --bun next dev --turbo", diff --git a/package.json b/package.json index c0f3c21e..f6af4cbd 100644 --- a/package.json +++ b/package.json @@ -1,6 +1,6 @@ { "name": "voicebox", - "version": "0.1.12", + "version": "0.1.13", "private": true, "workspaces": [ "app", diff --git a/tauri/package.json b/tauri/package.json index 163f56c8..f7ec77ec 
100644 --- a/tauri/package.json +++ b/tauri/package.json @@ -1,7 +1,7 @@ { "name": "@voicebox/tauri", "private": true, - "version": "0.1.12", + "version": "0.1.13", "type": "module", "scripts": { "dev": "vite", diff --git a/tauri/src-tauri/Cargo.toml b/tauri/src-tauri/Cargo.toml index 739dd34d..aa3b1a9c 100644 --- a/tauri/src-tauri/Cargo.toml +++ b/tauri/src-tauri/Cargo.toml @@ -1,6 +1,6 @@ [package] name = "voicebox" -version = "0.1.12" +version = "0.1.13" description = "A production-quality desktop app for Qwen3-TTS voice cloning and generation" authors = ["you"] license = "" diff --git a/tauri/src-tauri/tauri.conf.json b/tauri/src-tauri/tauri.conf.json index 53b95d18..294d5049 100644 --- a/tauri/src-tauri/tauri.conf.json +++ b/tauri/src-tauri/tauri.conf.json @@ -1,7 +1,7 @@ { "$schema": "https://schema.tauri.app/config/2", "productName": "Voicebox", - "version": "0.1.12", + "version": "0.1.13", "identifier": "sh.voicebox.app", "build": { "beforeDevCommand": "bun run dev", diff --git a/web/package.json b/web/package.json index 99d82c56..1f44b3df 100644 --- a/web/package.json +++ b/web/package.json @@ -1,7 +1,7 @@ { "name": "@voicebox/web", "private": true, - "version": "0.1.12", + "version": "0.1.13", "type": "module", "scripts": { "dev": "vite", From 6dd5bb231198eb3ee8c42643030a2040d861da7c Mon Sep 17 00:00:00 2001 From: Jamie Pine Date: Sat, 31 Jan 2026 22:18:01 -0800 Subject: [PATCH 10/33] hugeicons --- app/package.json | 3 +- app/src/App.tsx | 11 ++--- .../components/AudioPlayer/AudioPlayer.tsx | 11 ++--- app/src/components/AudioTab/AudioTab.tsx | 27 ++++++------ .../Generation/FloatingGenerateBox.tsx | 9 ++-- .../components/Generation/GenerationForm.tsx | 7 +-- app/src/components/History/HistoryTable.tsx | 33 +++++++------- app/src/components/MainEditor/MainEditor.tsx | 7 +-- .../ServerSettings/ModelManagement.tsx | 30 ++++++------- .../ServerSettings/ModelProgress.tsx | 7 +-- .../ServerSettings/ProviderSettings.tsx | 17 ++++---- 
.../ServerSettings/ServerStatus.tsx | 7 +-- .../ServerSettings/UpdateStatus.tsx | 15 ++++--- app/src/components/Sidebar.tsx | 21 ++++----- .../components/StoriesTab/StoryChatItem.tsx | 13 +++--- .../components/StoriesTab/StoryContent.tsx | 7 +-- app/src/components/StoriesTab/StoryList.tsx | 13 +++--- .../StoriesTab/StoryTrackEditor.tsx | 41 +++++++++--------- .../VoiceProfiles/AudioSampleRecording.tsx | 13 +++--- .../VoiceProfiles/AudioSampleSystem.tsx | 13 +++--- .../VoiceProfiles/AudioSampleUpload.tsx | 11 ++--- .../components/VoiceProfiles/ProfileCard.tsx | 11 ++--- .../components/VoiceProfiles/ProfileForm.tsx | 17 ++++---- .../components/VoiceProfiles/ProfileList.tsx | 7 +-- .../components/VoiceProfiles/SampleList.tsx | 21 ++++----- .../components/VoiceProfiles/SampleUpload.tsx | 9 ++-- app/src/components/VoicesTab/VoicesTab.tsx | 13 +++--- app/src/components/ui/checkbox.tsx | 5 ++- app/src/components/ui/dialog.tsx | 5 ++- app/src/components/ui/dropdown-menu.tsx | 9 ++-- app/src/components/ui/multi-select.tsx | 7 +-- app/src/components/ui/radio-group.tsx | 5 ++- app/src/components/ui/select.tsx | 11 ++--- app/src/components/ui/toast.tsx | 5 ++- app/src/hooks/useAutoUpdater.ts | 2 +- app/src/hooks/useAutoUpdater.tsx | 7 +-- app/src/lib/api/types.ts | 1 + app/src/lib/hooks/useModelDownloadToast.tsx | 15 ++++--- backend/voicebox-server.spec | 6 +-- bun.lock | 14 ++++-- tauri/src-tauri/Cargo.lock | 2 +- tauri/src-tauri/gen/Assets.car | Bin 3847048 -> 3847048 bytes 42 files changed, 261 insertions(+), 227 deletions(-) diff --git a/app/package.json b/app/package.json index 0849a94b..07028409 100644 --- a/app/package.json +++ b/app/package.json @@ -17,6 +17,8 @@ "@dnd-kit/sortable": "^10.0.0", "@dnd-kit/utilities": "^3.2.2", "@hookform/resolvers": "^3.9.0", + "@hugeicons/core-free-icons": "^3.1.1", + "@hugeicons/react": "^1.1.4", "@radix-ui/react-alert-dialog": "^1.1.1", "@radix-ui/react-avatar": "^1.1.0", "@radix-ui/react-dialog": "^1.1.1", @@ -44,7 +46,6 @@ "clsx": 
"^2.1.1", "date-fns": "^3.6.0", "framer-motion": "^12.29.0", - "lucide-react": "^0.454.0", "motion": "^12.29.0", "react": "^18.3.0", "react-dom": "^18.3.0", diff --git a/app/src/App.tsx b/app/src/App.tsx index fbe29118..e54bc9dd 100644 --- a/app/src/App.tsx +++ b/app/src/App.tsx @@ -40,7 +40,7 @@ function App() { const serverStartingRef = useRef(false); // Automatically check for app updates on startup and show toast notifications - useAutoUpdater({ checkOnMount: true, showToast: true }); + useAutoUpdater(true); // Sync stored setting to Rust on startup useEffect(() => { @@ -82,8 +82,7 @@ function App() { console.log('Dev mode: Skipping auto-start of server (run it separately)'); setServerReady(true); // Mark as ready so UI doesn't show loading screen // Mark that server was not started by app (so we don't try to stop it on close) - // @ts-expect-error - adding property to window - window.__voiceboxServerStartedByApp = false; + (window as any).__voiceboxServerStartedByApp = false; return; } @@ -103,14 +102,12 @@ function App() { useServerStore.getState().setServerUrl(serverUrl); setServerReady(true); // Mark that we started the server (so we know to stop it on close) - // @ts-expect-error - adding property to window - window.__voiceboxServerStartedByApp = true; + (window as any).__voiceboxServerStartedByApp = true; }) .catch((error) => { console.error('Failed to auto-start server:', error); serverStartingRef.current = false; - // @ts-expect-error - adding property to window - window.__voiceboxServerStartedByApp = false; + (window as any).__voiceboxServerStartedByApp = false; }); // Cleanup: stop server on actual unmount (not StrictMode remount) diff --git a/app/src/components/AudioPlayer/AudioPlayer.tsx b/app/src/components/AudioPlayer/AudioPlayer.tsx index 48dd9e78..c49f7a38 100644 --- a/app/src/components/AudioPlayer/AudioPlayer.tsx +++ b/app/src/components/AudioPlayer/AudioPlayer.tsx @@ -1,5 +1,6 @@ import { useQuery } from '@tanstack/react-query'; -import { 
Pause, Play, Repeat, Volume2, VolumeX, X } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { PauseIcon, PlayIcon, RepeatIcon, VolumeHighIcon, VolumeMuteIcon, Cancel01Icon } from '@hugeicons/core-free-icons'; import { useEffect, useMemo, useRef, useState } from 'react'; import WaveSurfer from 'wavesurfer.js'; import { Button } from '@/components/ui/button'; @@ -832,7 +833,7 @@ export function AudioPlayer() { className="shrink-0" title={duration === 0 && !isLoading ? 'Audio not loaded' : ''} > - {isPlaying ? : } + {isPlaying ? : } {/* Waveform */} @@ -873,7 +874,7 @@ export function AudioPlayer() { className={isLooping ? 'text-primary' : ''} title="Toggle loop" > - + {/* Volume Control */} @@ -884,7 +885,7 @@ export function AudioPlayer() { onClick={() => setVolume(volume > 0 ? 0 : 1)} className="h-8 w-8" > - {volume > 0 ? : } + {volume > 0 ? : } - +
diff --git a/app/src/components/AudioTab/AudioTab.tsx b/app/src/components/AudioTab/AudioTab.tsx index f76e99d7..150e7660 100644 --- a/app/src/components/AudioTab/AudioTab.tsx +++ b/app/src/components/AudioTab/AudioTab.tsx @@ -1,5 +1,6 @@ import { useMutation, useQuery, useQueryClient } from '@tanstack/react-query'; -import { Check, CheckCircle2, Edit, Plus, Speaker, Trash2 } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { CheckmarkCircle01Icon, CheckmarkCircle02Icon, Edit01Icon, Add01Icon, SpeakerIcon, Delete01Icon } from '@hugeicons/core-free-icons'; import { useState } from 'react'; import { Badge } from '@/components/ui/badge'; import { Button } from '@/components/ui/button'; @@ -135,7 +136,7 @@ export function AudioTab() {

Audio Channels

@@ -150,13 +151,13 @@ export function AudioTab() { > {allChannels.length === 0 ? (
- +

No audio channels yet. Create your first channel to route voices to specific devices.

@@ -178,7 +179,7 @@ export function AudioTab() {
- +

{channel.name}

@@ -235,7 +236,7 @@ export function AudioTab() { setEditingChannel(channel.id); }} > - +
)} @@ -325,10 +326,10 @@ export function AudioTab() { isConnected ? 'bg-accent border-accent' : 'border-muted-foreground/30', )} > - {isConnected && } + {isConnected && }
) : device.is_default ? ( - + ) : null} {device.name} @@ -339,7 +340,7 @@ export function AudioTab() {
) : (
- +

{platform.metadata.isTauri ? 'No audio devices found' : 'Audio device selection requires Tauri'}

@@ -494,7 +495,7 @@ function CreateChannelDialog({ open, onOpenChange, devices, onCreate }: CreateCh setSelectedDevices(selectedDevices.filter((id) => id !== deviceId)) } > - +
); @@ -602,7 +603,7 @@ function EditChannelDialog({ setSelectedDevices(selectedDevices.filter((id) => id !== deviceId)) } > - + ); @@ -648,7 +649,7 @@ function EditChannelDialog({ setSelectedVoices(selectedVoices.filter((id) => id !== profileId)) } > - + ); diff --git a/app/src/components/Generation/FloatingGenerateBox.tsx b/app/src/components/Generation/FloatingGenerateBox.tsx index b020a81f..dc835dfb 100644 --- a/app/src/components/Generation/FloatingGenerateBox.tsx +++ b/app/src/components/Generation/FloatingGenerateBox.tsx @@ -1,6 +1,7 @@ import { useMatchRoute } from '@tanstack/react-router'; import { AnimatePresence, motion } from 'framer-motion'; -import { Loader2, MessageSquare, Sparkles } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { Loading01Icon, TextSquareIcon, SparklesIcon } from '@hugeicons/core-free-icons'; import { useEffect, useRef, useState } from 'react'; import { Button } from '@/components/ui/button'; import { Form, FormControl, FormField, FormItem, FormMessage } from '@/components/ui/form'; @@ -301,9 +302,9 @@ export function FloatingGenerateBox({ size="icon" > {isPending ? ( - + ) : ( - + )} @@ -327,7 +328,7 @@ export function FloatingGenerateBox({ : 'bg-card border border-border hover:bg-background/50', )} > - + )} diff --git a/app/src/components/Generation/GenerationForm.tsx b/app/src/components/Generation/GenerationForm.tsx index 31b100f8..edf7b749 100644 --- a/app/src/components/Generation/GenerationForm.tsx +++ b/app/src/components/Generation/GenerationForm.tsx @@ -1,4 +1,5 @@ -import { Loader2, Mic } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { Loading01Icon, Mic01Icon } from '@hugeicons/core-free-icons'; import { Button } from '@/components/ui/button'; import { Card, CardContent, CardHeader, CardTitle } from '@/components/ui/card'; import { @@ -46,7 +47,7 @@ export function GenerationForm() { Voice Profile {selectedProfile ? (
- + {selectedProfile.name} {selectedProfile.language}
@@ -177,7 +178,7 @@ export function GenerationForm() { > {isPending ? ( <> - + Generating... ) : ( diff --git a/app/src/components/History/HistoryTable.tsx b/app/src/components/History/HistoryTable.tsx index e572f69e..0c889046 100644 --- a/app/src/components/History/HistoryTable.tsx +++ b/app/src/components/History/HistoryTable.tsx @@ -1,12 +1,13 @@ +import { HugeiconsIcon } from '@hugeicons/react'; import { - AudioWaveform, - Download, - FileArchive, - Loader2, - MoreHorizontal, - Play, - Trash2, -} from 'lucide-react'; + WaveIcon, + Download01Icon, + Archive01Icon, + Loading01Icon, + MoreHorizontalIcon, + PlayIcon, + Delete01Icon, +} from '@hugeicons/core-free-icons'; import { useEffect, useRef, useState } from 'react'; import { Button } from '@/components/ui/button'; import { @@ -222,7 +223,7 @@ export function HistoryTable() { if (isLoading && page === 0) { return (
- +
); } @@ -268,7 +269,7 @@ export function HistoryTable() { > {/* Waveform icon */}
- +
{/* Left side - Meta information */} @@ -310,28 +311,28 @@ export function HistoryTable() { className="h-8 w-8" aria-label="Actions" > - + handlePlay(gen.id, gen.text, gen.profile_id)} > - + Play handleDownloadAudio(gen.id, gen.text)} disabled={exportGenerationAudio.isPending} > - + Export Audio handleExportPackage(gen.id, gen.text)} disabled={exportGeneration.isPending} > - + Export Package - + Delete @@ -352,7 +353,7 @@ export function HistoryTable() { {/* Load more trigger element */} {hasMore && (
- {isFetching && } + {isFetching && }
)} diff --git a/app/src/components/MainEditor/MainEditor.tsx b/app/src/components/MainEditor/MainEditor.tsx index 9d597b1e..17125893 100644 --- a/app/src/components/MainEditor/MainEditor.tsx +++ b/app/src/components/MainEditor/MainEditor.tsx @@ -1,4 +1,5 @@ -import { Sparkles, Upload } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { SparklesIcon, Upload01Icon } from '@hugeicons/core-free-icons'; import { useRef, useState } from 'react'; import { FloatingGenerateBox } from '@/components/Generation/FloatingGenerateBox'; import { HistoryTable } from '@/components/History/HistoryTable'; @@ -89,7 +90,7 @@ export function MainEditor() {

Voicebox

diff --git a/app/src/components/ServerSettings/ModelManagement.tsx b/app/src/components/ServerSettings/ModelManagement.tsx index 4a5fd439..f7e10fdb 100644 --- a/app/src/components/ServerSettings/ModelManagement.tsx +++ b/app/src/components/ServerSettings/ModelManagement.tsx @@ -1,5 +1,6 @@ import { useMutation, useQuery, useQueryClient } from '@tanstack/react-query'; -import { Download, Loader2, Trash2 } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { Download01Icon, Loading01Icon, Delete01Icon } from '@hugeicons/core-free-icons'; import { useCallback, useState } from 'react'; import { AlertDialog, @@ -67,11 +68,11 @@ export function ModelManagement() { const handleDownload = async (modelName: string) => { console.log('[Download] Button clicked for:', modelName, 'at', new Date().toISOString()); - + // Find display name const model = modelStatus?.models.find((m) => m.model_name === modelName); const displayName = model?.display_name || modelName; - + try { // IMPORTANT: Call the API FIRST before setting state // Setting state enables the SSE EventSource in useModelDownloadToast, @@ -79,11 +80,11 @@ export function ModelManagement() { console.log('[Download] Calling download API for:', modelName); const result = await apiClient.triggerModelDownload(modelName); console.log('[Download] Download API responded:', result); - + // NOW set state to enable SSE tracking (after download has started on backend) setDownloadingModel(modelName); setDownloadingDisplayName(displayName); - + // Download initiated successfully - state will be cleared when SSE reports completion // or by the polling interval detecting the model is downloaded queryClient.invalidateQueries({ queryKey: ['modelStatus'] }); @@ -117,7 +118,7 @@ export function ModelManagement() { // Invalidate AND explicitly refetch to ensure UI updates // Using refetchType: 'all' ensures we refetch even if the query is stale console.log('[Delete] Invalidating modelStatus query'); - await 
queryClient.invalidateQueries({ + await queryClient.invalidateQueries({ queryKey: ['modelStatus'], refetchType: 'all', }); @@ -153,7 +154,7 @@ export function ModelManagement() { {isLoading ? (
- +
) : modelStatus ? (
@@ -212,7 +213,6 @@ export function ModelManagement() { ))}
- ) : null}
@@ -246,7 +246,7 @@ export function ModelManagement() { > {deleteMutation.isPending ? ( <> - + Deleting... ) : ( @@ -265,20 +265,20 @@ interface ModelItemProps { model_name: string; display_name: string; downloaded: boolean; - downloading?: boolean; // From server - true if download in progress + downloading?: boolean; // From server - true if download in progress size_mb?: number; loaded: boolean; }; onDownload: () => void; onDelete: () => void; - isDownloading: boolean; // Local state - true if user just clicked download + isDownloading: boolean; // Local state - true if user just clicked download formatSize: (sizeMb?: number) => string; } function ModelItem({ model, onDownload, onDelete, isDownloading, formatSize }: ModelItemProps) { // Use server's downloading state OR local state (for immediate feedback before server updates) const showDownloading = model.downloading || isDownloading; - + return (
@@ -315,17 +315,17 @@ function ModelItem({ model, onDownload, onDelete, isDownloading, formatSize }: M disabled={model.loaded} title={model.loaded ? 'Unload model before deleting' : 'Delete model'} > - +
) : showDownloading ? ( ) : ( )} diff --git a/app/src/components/ServerSettings/ModelProgress.tsx b/app/src/components/ServerSettings/ModelProgress.tsx index 76aa99f1..30229c50 100644 --- a/app/src/components/ServerSettings/ModelProgress.tsx +++ b/app/src/components/ServerSettings/ModelProgress.tsx @@ -1,4 +1,5 @@ -import { Loader2, XCircle } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { Loading01Icon, CancelCircleIcon } from '@hugeicons/core-free-icons'; import { useEffect, useState } from 'react'; import { Card, CardContent, CardHeader, CardTitle } from '@/components/ui/card'; import { Progress } from '@/components/ui/progress'; @@ -74,10 +75,10 @@ export function ModelProgress({ modelName, displayName, isDownloading = false }: const getStatusIcon = () => { switch (progress.status) { case 'error': - return ; + return ; case 'downloading': case 'extracting': - return ; + return ; default: return null; } diff --git a/app/src/components/ServerSettings/ProviderSettings.tsx b/app/src/components/ServerSettings/ProviderSettings.tsx index c18874a9..7ae237aa 100644 --- a/app/src/components/ServerSettings/ProviderSettings.tsx +++ b/app/src/components/ServerSettings/ProviderSettings.tsx @@ -1,5 +1,6 @@ import { useMutation, useQuery, useQueryClient } from '@tanstack/react-query'; -import { Download, Loader2, Trash2 } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { Download01Icon, Loading01Icon, Delete01Icon } from '@hugeicons/core-free-icons'; import { useCallback, useState } from 'react'; import { AlertDialog, @@ -155,7 +156,7 @@ export function ProviderSettings() {
- +
@@ -217,10 +218,10 @@ export function ProviderSettings() { disabled={downloadingProvider === 'pytorch-cuda'} > {downloadingProvider === 'pytorch-cuda' ? ( - + ) : ( <> - + Download (2.4GB) )} @@ -241,7 +242,7 @@ export function ProviderSettings() { size="sm" variant="ghost" > - + )}
@@ -270,10 +271,10 @@ export function ProviderSettings() { disabled={downloadingProvider === 'pytorch-cpu'} > {downloadingProvider === 'pytorch-cpu' ? ( - + ) : ( <> - + Download (300MB) )} @@ -294,7 +295,7 @@ export function ProviderSettings() { size="sm" variant="ghost" > - + )} diff --git a/app/src/components/ServerSettings/ServerStatus.tsx b/app/src/components/ServerSettings/ServerStatus.tsx index 02a94ec2..8b5e5197 100644 --- a/app/src/components/ServerSettings/ServerStatus.tsx +++ b/app/src/components/ServerSettings/ServerStatus.tsx @@ -1,4 +1,5 @@ -import { Loader2, XCircle } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { Loading01Icon, CancelCircleIcon } from '@hugeicons/core-free-icons'; import { Badge } from '@/components/ui/badge'; import { Card, CardContent, CardHeader, CardTitle } from '@/components/ui/card'; import { useServerHealth } from '@/lib/hooks/useServer'; @@ -32,12 +33,12 @@ export function ServerStatus() { {isLoading ? (
- + Checking connection...
) : error ? (
- + Connection failed: {error.message}
) : health ? ( diff --git a/app/src/components/ServerSettings/UpdateStatus.tsx b/app/src/components/ServerSettings/UpdateStatus.tsx index a3d832aa..5cab320e 100644 --- a/app/src/components/ServerSettings/UpdateStatus.tsx +++ b/app/src/components/ServerSettings/UpdateStatus.tsx @@ -1,4 +1,5 @@ -import { AlertCircle, Download, RefreshCw } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { AlertCircleIcon, Download01Icon, Refresh01Icon } from '@hugeicons/core-free-icons'; import { useEffect, useState } from 'react'; import { Badge } from '@/components/ui/badge'; import { Button } from '@/components/ui/button'; @@ -36,21 +37,21 @@ export function UpdateStatus() { variant="outline" size="sm" > - + Check for Updates {status.checking && (
- + Checking for updates...
)} {status.error && (
- + {status.error}
)} @@ -65,7 +66,7 @@ export function UpdateStatus() { New @@ -75,7 +76,7 @@ export function UpdateStatus() {
- + Downloading update...
{status.downloadProgress !== undefined && ( @@ -109,7 +110,7 @@ export function UpdateStatus() { your convenience.
diff --git a/app/src/components/Sidebar.tsx b/app/src/components/Sidebar.tsx index a849344f..04442db0 100644 --- a/app/src/components/Sidebar.tsx +++ b/app/src/components/Sidebar.tsx @@ -1,5 +1,6 @@ import { Link, useMatchRoute } from '@tanstack/react-router'; -import { Box, BookOpen, Loader2, Mic, Server, Speaker, Volume2 } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { PackageIcon, Book01Icon, Loading01Icon, Mic01Icon, McpServerIcon, SpeakerIcon, VolumeHighIcon } from '@hugeicons/core-free-icons'; import voiceboxLogo from '@/assets/voicebox-logo.png'; import { cn } from '@/lib/utils/cn'; import { useGenerationStore } from '@/stores/generationStore'; @@ -10,12 +11,12 @@ interface SidebarProps { } const tabs = [ - { id: 'main', path: '/', icon: Volume2, label: 'Generate' }, - { id: 'stories', path: '/stories', icon: BookOpen, label: 'Stories' }, - { id: 'voices', path: '/voices', icon: Mic, label: 'Voices' }, - { id: 'audio', path: '/audio', icon: Speaker, label: 'Audio' }, - { id: 'models', path: '/models', icon: Box, label: 'Models' }, - { id: 'server', path: '/server', icon: Server, label: 'Server' }, + { id: 'main', path: '/', icon: VolumeHighIcon, label: 'Generate' }, + { id: 'stories', path: '/stories', icon: Book01Icon, label: 'Stories' }, + { id: 'voices', path: '/voices', icon: Mic01Icon, label: 'Voices' }, + { id: 'audio', path: '/audio', icon: SpeakerIcon, label: 'Audio' }, + { id: 'models', path: '/models', icon: PackageIcon, label: 'Models' }, + { id: 'server', path: '/server', icon: McpServerIcon, label: 'Server' }, ]; export function Sidebar({ isMacOS }: SidebarProps) { @@ -43,7 +44,7 @@ export function Sidebar({ isMacOS }: SidebarProps) { // For index route, use exact match; for others, use default matching const isActive = tab.path === '/' - ? matchRoute({ to: '/', exact: true }) + ? 
matchRoute({ to: '/' }) : matchRoute({ to: tab.path }); return ( @@ -58,7 +59,7 @@ export function Sidebar({ isMacOS }: SidebarProps) { title={tab.label} aria-label={tab.label} > - + ); })} @@ -75,7 +76,7 @@ export function Sidebar({ isMacOS }: SidebarProps) { isPlayerVisible ? 'mb-[120px]' : 'mb-0', )} > - + )} diff --git a/app/src/components/StoriesTab/StoryChatItem.tsx b/app/src/components/StoriesTab/StoryChatItem.tsx index 19fa2249..c1dd793f 100644 --- a/app/src/components/StoriesTab/StoryChatItem.tsx +++ b/app/src/components/StoriesTab/StoryChatItem.tsx @@ -1,6 +1,7 @@ import { useSortable } from '@dnd-kit/sortable'; import { CSS } from '@dnd-kit/utilities'; -import { GripVertical, Mic, MoreHorizontal, Play, Trash2 } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { DragDropVerticalIcon, Mic01Icon, MoreHorizontalIcon, PlayIcon, Delete01Icon } from '@hugeicons/core-free-icons'; import { useState } from 'react'; import { Button } from '@/components/ui/button'; import { @@ -74,7 +75,7 @@ export function StoryChatItem({ className="shrink-0 cursor-grab active:cursor-grabbing touch-none text-muted-foreground hover:text-foreground transition-colors" {...dragHandleProps} > - + )} @@ -92,7 +93,7 @@ export function StoryChatItem({ onError={() => setAvatarError(true)} /> ) : ( - + )} @@ -119,16 +120,16 @@ export function StoryChatItem({ - + Play from here - + Remove from Story diff --git a/app/src/components/StoriesTab/StoryContent.tsx b/app/src/components/StoriesTab/StoryContent.tsx index 483e6657..518c42a0 100644 --- a/app/src/components/StoriesTab/StoryContent.tsx +++ b/app/src/components/StoriesTab/StoryContent.tsx @@ -13,7 +13,8 @@ import { sortableKeyboardCoordinates, verticalListSortingStrategy, } from '@dnd-kit/sortable'; -import { Download, Plus } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { Download01Icon, Add01Icon } from '@hugeicons/core-free-icons'; import { useEffect, useMemo, useRef, 
useState } from 'react'; import { Button } from '@/components/ui/button'; import { Input } from '@/components/ui/input'; @@ -271,7 +272,7 @@ export function StoryContent() { @@ -316,7 +317,7 @@ export function StoryContent() { onClick={handleExportAudio} disabled={exportAudio.isPending} > - + Export Audio )} diff --git a/app/src/components/StoriesTab/StoryList.tsx b/app/src/components/StoriesTab/StoryList.tsx index ebbd6616..a283a34a 100644 --- a/app/src/components/StoriesTab/StoryList.tsx +++ b/app/src/components/StoriesTab/StoryList.tsx @@ -1,4 +1,5 @@ -import { Plus, BookOpen, MoreHorizontal, Pencil, Trash2 } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { Add01Icon, Book01Icon, MoreHorizontalIcon, PencilIcon, Delete01Icon } from '@hugeicons/core-free-icons'; import { useState } from 'react'; import { AlertDialog, @@ -177,7 +178,7 @@ export function StoryList() {

Stories

@@ -186,7 +187,7 @@ export function StoryList() {
{storyList.length === 0 ? (
- +

No stories yet

Create your first story to get started

@@ -227,19 +228,19 @@ export function StoryList() { className="h-8 w-8 opacity-0 group-hover:opacity-100 transition-opacity" onClick={(e) => e.stopPropagation()} > - + handleEditClick(story)}> - + Edit handleDeleteClick(story.id)} className="text-destructive focus:text-destructive" > - + Delete diff --git a/app/src/components/StoriesTab/StoryTrackEditor.tsx b/app/src/components/StoriesTab/StoryTrackEditor.tsx index 74dbde25..95a10296 100644 --- a/app/src/components/StoriesTab/StoryTrackEditor.tsx +++ b/app/src/components/StoriesTab/StoryTrackEditor.tsx @@ -1,14 +1,15 @@ +import { HugeiconsIcon } from '@hugeicons/react'; import { - Copy, - GripHorizontal, - Minus, - Pause, - Play, - Plus, - Scissors, - Square, - Trash2, -} from 'lucide-react'; + Copy01Icon, + DragDropHorizontalIcon, + RemoveIcon, + PauseIcon, + PlayIcon, + Add01Icon, + Scissor01Icon, + SquareIcon, + Delete01Icon, +} from '@hugeicons/core-free-icons'; import { useCallback, useEffect, useMemo, useRef, useState } from 'react'; import WaveSurfer from 'wavesurfer.js'; import { Button } from '@/components/ui/button'; @@ -723,7 +724,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) { onMouseDown={handleResizeStart} aria-label="Resize track editor" > - + {/* Toolbar */} @@ -737,7 +738,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) { onClick={handlePlayPause} title="Play/Pause (Space)" > - {isCurrentlyPlaying ? : } + {isCurrentlyPlaying ? : } {formatTime(currentTimeMs)} / {formatTime(totalDurationMs)} @@ -763,7 +764,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) { onClick={handleSplit} title="Split at playhead (S)" > - +
)} @@ -790,10 +791,10 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) {
Zoom:
@@ -837,7 +838,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) { type="button" className="h-6 border-b bg-muted/20 sticky top-0 z-10 cursor-pointer text-left" style={{ width: `${timelineWidth}px` }} - onClick={handleTimelineClick} + onClick={(e) => handleTimelineClick(e as unknown as React.MouseEvent)} aria-label="Seek timeline" > {timeMarkers.map((ms) => ( @@ -878,7 +879,7 @@ export function StoryTrackEditor({ storyId, items }: StoryTrackEditorProps) {

@@ -122,7 +123,7 @@ export function AudioSampleRecording({ onClick={onStop} className="relative z-10 flex items-center gap-2 bg-accent text-accent-foreground hover:bg-accent/90" > - + Stop Recording

@@ -134,13 +135,13 @@ export function AudioSampleRecording({ {file && !isRecording && (

- + Recording complete

File: {file.name}

@@ -60,7 +61,7 @@ export function AudioSampleSystem({ variant="destructive" className="flex items-center gap-2" > - + Stop Capture

@@ -72,13 +73,13 @@ export function AudioSampleSystem({ {file && !isRecording && (

- + Capture complete

File: {file.name}

@@ -99,7 +100,7 @@ export function AudioSampleUpload({ ) : ( <>

- + File uploaded

File: {file.name}

@@ -111,7 +112,7 @@ export function AudioSampleUpload({ onClick={onPlayPause} disabled={isValidating} > - {isPlaying ? : } + {isPlaying ? : }
{profile.name} @@ -101,13 +102,13 @@ export function ProfileCard({ profile }: ProfileCardProps) {
} onClick={handleExport} disabled={exportProfile.isPending} aria-label="Export profile" /> } onClick={(e) => { e.stopPropagation(); handleEdit(); @@ -115,7 +116,7 @@ export function ProfileCard({ profile }: ProfileCardProps) { aria-label="Edit profile" /> } onClick={handleDeleteClick} disabled={deleteProfile.isPending} aria-label="Delete profile" diff --git a/app/src/components/VoiceProfiles/ProfileForm.tsx b/app/src/components/VoiceProfiles/ProfileForm.tsx index f4fc5711..3fcd987e 100644 --- a/app/src/components/VoiceProfiles/ProfileForm.tsx +++ b/app/src/components/VoiceProfiles/ProfileForm.tsx @@ -1,5 +1,6 @@ import { zodResolver } from '@hookform/resolvers/zod'; -import { Edit2, Mic, Monitor, Upload, X } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { Edit02Icon, Mic01Icon, DeskIcon, Upload01Icon, Cancel01Icon } from '@hugeicons/core-free-icons'; import { useEffect, useRef, useState } from 'react'; import { useForm } from 'react-hook-form'; import * as z from 'zod'; @@ -635,7 +636,7 @@ export function ProfileForm() { setSampleMode('record'); }} > - + Discard
@@ -668,16 +669,16 @@ export function ProfileForm() { className={`grid w-full ${platform.metadata.isTauri && isSystemAudioSupported ? 'grid-cols-3' : 'grid-cols-2'}`} > - + Upload - + Record {platform.metadata.isTauri && isSystemAudioSupported && ( - + System Audio )} @@ -798,7 +799,7 @@ export function ProfileForm() { className="h-full w-full object-cover" /> ) : ( - + )}
{(avatarPreview || editingProfile?.avatar_path) && ( )}
diff --git a/app/src/components/VoiceProfiles/ProfileList.tsx b/app/src/components/VoiceProfiles/ProfileList.tsx index 8dcb06a4..4e57bfdb 100644 --- a/app/src/components/VoiceProfiles/ProfileList.tsx +++ b/app/src/components/VoiceProfiles/ProfileList.tsx @@ -1,4 +1,5 @@ -import { Mic, Sparkles } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { Mic01Icon, SparklesIcon } from '@hugeicons/core-free-icons'; import { Button } from '@/components/ui/button'; import { Card, CardContent } from '@/components/ui/card'; import { useProfiles } from '@/lib/hooks/useProfiles'; @@ -30,12 +31,12 @@ export function ProfileList() { {allProfiles.length === 0 ? ( - +

No voice profiles yet. Create your first profile to get started.

diff --git a/app/src/components/VoiceProfiles/SampleList.tsx b/app/src/components/VoiceProfiles/SampleList.tsx index 19aa1ca8..17664afd 100644 --- a/app/src/components/VoiceProfiles/SampleList.tsx +++ b/app/src/components/VoiceProfiles/SampleList.tsx @@ -1,4 +1,5 @@ -import { Check, Edit, Pause, Play, Plus, Trash2, Volume2, X } from 'lucide-react'; +import { HugeiconsIcon } from '@hugeicons/react'; +import { CheckmarkCircle01Icon, Edit01Icon, PauseIcon, PlayIcon, Add01Icon, Delete01Icon, VolumeHighIcon, Cancel01Icon } from '@hugeicons/core-free-icons'; import { useEffect, useRef, useState } from 'react'; import { Button } from '@/components/ui/button'; import { CircleButton } from '@/components/ui/circle-button'; @@ -103,7 +104,7 @@ function MiniSamplePlayer({ audioUrl }: MiniSamplePlayerProps) { onClick={handlePlayPause} disabled={isLoading} > - {isPlaying ? : } + {isPlaying ? : }
@@ -129,7 +130,7 @@ function MiniSamplePlayer({ audioUrl }: MiniSamplePlayerProps) { onClick={handleStop} title="Stop" > - +
@@ -209,7 +210,7 @@ export function SampleList({ profileId }: SampleListProps) {
{samples && samples.length === 0 ? (
- +

No samples yet

Add your first audio sample to get started @@ -232,7 +233,7 @@ export function SampleList({ profileId }: SampleListProps) { /* Edit Mode */

- + Editing transcription