diff --git a/backend_service/app.py b/backend_service/app.py index e226b08..86977d7 100644 --- a/backend_service/app.py +++ b/backend_service/app.py @@ -8,25 +8,20 @@ import uuid from datetime import datetime from pathlib import Path -from typing import Any +from typing import TYPE_CHECKING, Any from fastapi import FastAPI, Request from fastapi.middleware.cors import CORSMiddleware from starlette.responses import JSONResponse -from backend_service.image_runtime import ( - ImageGenerationConfig, - ImageRuntimeManager, -) -from backend_service.video_runtime import ( - VideoGenerationConfig, - VideoRuntimeManager, - start_torch_warmup, -) from backend_service.models import ImageGenerationRequest, VideoGenerationRequest from backend_service.routes import register_routes from backend_service.state import ChaosEngineState +if TYPE_CHECKING: + from backend_service.image_runtime import ImageRuntimeManager + from backend_service.video_runtime import VideoRuntimeManager + # --------------------------------------------------------------------------- # Helper modules -- extracted from this file for maintainability. # --------------------------------------------------------------------------- @@ -121,8 +116,8 @@ # extracted signatures require them explicitly. # --------------------------------------------------------------------------- -def _build_system_snapshot() -> dict[str, Any]: - return _build_system_snapshot_impl(app_version, APP_STARTED_AT) +def _build_system_snapshot(*, capabilities: Any | None = None) -> dict[str, Any]: + return _build_system_snapshot_impl(app_version, APP_STARTED_AT, capabilities=capabilities) def _default_settings() -> dict[str, Any]: @@ -231,6 +226,7 @@ def compute_cache_preview( fp16_layers: int = 4, num_layers: int = 32, num_heads: int = 32, + num_kv_heads: int | None = None, hidden_size: int = 4096, context_tokens: int = 8192, params_b: float = 7.0, @@ -242,6 +238,7 @@ def compute_cache_preview( fp16_layers=fp16_layers, num_layers=num_layers, num_heads=num_heads, + num_kv_heads=num_kv_heads, hidden_size=hidden_size, context_tokens=context_tokens, params_b=params_b, @@ -343,6 +340,8 @@ def _generate_image_artifacts( runtime_manager: ImageRuntimeManager | None = None, ) -> tuple[list[dict[str, Any]], dict[str, Any]]: import logging + from backend_service.image_runtime import ImageGenerationConfig, ImageRuntimeManager + logger = logging.getLogger("chaosengine.images") effective_width, effective_height = ( _apply_draft_resolution(request.width, request.height) @@ -413,6 +412,8 @@ def _generate_video_artifact( HTTP error rather than a fake clip. """ import logging + from backend_service.video_runtime import VideoGenerationConfig + logger = logging.getLogger("chaosengine.video") logger.info( "Generating video: model=%s repo=%s size=%dx%d frames=%d steps=%d", @@ -489,7 +490,10 @@ def create_app( allow_methods=["GET", "POST", "PATCH", "DELETE", "OPTIONS"], allow_headers=["Accept", "Authorization", "Content-Type", "X-ChaosEngine-Token"], ) - app.state.chaosengine = state or ChaosEngineState(server_port=DEFAULT_PORT) + app.state.chaosengine = state or ChaosEngineState( + server_port=DEFAULT_PORT, + background_capability_probe=True, + ) app.state.chaosengine_api_token = _resolve_api_token(api_token) app.state.chaosengine_allowed_origins = frozenset(allowed_origins) # Bearer-token enforcement toggle. 
Reads from (in order) env override, diff --git a/backend_service/catalog/image_models.py b/backend_service/catalog/image_models.py index d890a46..fce458b 100644 --- a/backend_service/catalog/image_models.py +++ b/backend_service/catalog/image_models.py @@ -44,7 +44,7 @@ "taskSupport": ["txt2img"], "sizeGb": 6.8, "recommendedResolution": "1024x1024", - "note": "GGUF Q4_K_M — runs on ~8 GB VRAM / Apple Silicon with near-unchanged quality.", + "note": "GGUF Q4_K_M — quantizes the FLUX transformer; the full diffusers pipeline still carries the base text encoders/VAE in memory.", "estimatedGenerationSeconds": 5.2, "releaseDate": "2024-09", }, @@ -62,7 +62,7 @@ "taskSupport": ["txt2img"], "sizeGb": 12.7, "recommendedResolution": "1024x1024", - "note": "GGUF Q8_0 — near-bf16 quality at ~half the memory footprint.", + "note": "GGUF Q8_0 — near-bf16 transformer quality; text encoders/VAE still make the full FLUX runtime memory-heavy.", "estimatedGenerationSeconds": 4.8, "releaseDate": "2024-09", }, @@ -125,7 +125,7 @@ "taskSupport": ["txt2img"], "sizeGb": 6.8, "recommendedResolution": "1024x1024", - "note": "GGUF Q4_K_M — fits FLUX Dev on 8 GB VRAM / Apple Silicon with minimal quality loss.", + "note": "GGUF Q4_K_M — quantizes the FLUX Dev transformer; expect the full diffusers pipeline to remain memory-heavy from text encoders/VAE.", "estimatedGenerationSeconds": 9.0, "releaseDate": "2024-09", }, @@ -143,7 +143,7 @@ "taskSupport": ["txt2img"], "sizeGb": 9.9, "recommendedResolution": "1024x1024", - "note": "GGUF Q6_K — mid-point between Q4 size and Q8 quality.", + "note": "GGUF Q6_K — mid-point between Q4 size and Q8 transformer quality; FLUX text encoders/VAE still dominate runtime memory.", "estimatedGenerationSeconds": 8.4, "releaseDate": "2024-09", }, @@ -161,7 +161,7 @@ "taskSupport": ["txt2img"], "sizeGb": 12.7, "recommendedResolution": "1024x1024", - "note": "GGUF Q8_0 — near-bf16 quality at roughly half the memory.", + "note": "GGUF Q8_0 — near-bf16 transformer quality; text encoders/VAE still make the full FLUX runtime memory-heavy.", "estimatedGenerationSeconds": 7.8, "releaseDate": "2024-09", }, @@ -271,6 +271,154 @@ ] LATEST_IMAGE_TRACKED_SEEDS: list[dict[str, Any]] = [ + { + "repo": "baidu/ERNIE-Image", + "name": "ERNIE-Image", + "provider": "Baidu", + "styleTags": ["general", "detailed"], + "taskSupport": ["txt2img"], + "sizeGb": 29.43, + "runtimeFootprintGb": 24.0, + "runtimeFootprintMpsGb": 32.0, + "runtimeFootprintCpuGb": 36.0, + "coreWeightsGb": 29.43, + "repoSizeGb": 29.47, + "recommendedResolution": "1024x1024", + "note": "Tracked current text-to-image DiT release from Baidu.", + "gated": False, + "pipelineTag": "text-to-image", + "updatedLabel": "Tracked latest", + "releaseDate": "2026-04", + }, + { + "repo": "baidu/ERNIE-Image-Turbo", + "name": "ERNIE-Image-Turbo", + "provider": "Baidu", + "styleTags": ["general", "fast"], + "taskSupport": ["txt2img"], + "sizeGb": 29.43, + "runtimeFootprintGb": 24.0, + "runtimeFootprintMpsGb": 32.0, + "runtimeFootprintCpuGb": 36.0, + "coreWeightsGb": 29.43, + "repoSizeGb": 29.47, + "recommendedResolution": "1024x1024", + "note": "Tracked faster ERNIE-Image lane for current local image generation discovery.", + "gated": False, + "pipelineTag": "text-to-image", + "updatedLabel": "Tracked latest", + "releaseDate": "2026-04", + }, + { + "repo": "NucleusAI/Nucleus-Image", + "name": "Nucleus-Image", + "provider": "NucleusAI", + "styleTags": ["general", "detailed"], + "taskSupport": ["txt2img"], + "sizeGb": 48.09, + "runtimeFootprintGb": 48.0, + 
"runtimeFootprintMpsGb": 55.0, + "runtimeFootprintCpuGb": 60.0, + "coreWeightsGb": 48.09, + "repoSizeGb": 48.11, + "recommendedResolution": "1024x1024", + "note": "Tracked current diffusers-compatible text-to-image release.", + "gated": False, + "pipelineTag": "text-to-image", + "updatedLabel": "Tracked latest", + "releaseDate": "2026-04", + }, + { + "repo": "black-forest-labs/FLUX.2-dev", + "name": "FLUX.2 Dev", + "provider": "Black Forest Labs", + "styleTags": ["general", "detailed", "flux"], + "taskSupport": ["txt2img", "img2img"], + "sizeGb": 64.7, + "runtimeFootprintGb": 65.0, + "runtimeFootprintMpsGb": 78.0, + "runtimeFootprintCpuGb": 90.0, + "recommendedResolution": "1024x1024", + "note": "Tracked FLUX.2 generation-and-editing release.", + "gated": True, + "pipelineTag": "image-to-image", + "updatedLabel": "Tracked latest", + "releaseDate": "2026-02", + }, + { + "repo": "black-forest-labs/FLUX.2-klein-9B", + "name": "FLUX.2 Klein 9B", + "provider": "Black Forest Labs", + "styleTags": ["general", "flux", "fast"], + "taskSupport": ["txt2img", "img2img"], + "sizeGb": 49.23, + "runtimeFootprintGb": 49.0, + "runtimeFootprintMpsGb": 55.0, + "runtimeFootprintCpuGb": 64.0, + "coreWeightsGb": 49.23, + "repoSizeGb": 49.26, + "recommendedResolution": "1024x1024", + "note": "Tracked smaller FLUX.2 lane.", + "gated": False, + "pipelineTag": "image-to-image", + "updatedLabel": "Tracked latest", + "releaseDate": "2026-02", + }, + { + "repo": "Tongyi-MAI/Z-Image-Turbo", + "name": "Z-Image-Turbo", + "provider": "Tongyi-MAI", + "styleTags": ["general", "fast"], + "taskSupport": ["txt2img"], + "sizeGb": 30.58, + "runtimeFootprintGb": 16.0, + "runtimeFootprintMpsGb": 20.0, + "runtimeFootprintCpuGb": 24.0, + "coreWeightsGb": 30.58, + "repoSizeGb": 30.64, + "recommendedResolution": "1024x1024", + "note": "Tracked current Z-Image turbo text-to-image release.", + "gated": False, + "pipelineTag": "text-to-image", + "updatedLabel": "Tracked latest", + "releaseDate": "2026-01", + }, + { + "repo": "Tongyi-MAI/Z-Image", + "name": "Z-Image", + "provider": "Tongyi-MAI", + "styleTags": ["general", "detailed"], + "taskSupport": ["txt2img"], + "sizeGb": 19.11, + "runtimeFootprintGb": 22.0, + "runtimeFootprintMpsGb": 24.0, + "runtimeFootprintCpuGb": 30.0, + "coreWeightsGb": 19.11, + "repoSizeGb": 19.14, + "recommendedResolution": "1024x1024", + "note": "Tracked current Z-Image text-to-image release.", + "gated": False, + "pipelineTag": "text-to-image", + "updatedLabel": "Tracked latest", + "releaseDate": "2026-01", + }, + { + "repo": "Qwen/Qwen-Image-Edit-2511", + "name": "Qwen-Image-Edit-2511", + "provider": "Qwen", + "styleTags": ["edit", "qwenimage", "general"], + "taskSupport": ["img2img"], + "sizeGb": 57.7, + "runtimeFootprintGb": 58.0, + "runtimeFootprintMpsGb": 72.0, + "runtimeFootprintCpuGb": 72.0, + "recommendedResolution": "1024x1024", + "note": "Tracked newer Qwen image editing release with improved consistency.", + "gated": False, + "pipelineTag": "image-to-image", + "updatedLabel": "Tracked latest", + "releaseDate": "2025-12", + }, { "repo": "Qwen/Qwen-Image", "name": "Qwen-Image", @@ -278,6 +426,9 @@ "styleTags": ["general", "detailed", "qwenimage"], "taskSupport": ["txt2img"], "sizeGb": 57.7, + "runtimeFootprintGb": 58.0, + "runtimeFootprintMpsGb": 72.0, + "runtimeFootprintCpuGb": 72.0, "recommendedResolution": "1024x1024", "note": "Tracked diffusers-native Qwen image generation family.", "gated": False, @@ -292,6 +443,9 @@ "styleTags": ["edit", "qwenimage", "general"], "taskSupport": ["img2img"], 
"sizeGb": 57.7, + "runtimeFootprintGb": 58.0, + "runtimeFootprintMpsGb": 72.0, + "runtimeFootprintCpuGb": 72.0, "recommendedResolution": "1024x1024", "note": "Tracked Qwen edit lane so Image Discover can surface newer editing-capable models too.", "gated": False, @@ -306,6 +460,9 @@ "styleTags": ["hidream", "detailed", "quality"], "taskSupport": ["txt2img"], "sizeGb": 47.2, + "runtimeFootprintGb": 58.0, + "runtimeFootprintMpsGb": 62.0, + "runtimeFootprintCpuGb": 70.0, "recommendedResolution": "1024x1024", "note": "Tracked larger open-image generation lane from the HiDream family.", "gated": False, @@ -320,6 +477,9 @@ "styleTags": ["general", "edit", "detailed"], "taskSupport": ["txt2img", "img2img"], "sizeGb": 35.8, + "runtimeFootprintGb": 40.0, + "runtimeFootprintMpsGb": 45.0, + "runtimeFootprintCpuGb": 52.0, "recommendedResolution": "1024x1024", "note": "Tracked unified generation-and-editing lane from the GLM image family.", "gated": False, @@ -333,6 +493,9 @@ "styleTags": ["sana", "fast", "small"], "taskSupport": ["txt2img"], "sizeGb": 7.7, + "runtimeFootprintGb": 8.0, + "runtimeFootprintMpsGb": 10.0, + "runtimeFootprintCpuGb": 12.0, "recommendedResolution": "1024x1024", "note": "Tracked smaller Sana Sprint lane for faster local image generation.", "gated": False, @@ -347,6 +510,9 @@ "styleTags": ["sana", "fast", "detailed"], "taskSupport": ["txt2img"], "sizeGb": 9.74, + "runtimeFootprintGb": 10.0, + "runtimeFootprintMpsGb": 12.0, + "runtimeFootprintCpuGb": 15.0, "recommendedResolution": "1024x1024", "note": "Tracked larger Sana Sprint lane with a better quality-to-speed balance.", "gated": False, diff --git a/backend_service/catalog/video_models.py b/backend_service/catalog/video_models.py index e3509bc..9fd6773 100644 --- a/backend_service/catalog/video_models.py +++ b/backend_service/catalog/video_models.py @@ -35,6 +35,7 @@ "styleTags": ["general", "fast", "motion"], "taskSupport": ["txt2video"], "sizeGb": 2.0, + "runtimeFootprintGb": 10.0, "recommendedResolution": "768x512", "defaultDurationSeconds": 4.0, "note": "Small, fast, Apache 2.0 — best starter pick for a local video runtime.", @@ -55,9 +56,10 @@ "styleTags": ["general", "fast", "motion", "gguf"], "taskSupport": ["txt2video"], "sizeGb": 1.4, + "runtimeFootprintGb": 10.0, "recommendedResolution": "768x512", "defaultDurationSeconds": 4.0, - "note": "GGUF Q4_K_M — runs on 6-8 GB VRAM / Apple Silicon at near-native quality.", + "note": "GGUF Q4_K_M — quantizes the transformer, but the LTX pipeline still needs roughly a 10 GB runtime envelope for text encoder/VAE/buffers.", "estimatedGenerationSeconds": 50.0, "availableLocally": False, "releaseDate": "2024-12", @@ -75,6 +77,7 @@ "styleTags": ["general", "motion", "quality", "gguf"], "taskSupport": ["txt2video"], "sizeGb": 1.7, + "runtimeFootprintGb": 10.0, "recommendedResolution": "768x512", "defaultDurationSeconds": 4.0, "note": "GGUF Q6_K — mid-point between Q4 footprint and Q8 fidelity.", @@ -95,6 +98,7 @@ "styleTags": ["general", "motion", "quality", "gguf"], "taskSupport": ["txt2video"], "sizeGb": 2.2, + "runtimeFootprintGb": 10.0, "recommendedResolution": "768x512", "defaultDurationSeconds": 4.0, "note": "GGUF Q8_0 — near-bf16 quality at roughly half the memory.", @@ -129,6 +133,7 @@ "styleTags": ["general", "fast", "motion", "mlx"], "taskSupport": ["txt2video"], "sizeGb": 19.0, + "runtimeFootprintGb": 27.0, "recommendedResolution": "768x512", "defaultDurationSeconds": 4.0, "note": "Distilled LTX-2 — fastest MLX path for previews. 
Use the dev variant for final fidelity.", @@ -147,6 +152,7 @@ "styleTags": ["general", "quality", "motion", "mlx"], "taskSupport": ["txt2video"], "sizeGb": 19.0, + "runtimeFootprintGb": 27.0, "recommendedResolution": "768x512", "defaultDurationSeconds": 4.0, "note": "Full LTX-2 dev weights — higher fidelity, longer sampling than distilled.", @@ -160,11 +166,13 @@ "name": "LTX-2.3 · distilled (MLX)", "provider": "Lightricks · prince-canuma", "repo": "prince-canuma/LTX-2.3-distilled", + "textEncoderRepo": "prince-canuma/LTX-2-distilled", "link": "https://huggingface.co/prince-canuma/LTX-2.3-distilled", "runtime": "mlx-video (MLX native)", "styleTags": ["general", "fast", "motion", "mlx"], "taskSupport": ["txt2video"], "sizeGb": 19.0, + "runtimeFootprintGb": 27.0, "recommendedResolution": "768x512", "defaultDurationSeconds": 4.0, "note": "LTX-2.3 distilled — refreshed fast preview path with sharper texture detail vs LTX-2. Use the dev variant for final fidelity.", @@ -178,11 +186,13 @@ "name": "LTX-2.3 · dev (MLX)", "provider": "Lightricks · prince-canuma", "repo": "prince-canuma/LTX-2.3-dev", + "textEncoderRepo": "prince-canuma/LTX-2-distilled", "link": "https://huggingface.co/prince-canuma/LTX-2.3-dev", "runtime": "mlx-video (MLX native)", "styleTags": ["general", "quality", "motion", "mlx"], "taskSupport": ["txt2video"], "sizeGb": 19.0, + "runtimeFootprintGb": 27.0, "recommendedResolution": "768x512", "defaultDurationSeconds": 4.0, "note": "LTX-2.3 dev — quality tier; full sampler steps for best output. Apple Silicon native via MLX. Install mlx-video from Setup → GPU runtime bundle to enable.", @@ -222,6 +232,7 @@ # Resident peak ~14 GB during text encoding (UMT5-XXL bf16); # drops to ~4 GB during diffusion when encoder is freed. "runtimeFootprintGb": 14.0, + "runtimeFootprintMpsGb": 23.0, "recommendedResolution": "832x480", "defaultDurationSeconds": 4.0, "note": "1.3B transformer + UMT5 text encoder. ~16GB on disk. Best starter pick for trying local video end-to-end on modest hardware.", @@ -267,9 +278,10 @@ # ~0.9 GB GGUF transformer + ~14 GB shared UMT5-XXL/VAE base. "sizeGb": 14.9, "runtimeFootprintGb": 12.5, # Q4_K_M trans (~0.9 GB) + UMT5 (~11 GB) + "runtimeFootprintMpsGb": 21.5, "recommendedResolution": "832x480", "defaultDurationSeconds": 4.0, - "note": "Q4_K_M — smallest quantized 1.3B; runs in <8 GB unified memory once base is cached.", + "note": "Q4_K_M — smallest quantized 1.3B. 
The transformer is tiny, but UMT5/VAE keep the full runtime envelope in the 12-23 GB range depending on device/offload.", "estimatedGenerationSeconds": 70.0, "availableLocally": False, "releaseDate": "2025-03", @@ -287,9 +299,11 @@ "styleTags": ["general", "fast", "small", "gguf"], "taskSupport": ["txt2video"], "sizeGb": 15.2, + "runtimeFootprintGb": 13.2, + "runtimeFootprintMpsGb": 22.0, "recommendedResolution": "832x480", "defaultDurationSeconds": 4.0, - "note": "Q6_K — mid-point between Q4 footprint and Q8 fidelity.", + "note": "Q6_K — mid-point between Q4 footprint and Q8 fidelity; still carries the shared UMT5/VAE runtime overhead.", "estimatedGenerationSeconds": 68.0, "availableLocally": False, "releaseDate": "2025-03", @@ -307,9 +321,11 @@ "styleTags": ["general", "quality", "small", "gguf"], "taskSupport": ["txt2video"], "sizeGb": 15.5, + "runtimeFootprintGb": 13.8, + "runtimeFootprintMpsGb": 22.5, "recommendedResolution": "832x480", "defaultDurationSeconds": 4.0, - "note": "Q8_0 — near-bf16 quality at roughly half the transformer footprint.", + "note": "Q8_0 — near-bf16 quality at roughly half the transformer footprint; shared UMT5/VAE still dominate peak RAM/VRAM.", "estimatedGenerationSeconds": 65.0, "availableLocally": False, "releaseDate": "2025-03", @@ -329,6 +345,8 @@ # ~7 GB GGUF transformer + ~14 GB shared UMT5-XXL/VAE — fits # comfortably on a 24 GB RTX 4090 with VAE headroom. "sizeGb": 21.0, + "runtimeFootprintGb": 18.0, + "runtimeFootprintMpsGb": 27.0, "recommendedResolution": "832x480", "defaultDurationSeconds": 5.0, "note": "Q4_K_M — unlocks Wan 2.1 14B on 24 GB VRAM (RTX 4090) without bnb.", @@ -349,6 +367,8 @@ "styleTags": ["general", "quality", "motion", "gguf"], "taskSupport": ["txt2video"], "sizeGb": 24.0, + "runtimeFootprintGb": 21.0, + "runtimeFootprintMpsGb": 30.0, "recommendedResolution": "832x480", "defaultDurationSeconds": 5.0, "note": "Q6_K — mid-point between Q4 footprint and Q8 fidelity.", @@ -369,6 +389,8 @@ "styleTags": ["general", "quality", "motion", "gguf"], "taskSupport": ["txt2video"], "sizeGb": 28.0, + "runtimeFootprintGb": 25.0, + "runtimeFootprintMpsGb": 34.0, "recommendedResolution": "832x480", "defaultDurationSeconds": 5.0, "note": "Q8_0 — near-bf16 quality at roughly half the transformer footprint.", @@ -415,6 +437,7 @@ # over-estimates resident because the repo carries duplicate # sharded safetensors + tokenizer caches. "runtimeFootprintGb": 22.0, + "runtimeFootprintMpsGb": 24.0, "recommendedResolution": "832x480", "defaultDurationSeconds": 5.0, "note": "Best Wan 2.2 pick for consumer hardware. 24 GB on disk, runs on a 24 GB GPU or a 32 GB+ Mac.", @@ -440,6 +463,7 @@ "sizeGb": 17.5, # GGUF Q4_K_M trans (~3.5 GB) + UMT5-XXL during encode (~11 GB). "runtimeFootprintGb": 14.5, + "runtimeFootprintMpsGb": 22.0, "recommendedResolution": "832x480", "defaultDurationSeconds": 5.0, "note": "Q4_K_M — smallest Wan 2.2 that still generates usable quality. 
Best fit for 16 GB unified memory.", @@ -461,6 +485,7 @@ "taskSupport": ["txt2video"], "sizeGb": 18.2, "runtimeFootprintGb": 16.5, # Q6_K trans ~5 GB + UMT5 ~11 GB + "runtimeFootprintMpsGb": 24.0, "recommendedResolution": "832x480", "defaultDurationSeconds": 5.0, "note": "Q6_K — mid-point between Q4 footprint and Q8 fidelity.", @@ -482,6 +507,7 @@ "taskSupport": ["txt2video"], "sizeGb": 19.0, "runtimeFootprintGb": 18.0, # Q8 trans ~7 GB + UMT5 ~11 GB + "runtimeFootprintMpsGb": 26.0, "recommendedResolution": "832x480", "defaultDurationSeconds": 5.0, "note": "Q8_0 — near-bf16 quality at roughly half the transformer footprint.", @@ -518,6 +544,7 @@ # bogus "needs 176 GB" warning, but the note flags that the # offload mode is required. "runtimeFootprintGb": 30.0, + "runtimeFootprintMpsGb": 36.0, "recommendedResolution": "832x480", "defaultDurationSeconds": 5.0, "note": ( @@ -591,9 +618,10 @@ "styleTags": ["general", "motion", "balanced"], "taskSupport": ["txt2video"], "sizeGb": 10.0, + "runtimeFootprintGb": 22.0, "recommendedResolution": "848x480", "defaultDurationSeconds": 5.4, - "note": "Apache 2.0, balanced footprint, strong motion quality.", + "note": "Apache 2.0, balanced footprint, strong motion quality. Diffusers' bf16/offload path lands around a 22 GB runtime envelope.", "estimatedGenerationSeconds": 150.0, "availableLocally": False, "releaseDate": "2024-10", @@ -629,9 +657,10 @@ # CPU-offload tricks. Smaller than Wan 2.1 1.3B because there's # no UMT5-XXL — just the standard T5. "sizeGb": 9.0, + "runtimeFootprintGb": 19.0, "recommendedResolution": "720x480", "defaultDurationSeconds": 6.0, - "note": "Smallest CogVideoX. Apache 2.0 weights, ~9 GB on disk, runs on consumer GPUs.", + "note": "Smallest CogVideoX. Apache 2.0 weights, ~9 GB on disk; runtime peak is closer to 19 GB without the most aggressive offload/tiling.", "estimatedGenerationSeconds": 90.0, "availableLocally": False, "releaseDate": "2024-08", @@ -650,9 +679,10 @@ # same envelope as Wan 2.2 — needs 24 GB VRAM or 32 GB+ # unified memory. "sizeGb": 18.0, + "runtimeFootprintGb": 33.0, "recommendedResolution": "720x480", "defaultDurationSeconds": 6.0, - "note": "Quality tier. ~18 GB on disk. Same CogVideoXPipeline class as the 2B.", + "note": "Quality tier. 
~18 GB on disk; budget for a 32 GB-class runtime envelope unless aggressive offload is enabled.", "estimatedGenerationSeconds": 200.0, "availableLocally": False, "releaseDate": "2024-08", diff --git a/backend_service/helpers/discovery.py b/backend_service/helpers/discovery.py index 49519cf..676e5c1 100644 --- a/backend_service/helpers/discovery.py +++ b/backend_service/helpers/discovery.py @@ -46,7 +46,7 @@ def _path_size_bytes(path: Path, *, seen: set[tuple[int, int]] | None = None) -> with iterator as entries: for entry in entries: try: - entry_stat = entry.stat(follow_symlinks=False) + entry_stat = entry.stat(follow_symlinks=True) except OSError: continue entry_id = (entry_stat.st_dev, entry_stat.st_ino) @@ -54,7 +54,7 @@ def _path_size_bytes(path: Path, *, seen: set[tuple[int, int]] | None = None) -> continue visited.add(entry_id) try: - is_dir = entry.is_dir(follow_symlinks=False) + is_dir = entry.is_dir(follow_symlinks=True) except OSError: is_dir = False if is_dir: @@ -324,6 +324,7 @@ def _detect_model_quantization(path: Path, fmt: str, *, name_hint: str = "") -> "stable-diffusion", "sdxl", "flux.", "flux1", "flux-", "dall-e", "imagen", "kandinsky", "wuerstchen", "diffusion-pipe", "qwen-image", "qwen/qwen-image", + "sana_sprint", "sana-sprint", "sana sprint", "sana_1600m", "sana-1600m", ) @@ -348,6 +349,7 @@ def _detect_model_quantization(path: Path, fmt: str, *, name_hint: str = "") -> "mochi-1", "cogvideo", "ltx-video", + "ltx-2", "zeroscope", "animatediff", ) diff --git a/backend_service/helpers/huggingface.py b/backend_service/helpers/huggingface.py index b4c192b..8c379ce 100644 --- a/backend_service/helpers/huggingface.py +++ b/backend_service/helpers/huggingface.py @@ -7,6 +7,7 @@ import urllib.error import urllib.parse import urllib.request +from hashlib import sha256 from datetime import datetime, timezone from pathlib import Path from typing import Any @@ -17,7 +18,7 @@ _HF_REPO_PATTERN = re.compile(r"^[a-zA-Z0-9_.\-]+/[a-zA-Z0-9_.\-]+$") -_HUB_FILE_CACHE: dict[str, dict[str, Any]] = {} +_HUB_FILE_CACHE: dict[tuple[str, str], dict[str, Any]] = {} _DISCOVER_SEARCH_PUNCT_RE = re.compile(r"[^a-z0-9]+") _DISCOVER_SEARCH_ALPHA_NUM_RE = re.compile(r"([a-z])(\d)|(\d)([a-z])") _TEXT_DISCOVER_PIPELINES = { @@ -30,6 +31,21 @@ _HF_QUERY_URL_HOSTS = {"huggingface.co", "www.huggingface.co", "hf.co", "www.hf.co"} +def _hf_token_value() -> str: + return str(os.environ.get("HF_TOKEN") or os.environ.get("HUGGING_FACE_HUB_TOKEN") or "").strip() + + +def _hf_token_cache_key() -> str: + token = _hf_token_value() + if not token: + return "anonymous" + return f"token:{sha256(token.encode('utf-8')).hexdigest()[:16]}" + + +def _clear_huggingface_caches() -> None: + _HUB_FILE_CACHE.clear() + + def _extract_hf_repo_id_from_query(value: str) -> str | None: text = str(value or "").strip() if not text: @@ -122,6 +138,9 @@ def _search_huggingface_hub(query: str, library: list[dict[str, Any]], limit: in }) url = f"https://huggingface.co/api/models?{params}" req = urllib.request.Request(url, headers={"User-Agent": "ChaosEngineAI/0.2.0"}) + token = _hf_token_value() + if token: + req.add_header("Authorization", f"Bearer {token}") with urllib.request.urlopen(req, timeout=8) as resp: data = json.loads(resp.read().decode()) except Exception: @@ -246,11 +265,12 @@ def _hub_repo_files(repo_id: str) -> dict[str, Any]: HUGGING_FACE_HUB_TOKEN for gated repos and degrades to a non-fatal warning on transient upstream 5xx errors. 
""" - cached = _HUB_FILE_CACHE.get(repo_id) + cache_key = (repo_id, _hf_token_cache_key()) + cached = _HUB_FILE_CACHE.get(cache_key) if cached is not None: return cached - token = os.environ.get("HF_TOKEN") or os.environ.get("HUGGING_FACE_HUB_TOKEN") + token = _hf_token_value() try: encoded_repo = urllib.parse.quote(repo_id, safe="/") url = f"https://huggingface.co/api/models/{encoded_repo}?blobs=true" @@ -326,7 +346,7 @@ def _hub_repo_files(repo_id: str) -> dict[str, Any]: pipeline_tag=data.get("pipeline_tag"), last_modified=data.get("lastModified"), ) - _HUB_FILE_CACHE[repo_id] = payload + _HUB_FILE_CACHE[cache_key] = payload return payload @@ -509,7 +529,7 @@ def _hf_repo_snapshot_dir(repo_id: str) -> Path | None: def _known_repo_size_gb(repo_id: str) -> float | None: - cached = _HUB_FILE_CACHE.get(repo_id) + cached = _HUB_FILE_CACHE.get((repo_id, _hf_token_cache_key())) if cached is not None: cached_total = cached.get("totalSizeGb") if isinstance(cached_total, (int, float)) and cached_total > 0: diff --git a/backend_service/helpers/images.py b/backend_service/helpers/images.py index b58f064..51fcd7d 100644 --- a/backend_service/helpers/images.py +++ b/backend_service/helpers/images.py @@ -21,15 +21,17 @@ _format_release_label, _hf_number_label, _hf_repo_snapshot_dir, + _hf_token_cache_key, + _hf_token_value, _parse_iso_datetime, ) from backend_service.helpers.discovery import _candidate_model_dirs, _path_size_bytes from backend_service.image_runtime import validate_local_diffusers_snapshot -_IMAGE_DISCOVER_METADATA_CACHE: dict[str, tuple[float, dict[str, Any]]] = {} +_IMAGE_DISCOVER_METADATA_CACHE: dict[tuple[str, str], tuple[float, dict[str, Any]]] = {} _IMAGE_DISCOVER_METADATA_TTL_SECONDS = 6 * 60 * 60 -_LATEST_IMAGE_MODELS_CACHE: tuple[float, list[dict[str, Any]]] | None = None +_LATEST_IMAGE_MODELS_CACHE: tuple[float, str, list[dict[str, Any]]] | None = None _LATEST_IMAGE_MODELS_TTL_SECONDS = 3 * 60 * 60 # Cache keyed by (path, mtime_ns) — we recompute only when the snapshot dir @@ -37,6 +39,47 @@ _SNAPSHOT_SIZE_CACHE: dict[tuple[str, int], int] = {} +def _positive_float(value: Any) -> float | None: + try: + parsed = float(value) + except (TypeError, ValueError): + return None + if parsed > 0: + return parsed + return None + + +def _positive_int(value: Any) -> int | None: + try: + parsed = int(value) + except (TypeError, ValueError): + return None + if parsed > 0: + return parsed + return None + + +def _image_seed_size_metadata(seed: dict[str, Any]) -> tuple[float, float | None, float | None]: + catalog_size_gb = _positive_float(seed.get("sizeGb")) + core_weights_gb = _positive_float(seed.get("coreWeightsGb")) or catalog_size_gb + repo_size_gb = _positive_float(seed.get("repoSizeGb")) + size_gb = core_weights_gb or repo_size_gb or catalog_size_gb or 0.0 + return float(size_gb), core_weights_gb, repo_size_gb + + +def _tracked_seed_for_repo(repo_id: str) -> dict[str, Any] | None: + for seed in LATEST_IMAGE_TRACKED_SEEDS: + if str(seed.get("repo") or "") == repo_id: + return seed + return None + + +def _clear_image_discover_caches() -> None: + global _LATEST_IMAGE_MODELS_CACHE + _IMAGE_DISCOVER_METADATA_CACHE.clear() + _LATEST_IMAGE_MODELS_CACHE = None + + def _snapshot_on_disk_bytes(snapshot_dir: Path | None) -> int | None: """Walk the HF snapshot dir and return its true on-disk byte size. 
@@ -166,12 +209,19 @@ def _find_image_variant(model_id: str) -> dict[str, Any] | None: for seed in LATEST_IMAGE_TRACKED_SEEDS: repo = str(seed.get("repo") or "") if repo == model_id: + size_gb, core_weights_gb, repo_size_gb = _image_seed_size_metadata(seed) return { "id": repo, "repo": repo, "name": seed.get("name") or repo.split("/", 1)[-1], "provider": seed.get("provider") or "Community", - "sizeGb": seed.get("sizeGb") or 0, + "sizeGb": size_gb, + "runtimeFootprintGb": seed.get("runtimeFootprintGb"), + "runtimeFootprintMpsGb": seed.get("runtimeFootprintMpsGb"), + "runtimeFootprintCudaGb": seed.get("runtimeFootprintCudaGb"), + "runtimeFootprintCpuGb": seed.get("runtimeFootprintCpuGb"), + "coreWeightsGb": core_weights_gb, + "repoSizeGb": repo_size_gb, "styleTags": list(seed.get("styleTags") or []), "taskSupport": list(seed.get("taskSupport") or ["txt2img"]), "recommendedResolution": seed.get("recommendedResolution") or "1024x1024", @@ -188,12 +238,19 @@ def _find_image_variant_by_repo(repo: str) -> dict[str, Any] | None: for seed in LATEST_IMAGE_TRACKED_SEEDS: seed_repo = str(seed.get("repo") or "") if seed_repo == repo: + size_gb, core_weights_gb, repo_size_gb = _image_seed_size_metadata(seed) return { "id": seed_repo, "repo": seed_repo, "name": seed.get("name") or seed_repo.split("/", 1)[-1], "provider": seed.get("provider") or "Community", - "sizeGb": seed.get("sizeGb") or 0, + "sizeGb": size_gb, + "runtimeFootprintGb": seed.get("runtimeFootprintGb"), + "runtimeFootprintMpsGb": seed.get("runtimeFootprintMpsGb"), + "runtimeFootprintCudaGb": seed.get("runtimeFootprintCudaGb"), + "runtimeFootprintCpuGb": seed.get("runtimeFootprintCpuGb"), + "coreWeightsGb": core_weights_gb, + "repoSizeGb": repo_size_gb, "styleTags": list(seed.get("styleTags") or []), "taskSupport": list(seed.get("taskSupport") or ["txt2img"]), "recommendedResolution": seed.get("recommendedResolution") or "1024x1024", @@ -203,13 +260,14 @@ def _find_image_variant_by_repo(repo: str) -> dict[str, Any] | None: def _image_repo_live_metadata(repo_id: str) -> dict[str, Any]: now = time.time() - cached = _IMAGE_DISCOVER_METADATA_CACHE.get(repo_id) + cache_key = (repo_id, _hf_token_cache_key()) + cached = _IMAGE_DISCOVER_METADATA_CACHE.get(cache_key) if cached is not None: cached_at, payload = cached if (now - cached_at) < _IMAGE_DISCOVER_METADATA_TTL_SECONDS: return payload - token = os.environ.get("HF_TOKEN") or os.environ.get("HUGGING_FACE_HUB_TOKEN") + token = _hf_token_value() payload: dict[str, Any] try: encoded_repo = urllib.parse.quote(repo_id, safe="/") @@ -222,6 +280,7 @@ def _image_repo_live_metadata(repo_id: str) -> dict[str, Any]: total_bytes = 0 weight_bytes = 0 + used_storage_bytes = _positive_int(data.get("usedStorage")) for sibling in data.get("siblings") or []: if not isinstance(sibling, dict): continue @@ -229,14 +288,12 @@ def _image_repo_live_metadata(repo_id: str) -> dict[str, Any]: if not path: continue lfs = sibling.get("lfs") if isinstance(sibling.get("lfs"), dict) else {} - size_bytes = sibling.get("size") or lfs.get("size") or 0 - try: - size_int = int(size_bytes) - except (TypeError, ValueError): - size_int = 0 + size_int = _positive_int(sibling.get("size")) or _positive_int(lfs.get("size")) or 0 total_bytes += size_int if _classify_hub_file(path) == "weight": weight_bytes += size_int + if total_bytes <= 0 and used_storage_bytes is not None: + total_bytes = used_storage_bytes card = data.get("cardData") or {} license_value = str(card.get("license") or "").strip() or None if isinstance(card, dict) else 
None @@ -276,7 +333,7 @@ def _image_repo_live_metadata(repo_id: str) -> dict[str, Any]: "metadataWarning": "Live Hugging Face metadata is temporarily unavailable. Showing curated defaults.", } - _IMAGE_DISCOVER_METADATA_CACHE[repo_id] = (now, payload) + _IMAGE_DISCOVER_METADATA_CACHE[cache_key] = (now, payload) return payload @@ -365,6 +422,7 @@ def _tracked_latest_seed_payloads(library: list[dict[str, Any]]) -> list[dict[st release_date = str(seed.get("releaseDate") or "").strip() or None snapshot_dir = _hf_repo_snapshot_dir(repo_id) on_disk_bytes = _snapshot_on_disk_bytes(snapshot_dir) + size_gb, core_weights_gb, repo_size_gb = _image_seed_size_metadata(seed) payloads.append( { "id": repo_id, @@ -377,7 +435,11 @@ def _tracked_latest_seed_payloads(library: list[dict[str, Any]]) -> list[dict[st "runtime": "Tracked diffusers candidate", "styleTags": list(seed.get("styleTags") or []), "taskSupport": list(seed.get("taskSupport") or ["txt2img"]), - "sizeGb": float(seed.get("sizeGb") or 0.0), + "sizeGb": size_gb, + "runtimeFootprintGb": seed.get("runtimeFootprintGb"), + "runtimeFootprintMpsGb": seed.get("runtimeFootprintMpsGb"), + "runtimeFootprintCudaGb": seed.get("runtimeFootprintCudaGb"), + "runtimeFootprintCpuGb": seed.get("runtimeFootprintCpuGb"), "recommendedResolution": str(seed.get("recommendedResolution") or "Unknown"), "note": str( seed.get("note") @@ -402,9 +464,9 @@ def _tracked_latest_seed_payloads(library: list[dict[str, Any]]) -> list[dict[st "gated": seed.get("gated"), "pipelineTag": seed.get("pipelineTag"), "repoSizeBytes": None, - "repoSizeGb": None, + "repoSizeGb": repo_size_gb, "coreWeightsBytes": None, - "coreWeightsGb": None, + "coreWeightsGb": core_weights_gb, "metadataWarning": "Showing ChaosEngineAI tracked latest defaults until live Hugging Face metadata is available.", "source": "latest", } @@ -419,11 +481,15 @@ def _is_latest_image_candidate(model: dict[str, Any], curated_repos: set[str]) - lowered = model_id.lower() excluded_fragments = ( "-lora", + "_lora", + "lora-", "controlnet", "ip-adapter", + "adapter", "tensorrt", "_amdgpu", "onnx", + "embedding", "instruct-pix2pix", ) if any(fragment in lowered for fragment in excluded_fragments): @@ -431,19 +497,44 @@ def _is_latest_image_candidate(model: dict[str, Any], curated_repos: set[str]) - tags = {str(tag).lower() for tag in (model.get("tags") or [])} pipeline_tag = str(model.get("pipeline_tag") or "").lower() - allowed_orgs = { + excluded_tags = { + "lora", + "controlnet", + "adapter", + "adapters", + "textual-inversion", + "embedding", + "embeddings", + "onnx", + } + if tags & excluded_tags: + return False + + trusted_providers = { "black-forest-labs", + "baidu", "stabilityai", "qwen", "hidream-ai", "zai-org", + "tongyi-mai", + "nucleusai", "efficient-large-model", "hunyuanvideo-community", "tencent-hunyuan", "thudm", + "diffusers", } provider = model_id.split("/", 1)[0].lower() if "/" in model_id else "" - if provider and provider not in allowed_orgs: + try: + downloads = int(model.get("downloads") or 0) + except (TypeError, ValueError): + downloads = 0 + try: + likes = int(model.get("likes") or 0) + except (TypeError, ValueError): + likes = 0 + if provider and provider not in trusted_providers and downloads < 1000 and likes < 25: return False if "diffusers" not in tags: @@ -467,9 +558,14 @@ def _latest_image_model_payloads(library: list[dict[str, Any]], limit: int = 10) } now = time.time() + token_cache_key = _hf_token_cache_key() cached_entries = _LATEST_IMAGE_MODELS_CACHE - if cached_entries is not None and 
(now - cached_entries[0]) < _LATEST_IMAGE_MODELS_TTL_SECONDS: - latest = cached_entries[1] + if ( + cached_entries is not None + and cached_entries[1] == token_cache_key + and (now - cached_entries[0]) < _LATEST_IMAGE_MODELS_TTL_SECONDS + ): + latest = cached_entries[2] return [ { **entry, @@ -481,18 +577,21 @@ def _latest_image_model_payloads(library: list[dict[str, Any]], limit: int = 10) try: params = urllib.parse.urlencode({ "filter": "diffusers", - "sort": "modified", + "sort": "createdAt", "direction": "-1", - "limit": "48", + "limit": "96", "full": "true", }) url = f"https://huggingface.co/api/models?{params}" req = urllib.request.Request(url, headers={"User-Agent": "ChaosEngineAI/0.2.0"}) + token = _hf_token_value() + if token: + req.add_header("Authorization", f"Bearer {token}") with urllib.request.urlopen(req, timeout=8) as resp: data = json.loads(resp.read().decode()) except Exception: - if cached_entries is not None: - latest = cached_entries[1] + if cached_entries is not None and cached_entries[1] == token_cache_key: + latest = cached_entries[2] return [ { **entry, @@ -502,10 +601,16 @@ def _latest_image_model_payloads(library: list[dict[str, Any]], limit: int = 10) ] return _tracked_latest_seed_payloads(library)[:limit] - candidates: list[dict[str, Any]] = [] + accepted_models: list[dict[str, Any]] = [] for model in data: if not isinstance(model, dict) or not _is_latest_image_candidate(model, curated_repos): continue + accepted_models.append(model) + if len(accepted_models) >= max(limit * 2, limit): + break + + candidates: list[dict[str, Any]] = [] + for model in accepted_models: model_id = str(model.get("id") or "") provider = model_id.split("/", 1)[0] if "/" in model_id else "Community" tags = [str(tag) for tag in (model.get("tags") or [])] @@ -513,6 +618,22 @@ def _latest_image_model_payloads(library: list[dict[str, Any]], limit: int = 10) metadata = _image_repo_live_metadata(model_id) snapshot_dir = _hf_repo_snapshot_dir(model_id) on_disk_bytes = _snapshot_on_disk_bytes(snapshot_dir) + on_disk_gb = _bytes_to_gb(on_disk_bytes) if on_disk_bytes else None + tracked_seed = _tracked_seed_for_repo(model_id) + fallback_size_gb, fallback_core_weights_gb, fallback_repo_size_gb = ( + _image_seed_size_metadata(tracked_seed) + if tracked_seed is not None + else (0.0, None, None) + ) + core_weights_gb = _positive_float(metadata.get("coreWeightsGb")) or fallback_core_weights_gb + repo_size_gb = _positive_float(metadata.get("repoSizeGb")) or fallback_repo_size_gb + size_gb = ( + _positive_float(metadata.get("coreWeightsGb")) + or _positive_float(metadata.get("repoSizeGb")) + or _positive_float(on_disk_gb) + or _positive_float(fallback_size_gb) + or 0.0 + ) candidates.append({ "id": model_id, "familyId": "latest", @@ -524,7 +645,7 @@ def _latest_image_model_payloads(library: list[dict[str, Any]], limit: int = 10) "runtime": "Diffusers candidate", "styleTags": _image_discover_style_tags(tags), "taskSupport": _image_task_support_from_metadata(pipeline_tag, tags), - "sizeGb": float(metadata.get("coreWeightsGb") or metadata.get("repoSizeGb") or 0.0), + "sizeGb": size_gb, "recommendedResolution": _image_recommended_resolution(model_id, pipeline_tag, tags), "note": ( "Latest official diffusers-compatible image model tracked by ChaosEngineAI. 
" @@ -534,7 +655,7 @@ def _latest_image_model_payloads(library: list[dict[str, Any]], limit: int = 10) "hasLocalData": snapshot_dir is not None, "localPath": str(snapshot_dir) if snapshot_dir else None, "onDiskBytes": on_disk_bytes, - "onDiskGb": _bytes_to_gb(on_disk_bytes) if on_disk_bytes else None, + "onDiskGb": on_disk_gb, "estimatedGenerationSeconds": None, "downloads": metadata.get("downloads"), "likes": metadata.get("likes"), @@ -548,9 +669,9 @@ def _latest_image_model_payloads(library: list[dict[str, Any]], limit: int = 10) "gated": bool(metadata.get("gated")) if metadata.get("gated") is not None else None, "pipelineTag": metadata.get("pipelineTag") or pipeline_tag, "repoSizeBytes": metadata.get("repoSizeBytes"), - "repoSizeGb": metadata.get("repoSizeGb"), + "repoSizeGb": repo_size_gb, "coreWeightsBytes": metadata.get("coreWeightsBytes"), - "coreWeightsGb": metadata.get("coreWeightsGb"), + "coreWeightsGb": core_weights_gb, "metadataWarning": metadata.get("metadataWarning"), "source": "latest", }) @@ -572,7 +693,7 @@ def _latest_image_model_payloads(library: list[dict[str, Any]], limit: int = 10) seen_repos.add(repo_id) latest = candidates[:limit] - _LATEST_IMAGE_MODELS_CACHE = (now, latest) + _LATEST_IMAGE_MODELS_CACHE = (now, token_cache_key, latest) return latest @@ -662,7 +783,7 @@ def _image_download_repo_ids() -> set[str]: if cached_entries is not None: repos.update( str(entry.get("repo") or "") - for entry in cached_entries[1] + for entry in cached_entries[2] if str(entry.get("repo") or "") ) return repos diff --git a/backend_service/helpers/persistence.py b/backend_service/helpers/persistence.py index 86322c2..b8f3d75 100644 --- a/backend_service/helpers/persistence.py +++ b/backend_service/helpers/persistence.py @@ -11,7 +11,7 @@ LEGACY_SEEDED_CHAT_IDS = {"ui-direction", "model-shortlist"} LEGACY_SEEDED_BENCHMARK_IDS = {"baseline", "native-34", "native-36", "native-44"} -LIBRARY_CACHE_VERSION = 1 +LIBRARY_CACHE_VERSION = 3 def _default_chat_variant() -> dict[str, Any]: diff --git a/backend_service/helpers/system.py b/backend_service/helpers/system.py index b3a5584..fad84ce 100644 --- a/backend_service/helpers/system.py +++ b/backend_service/helpers/system.py @@ -378,9 +378,23 @@ def _list_llm_processes(limit: int = 12) -> list[dict[str, Any]]: return matches[:limit] -def _build_system_snapshot(app_version: str, app_started_at: float) -> dict[str, Any]: - from backend_service.inference import get_backend_capabilities - native = get_backend_capabilities().to_dict() +def _capabilities_payload(capabilities: Any | None = None) -> dict[str, Any]: + if capabilities is None: + from backend_service.inference import get_backend_capabilities + return get_backend_capabilities().to_dict() + to_dict = getattr(capabilities, "to_dict", None) + if callable(to_dict): + return dict(to_dict()) + return dict(capabilities) + + +def _build_system_snapshot( + app_version: str, + app_started_at: float, + *, + capabilities: Any | None = None, +) -> dict[str, Any]: + native = _capabilities_payload(capabilities) memory = psutil.virtual_memory() try: swap = psutil.swap_memory() diff --git a/backend_service/helpers/video.py b/backend_service/helpers/video.py index d0409ab..d5b6684 100644 --- a/backend_service/helpers/video.py +++ b/backend_service/helpers/video.py @@ -67,8 +67,27 @@ def _video_model_payloads(library: list[dict[str, Any]]) -> list[dict[str, Any]] # Merge live metadata first so curated fields (releaseDate, # familyName) still win when both exist. 
enriched = {**enriched, **live_metadata} - enriched["availableLocally"] = _video_repo_runtime_ready(repo) if repo else False - enriched["hasLocalData"] = enriched["availableLocally"] or _video_repo_has_any_local_data(repo) + validation_error = _video_variant_validation_error(enriched) + local_data_repos = _video_variant_local_data_repos(enriched) + enriched["availableLocally"] = validation_error is None + enriched["hasLocalData"] = ( + enriched["availableLocally"] + or bool(local_data_repos) + ) + primary_local_repo = ( + repo + if repo and repo in local_data_repos + else local_data_repos[0] + if local_data_repos + else None + ) + enriched["localDataRepos"] = local_data_repos + enriched["primaryLocalRepo"] = primary_local_repo + enriched["localStatusReason"] = ( + _video_variant_local_status_reason(enriched, validation_error) + if enriched["hasLocalData"] and validation_error + else None + ) enriched["familyName"] = family["name"] release_date = str(variant.get("releaseDate") or "").strip() or None enriched["releaseDate"] = release_date @@ -81,7 +100,11 @@ def _video_model_payloads(library: list[dict[str, Any]]) -> list[dict[str, Any]] # Absolute path to the HF snapshot, used by the Reveal File button. # Only populated when there is actually something on disk so the # UI can reliably hide the button otherwise. - snapshot_dir = _hf_repo_snapshot_dir(repo) if (enriched["hasLocalData"] and repo) else None + snapshot_dir = ( + _hf_repo_snapshot_dir(primary_local_repo) + if (enriched["hasLocalData"] and primary_local_repo) + else None + ) enriched["localPath"] = str(snapshot_dir) if snapshot_dir else None on_disk_bytes = _snapshot_on_disk_bytes(snapshot_dir) enriched["onDiskBytes"] = on_disk_bytes @@ -104,11 +127,20 @@ def _find_video_variant(model_id: str) -> dict[str, Any] | None: def _find_video_variant_by_repo(repo: str) -> dict[str, Any] | None: for family in VIDEO_MODEL_FAMILIES: for variant in family["variants"]: - if variant["repo"] == repo: + if repo in _video_variant_download_repos(variant): return variant return None +def _video_variant_download_repos(variant: dict[str, Any]) -> list[str]: + repos: list[str] = [] + for key in ("repo", "ggufRepo", "textEncoderRepo"): + repo = str(variant.get(key) or "").strip() + if repo and repo not in repos: + repos.append(repo) + return repos + + def _is_video_repo(repo_id: str) -> bool: return any( str(variant.get("repo") or "") == repo_id @@ -117,19 +149,23 @@ def _is_video_repo(repo_id: str) -> bool: ) +def _is_video_download_repo(repo_id: str) -> bool: + return repo_id in _video_download_repo_ids() + + def _video_repo_runtime_ready(repo_id: str) -> bool: """True if the local snapshot is complete enough to load. - Routes the validator by engine: mlx-video repos ship text_encoder / - tokenizer / transformer / vae folders without ``model_index.json``, - so the diffusers-shape check would always falsely fail for them. - Diffusers repos still go through ``validate_local_diffusers_snapshot``. + Routes the validator by engine: mlx-video repos ship component folders + without ``model_index.json``, so the diffusers-shape check would always + falsely fail for them. Diffusers repos still go through + ``validate_local_diffusers_snapshot``. 
""" snapshot_dir = _hf_repo_snapshot_dir(repo_id) if snapshot_dir is None: return False if _is_mlx_video_routed_repo(repo_id): - return _validate_mlx_video_snapshot(snapshot_dir) is None + return _validate_mlx_video_snapshot(snapshot_dir, repo_id) is None return validate_local_diffusers_snapshot(snapshot_dir, repo_id) is None @@ -155,20 +191,154 @@ def _video_repo_has_any_local_data(repo_id: str) -> bool: return False +def _video_variant_local_data_repos(variant: dict[str, Any]) -> list[str]: + return [ + repo + for repo in _video_variant_download_repos(variant) + if _video_repo_has_any_local_data(repo) + ] + + def _video_variant_available_locally(variant: dict[str, Any]) -> bool: + return _video_variant_validation_error(variant) is None + + +def _video_variant_has_any_local_data(variant: dict[str, Any]) -> bool: + return bool(_video_variant_local_data_repos(variant)) + + +def _video_variant_validation_error(variant: dict[str, Any]) -> str | None: repo = str(variant.get("repo") or "") if not repo: - return False - return _video_repo_runtime_ready(repo) + return "Video model variant is missing its base repo id." + repo_error = _video_download_validation_error(repo) + if repo_error: + return repo_error + text_error = _video_variant_mlx_text_components_validation_error(variant) + if text_error: + return text_error + return _video_variant_gguf_validation_error(variant) + + +def _video_variant_mlx_text_components_validation_error(variant: dict[str, Any]) -> str | None: + repo = str(variant.get("repo") or "") + if not _is_mlx_video_routed_repo(repo): + return None + snapshot_dir = _hf_repo_snapshot_dir(repo) + if snapshot_dir is None: + return None + missing = _missing_mlx_text_components(Path(snapshot_dir)) + if not missing: + return None + + text_encoder_repo = str(variant.get("textEncoderRepo") or "").strip() + if text_encoder_repo and text_encoder_repo != repo: + text_snapshot = _hf_repo_snapshot_dir(text_encoder_repo) + if text_snapshot is not None and not _missing_mlx_text_components(Path(text_snapshot)): + return None + return ( + "The local snapshot is missing shared mlx-video text components: " + f"{', '.join(missing)}. Download the shared text encoder " + f"({text_encoder_repo}) and retry." + ) + + return ( + "The local snapshot is incomplete. Missing mlx-video components: " + f"{', '.join(missing)}. Re-download the model and keep ChaosEngineAI " + "open until the download completes." + ) + + +def _video_variant_missing_text_encoder_repo(variant: dict[str, Any]) -> str | None: + error = _video_variant_mlx_text_components_validation_error(variant) + text_encoder_repo = str(variant.get("textEncoderRepo") or "").strip() + if error and text_encoder_repo: + return text_encoder_repo + return None + + +def _video_variant_local_status_reason( + variant: dict[str, Any], + validation_error: str | None, +) -> str | None: + if not validation_error: + return None + gguf_file = str(variant.get("ggufFile") or "").strip() + gguf_repo = str(variant.get("ggufRepo") or "").strip() + if gguf_file and gguf_repo and "GGUF transformer file is missing" in validation_error: + return f"Base model installed; missing GGUF transformer: {gguf_repo}/{gguf_file}." + + prefix = "The local snapshot is incomplete. Missing mlx-video components: " + if validation_error.startswith(prefix): + missing = validation_error[len(prefix):].split(". Re-download", 1)[0] + return f"Missing MLX components: {missing}." 
+ + shared_prefix = "The local snapshot is missing shared mlx-video text components: " + if validation_error.startswith(shared_prefix): + missing = validation_error[len(shared_prefix):].split(". Download", 1)[0] + text_encoder_repo = str(variant.get("textEncoderRepo") or "").strip() + source = f" from {text_encoder_repo}" if text_encoder_repo else "" + return f"Missing shared MLX text components{source}: {missing}." + + if validation_error.startswith("The selected GGUF transformer resolved to a cache path"): + return f"GGUF transformer cache path is invalid: {gguf_repo}/{gguf_file}." + + return validation_error + + +def _video_variant_gguf_validation_error(variant: dict[str, Any]) -> str | None: + gguf_file = str(variant.get("ggufFile") or "").strip() + if not gguf_file: + return None + gguf_repo = str(variant.get("ggufRepo") or "").strip() + if not gguf_repo: + return ( + f"{variant.get('name') or 'This GGUF video variant'} is missing " + "its GGUF repository metadata." + ) + try: + from huggingface_hub import hf_hub_download # type: ignore + + local_path = hf_hub_download( + repo_id=gguf_repo, + filename=gguf_file, + local_files_only=True, + ) + except Exception: + return ( + "The base diffusers snapshot is installed, but the selected GGUF " + f"transformer file is missing: {gguf_repo}/{gguf_file}. Download " + "the GGUF variant before generating so the app does not fall back " + "to the full BF16 transformer." + ) + if not Path(local_path).exists(): + return ( + "The selected GGUF transformer resolved to a cache path that does " + f"not exist: {gguf_repo}/{gguf_file}. Retry the GGUF download." + ) + return None def _video_download_repo_ids() -> set[str]: - return { + repos = { str(variant.get("repo") or "") for family in VIDEO_MODEL_FAMILIES for variant in family["variants"] if str(variant.get("repo") or "") } + repos.update( + str(variant.get("ggufRepo") or "") + for family in VIDEO_MODEL_FAMILIES + for variant in family["variants"] + if str(variant.get("ggufRepo") or "") + ) + repos.update( + str(variant.get("textEncoderRepo") or "") + for family in VIDEO_MODEL_FAMILIES + for variant in family["variants"] + if str(variant.get("textEncoderRepo") or "") + ) + return repos # Diffusers pipelines only need the standard per-component folders @@ -202,13 +372,23 @@ def _video_download_repo_ids() -> set[str]: _VIDEO_MLX_ALLOW_PATTERNS: list[str] = [ "text_encoder/**", "tokenizer/**", + "text_projections/**", + "audio_vae/**", "transformer/**", "vae/**", + "vocoder/**", "*spatial-upscaler*.safetensors", "*.md", "LICENSE*", ] +_VIDEO_MLX_TEXT_ENCODER_ALLOW_PATTERNS: list[str] = [ + "text_encoder/**", + "tokenizer/**", + "*.md", + "LICENSE*", +] + def _video_repo_allow_patterns(repo_id: str) -> list[str] | None: """Patterns to pass to ``snapshot_download`` for a video repo. @@ -236,11 +416,10 @@ def _video_download_validation_error(repo_id: str) -> str | None: "Retry the download and make sure the backend can access Hugging Face." ) # mlx-video routed repos (e.g. ``prince-canuma/LTX-2-*``) ship MLX - # layout — text_encoder / tokenizer / transformer / vae folders - # without ``model_index.json``. Don't apply the diffusers-shape - # validator to them; check for the MLX component folders instead. + # layouts without ``model_index.json``. Don't apply the diffusers-shape + # validator to them; check for the expected MLX component folders instead. 
if _is_mlx_video_routed_repo(repo_id): - return _validate_mlx_video_snapshot(snapshot_dir) + return _validate_mlx_video_snapshot(snapshot_dir, repo_id) return validate_local_diffusers_snapshot(snapshot_dir, repo_id) @@ -261,16 +440,54 @@ def _is_mlx_video_routed_repo(repo_id: str) -> bool: # diffusers layout — no model_index.json. Lifted from the ``prince-canuma/ # LTX-2-distilled`` repo tree as the canonical shape; bump as new mlx-video # families with different layouts come online. -_MLX_VIDEO_REQUIRED_COMPONENTS: tuple[str, ...] = ( +_MLX_VIDEO_LTX2_REQUIRED_COMPONENTS: tuple[str, ...] = ( "text_encoder", "tokenizer", + "text_projections", + "transformer", + "vae", +) + +_MLX_VIDEO_LTX23_REQUIRED_COMPONENTS: tuple[str, ...] = ( + "audio_vae", + "text_projections", "transformer", "vae", + "vocoder", ) -def _validate_mlx_video_snapshot(snapshot_dir: str) -> str | None: - """Return ``None`` if the snapshot has the four MLX component folders. +def _mlx_video_required_components(repo_id: str | None = None) -> tuple[str, ...]: + repo_key = str(repo_id or "").lower() + if "ltx-2.3" in repo_key: + return _MLX_VIDEO_LTX23_REQUIRED_COMPONENTS + return _MLX_VIDEO_LTX2_REQUIRED_COMPONENTS + + +def _missing_mlx_text_components(root: Path) -> list[str]: + missing: list[str] = [] + checks = { + "text_encoder": ( + root / "text_encoder" / "config.json", + root / "text_encoder" / "model.safetensors.index.json", + ), + "tokenizer": ( + root / "tokenizer" / "tokenizer.json", + root / "tokenizer" / "tokenizer.model", + ), + } + for component, required_paths in checks.items(): + component_dir = root / component + if not component_dir.is_dir(): + missing.append(component) + continue + if not all(path.exists() for path in required_paths): + missing.append(component) + return missing + + +def _validate_mlx_video_snapshot(snapshot_dir: str, repo_id: str | None = None) -> str | None: + """Return ``None`` if the snapshot has the required MLX component folders. Mirrors the contract of ``validate_local_diffusers_snapshot`` so the callers can swap one for the other without restructuring the result @@ -284,7 +501,7 @@ def _validate_mlx_video_snapshot(snapshot_dir: str) -> str | None: "Re-download the model." ) missing: list[str] = [] - for component in _MLX_VIDEO_REQUIRED_COMPONENTS: + for component in _mlx_video_required_components(repo_id): component_dir = root / component if not component_dir.is_dir(): missing.append(component) diff --git a/backend_service/image_runtime.py b/backend_service/image_runtime.py index c4f987b..5fd46ea 100644 --- a/backend_service/image_runtime.py +++ b/backend_service/image_runtime.py @@ -26,7 +26,6 @@ PHASE_LOADING, PHASE_SAVING, ) -from cache_compression import apply_diffusion_cache_strategy WORKSPACE_ROOT = Path(__file__).resolve().parents[1] @@ -660,6 +659,8 @@ def generate(self, config: ImageGenerationConfig) -> list[GeneratedImage]: # for this pipeline yet we swallow NotImplementedError and run # the stock pipeline — the UI surfaces the "Scaffold" badge so # users know why speedup didn't appear. 
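# (A hedged sketch of the contract assumed here, with the call shape
# illustrative rather than authoritative: the helper either patches the
# pipeline and returns a note for the UI, or raises NotImplementedError
# for pipelines it cannot wrap, roughly
#
#     try:
#         note = apply_diffusion_cache_strategy(pipeline, strategy_id=sid)
#     except NotImplementedError:
#         note = None   # stock pipeline; the Scaffold badge explains why
#
# and deferring the import below keeps ``cache_compression`` optional at
# module-import time, matching the top-level import removed above.)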
+ from cache_compression import apply_diffusion_cache_strategy + cache_note = apply_diffusion_cache_strategy( pipeline, strategy_id=config.cacheStrategy, diff --git a/backend_service/inference.py b/backend_service/inference.py index 423c0fe..ef8c321 100644 --- a/backend_service/inference.py +++ b/backend_service/inference.py @@ -593,6 +593,7 @@ class BackendCapabilities: converterAvailable: bool = False vllmAvailable: bool = False vllmVersion: str | None = None + probing: bool = False def to_dict(self) -> dict[str, Any]: return { @@ -610,6 +611,7 @@ def to_dict(self) -> dict[str, Any]: "converterAvailable": self.converterAvailable, "vllmAvailable": self.vllmAvailable, "vllmVersion": self.vllmVersion, + "probing": self.probing, } @@ -617,6 +619,35 @@ def to_dict(self) -> dict[str, Any]: _capability_lock = RLock() +def _initial_backend_capabilities() -> BackendCapabilities: + """Cheap capability placeholder used while the real probe runs. + + The full probe imports/spawns MLX and checks vLLM, which can add seconds + to cold start. These path checks are safe enough for initial UI rendering; + load_model() still refreshes capabilities synchronously before selecting + an engine. + """ + python_executable = _resolve_mlx_python() + llama_server_path = _resolve_llama_server() + llama_server_turbo_path = _resolve_llama_server_turbo() + llama_cli_path = _resolve_llama_cli() + return BackendCapabilities( + pythonExecutable=python_executable, + mlxAvailable=False, + mlxLmAvailable=False, + mlxUsable=False, + mlxMessage="Native backend detection is still running.", + ggufAvailable=bool(llama_server_path) or bool(llama_server_turbo_path), + llamaCliPath=llama_cli_path, + llamaServerPath=llama_server_path, + llamaServerTurboPath=llama_server_turbo_path, + converterAvailable=False, + vllmAvailable=False, + vllmVersion=None, + probing=True, + ) + + def _probe_native_backends() -> BackendCapabilities: python_executable = _resolve_mlx_python() llama_server_path = _resolve_llama_server() @@ -2165,10 +2196,16 @@ def stream_generate( class RuntimeController: + # Hard upper bound on the warm pool independently of memory accounting — + # if psutil isn't available we still want a sane cap. MAX_WARM_MODELS = 2 + # Reserve this much physical memory for the OS / UI / unrelated + # processes when deciding whether a new (or incoming) model fits. Mirrors + # the headroom used by ``helpers/system.py::spareHeadroomGb``. 
+ WARM_POOL_MEMORY_HEADROOM_BYTES = 6 * 1024 * 1024 * 1024 - def __init__(self) -> None: - self.capabilities = get_backend_capabilities() + def __init__(self, *, background_probe: bool = False) -> None: + self.capabilities = _initial_backend_capabilities() self.engine: BaseInferenceEngine = MockInferenceEngine(self.capabilities) self.loaded_model: LoadedModelInfo | None = None self.runtime_note: str | None = None @@ -2178,6 +2215,51 @@ def __init__(self) -> None: self._loading_progress: dict[str, Any] | None = None self._loading_log_tail: list[str] = [] self._recent_orphaned_workers: list[dict[str, Any]] = [] + self._capability_probe_thread: Thread | None = None + self._capability_probe_lock = Lock() + if background_probe: + self.start_capability_probe() + + def start_capability_probe(self, *, force: bool = False) -> None: + with self._capability_probe_lock: + if ( + self._capability_probe_thread is not None + and self._capability_probe_thread.is_alive() + and not force + ): + return + thread = Thread( + target=self._capability_probe_worker, + kwargs={"force": force}, + name="chaosengine-capability-probe", + daemon=True, + ) + self._capability_probe_thread = thread + thread.start() + + def _capability_probe_worker(self, *, force: bool = False) -> None: + try: + capabilities = get_backend_capabilities(force=force) + except Exception as exc: + current = self.capabilities + capabilities = BackendCapabilities( + pythonExecutable=current.pythonExecutable, + mlxAvailable=False, + mlxLmAvailable=False, + mlxUsable=False, + mlxMessage=f"Native backend detection failed: {type(exc).__name__}: {exc}", + ggufAvailable=current.ggufAvailable, + llamaCliPath=current.llamaCliPath, + llamaServerPath=current.llamaServerPath, + llamaServerTurboPath=current.llamaServerTurboPath, + converterAvailable=False, + vllmAvailable=False, + vllmVersion=None, + probing=False, + ) + self.capabilities = capabilities + if isinstance(self.engine, MockInferenceEngine): + self.engine.capabilities = capabilities @staticmethod def _warm_pool_key( @@ -2266,6 +2348,7 @@ def _park_active_engine_or_unload( *, requested_identity: str, keep_warm_previous: bool = True, + required_free_bytes: int = 0, ) -> None: if not self.loaded_model or not self.engine: return @@ -2284,7 +2367,19 @@ def _park_active_engine_or_unload( except Exception: pass return - self._evict_warm_pool() + active_bytes = max( + self._model_resident_bytes(self.loaded_model), + self._engine_resident_bytes(self.engine), + ) + self._evict_warm_pool( + incoming_bytes=active_bytes, + ) + if not self._can_keep_warm_model(active_bytes, required_free_bytes=required_free_bytes): + try: + self.engine.unload_model() + except Exception: + pass + return self._warm_pool[current_key] = (self.engine, self.loaded_model) def _tracked_process_pids(self) -> set[int]: @@ -2460,6 +2555,8 @@ def refresh_capabilities(self, *, force: bool = False) -> BackendCapabilities: _LLAMA_HELP_CACHE.clear() _CACHE_TYPE_CACHE.clear() self.capabilities = get_backend_capabilities(force=force) + if isinstance(self.engine, MockInferenceEngine): + self.engine.capabilities = self.capabilities return self.capabilities def _select_engine( @@ -2540,15 +2637,100 @@ def warm_models(self) -> list[dict[str, Any]]: result.append({**info.to_dict(), "warm": True, "active": False}) return result - def _evict_warm_pool(self) -> None: - """Remove the oldest entry from the warm pool if at capacity.""" + @staticmethod + def _model_resident_bytes(info: LoadedModelInfo) -> int: + """Best-effort estimate of RAM held by a 
loaded model. + + For local weights we use on-disk size as a proxy — mlx-lm mmaps the + weights so RSS tracks file size closely; for llama.cpp / GGUF the + whole file ends up resident once warm. For catalog/no-path entries + we fall back to 0 (no useful estimate, treat as memory-free). + """ + return _path_size_bytes(info.path) if info.path else 0 + + @staticmethod + def _target_resident_bytes(*, path: str | None, runtime_target: str | None) -> int: + for candidate in (path, runtime_target): + if not candidate: + continue + size = _path_size_bytes(candidate) + if size > 0: + return size + return 0 + + @staticmethod + def _engine_resident_bytes(engine: BaseInferenceEngine | None) -> int: + if engine is None: + return 0 + pid_getter = getattr(engine, "process_pid", None) + pid = pid_getter() if callable(pid_getter) else None + if not isinstance(pid, int): + return 0 + try: + import psutil + + return int(psutil.Process(pid).memory_info().rss) + except Exception: + return 0 + + def _warm_pool_resident_bytes(self) -> int: + return sum( + max(self._model_resident_bytes(info), self._engine_resident_bytes(engine)) + for engine, info in self._warm_pool.values() + ) + + def _memory_budget_bytes(self) -> int: + """Bytes available for warm-pool weights, after OS headroom. + + Returns 0 when psutil isn't usable; callers must fall back to the + count-based MAX_WARM_MODELS cap in that case. + """ + try: + import psutil + + available = int(psutil.virtual_memory().available) + except Exception: + return 0 + return max(0, available - self.WARM_POOL_MEMORY_HEADROOM_BYTES) + + def _pop_oldest_warm_entry(self) -> None: + if not self._warm_pool: + return + oldest_key = next(iter(self._warm_pool)) + old_engine, _ = self._warm_pool.pop(oldest_key) + try: + old_engine.unload_model() + except Exception: + pass + + def _can_keep_warm_model(self, incoming_bytes: int, *, required_free_bytes: int = 0) -> bool: + budget = self._memory_budget_bytes() + if budget <= 0: + return True + if required_free_bytes > budget: + return False + return self._warm_pool_resident_bytes() + incoming_bytes <= budget + + def _evict_warm_pool(self, *, incoming_bytes: int = 0) -> None: + """Make room for an incoming entry in the warm pool. + + First applies the count cap (MAX_WARM_MODELS) so a flapping budget + can never grow the pool unboundedly. Then, if ``psutil`` reports a + live memory budget, evicts oldest entries until the pool plus the + incoming model fits within ``available - headroom``. + + ``incoming_bytes`` is the resident-byte estimate for the model + about to enter the pool (typically the model being parked from + active to warm). Passing 0 still triggers the count cap. 
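+
+        Illustrative numbers: with ``MAX_WARM_MODELS = 2``, a pool holding
+        A (12 GB, oldest) and B (6 GB), a 20 GB budget, and 8 GB of
+        ``incoming_bytes``, the count cap evicts A first (the pool is at
+        capacity); 6 + 8 = 14 GB then fits the budget, so B survives.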
+ """ while len(self._warm_pool) >= self.MAX_WARM_MODELS: - oldest_key = next(iter(self._warm_pool)) - old_engine, _ = self._warm_pool.pop(oldest_key) - try: - old_engine.unload_model() - except Exception: - pass + self._pop_oldest_warm_entry() + + budget = self._memory_budget_bytes() + if budget <= 0: + return + while self._warm_pool and self._warm_pool_resident_bytes() + incoming_bytes > budget: + self._pop_oldest_warm_entry() def load_model( self, @@ -2598,6 +2780,10 @@ def _internal_progress(progress: dict[str, Any]) -> None: runtime_target=runtime_target, path=path, ) + incoming_load_bytes = self._target_resident_bytes( + path=path, + runtime_target=runtime_target, + ) # Check warm pool first — instant switch if the exact runtime profile is cached pool_key = self._warm_pool_key( @@ -2639,6 +2825,7 @@ def _internal_progress(progress: dict[str, Any]) -> None: self._park_active_engine_or_unload( requested_identity=requested_identity, keep_warm_previous=keep_warm_previous, + required_free_bytes=incoming_load_bytes, ) self.engine = selected_engine diff --git a/backend_service/mlx_video_runtime.py b/backend_service/mlx_video_runtime.py index b52abfb..346d170 100644 --- a/backend_service/mlx_video_runtime.py +++ b/backend_service/mlx_video_runtime.py @@ -88,6 +88,11 @@ ("Lightricks/LTX-2.3", "ltx-2.3-spatial-upscaler-x2-1.0.safetensors"), ), } +_LTX2_SHARED_TEXT_ENCODER_CANDIDATES: tuple[str, ...] = ( + "prince-canuma/LTX-2-distilled", + "Lightricks/LTX-2", +) +_LTX2_TEXT_COMPONENTS: tuple[str, ...] = ("text_encoder", "tokenizer") _LTX2_DISTILLED_STAGE_1_STEPS = 8 _LTX2_DISTILLED_STAGE_2_STEPS = 3 @@ -255,6 +260,86 @@ def _resolve_ltx2_spatial_upscaler( ) +def _resolve_local_snapshot(repo_or_path: str) -> Path | None: + candidate = Path(repo_or_path) + if candidate.exists(): + return candidate + try: + from huggingface_hub import snapshot_download # type: ignore + + return Path(snapshot_download(repo_id=repo_or_path, local_files_only=True)) + except Exception: + return None + + +def _missing_ltx2_text_components(root: Path) -> list[str]: + missing: list[str] = [] + checks = { + "text_encoder": ( + root / "text_encoder" / "config.json", + root / "text_encoder" / "model.safetensors.index.json", + ), + "tokenizer": ( + root / "tokenizer" / "tokenizer.json", + root / "tokenizer" / "tokenizer.model", + ), + } + for component, required_paths in checks.items(): + if not (root / component).is_dir(): + missing.append(component) + continue + if not all(path.exists() for path in required_paths): + missing.append(component) + return missing + + +def _resolve_ltx2_text_component_source(repo: str) -> Path: + for candidate_repo in tuple(dict.fromkeys((repo, *_LTX2_SHARED_TEXT_ENCODER_CANDIDATES))): + snapshot = _resolve_local_snapshot(candidate_repo) + if snapshot is not None and not _missing_ltx2_text_components(snapshot): + return snapshot + checked = ", ".join(_LTX2_SHARED_TEXT_ENCODER_CANDIDATES) + raise RuntimeError( + "LTX-2.3 MLX generation needs shared text_encoder and tokenizer " + f"components, but none were found locally. Download {checked} or " + "resume this model download, then try again." + ) + + +def _prepare_ltx2_model_path(repo: str, workspace: Path) -> Path: + model_path = _resolve_local_snapshot(repo) + if model_path is None: + raise RuntimeError( + f"LTX-2 MLX model snapshot is not available locally for {repo}. " + "Download the model before generating." 
+ ) + + missing = _missing_ltx2_text_components(model_path) + if not missing: + return model_path + + text_source = _resolve_ltx2_text_component_source(repo) + overlay = workspace / "model-overlay" + shutil.rmtree(overlay, ignore_errors=True) + overlay.mkdir(parents=True, exist_ok=True) + + missing_set = set(missing) + for entry in model_path.iterdir(): + if entry.name in missing_set: + continue + (overlay / entry.name).symlink_to(entry, target_is_directory=entry.is_dir()) + for component in _LTX2_TEXT_COMPONENTS: + target = overlay / component + if target.exists() or target.is_symlink(): + if target.is_dir() and not target.is_symlink(): + shutil.rmtree(target) + else: + target.unlink() + source = text_source / component + target.symlink_to(source, target_is_directory=True) + return overlay + + class _ProgressSink(Protocol): def __call__(self, phase: str, message: str, fraction: float) -> None: ... @@ -409,12 +494,15 @@ def _build_cmd( entry = _resolve_entry_point(config.repo) python = _resolve_video_python() pipeline_flag = _resolve_pipeline_flag(config.repo) + model_repo_arg = config.repo + if resolve_aux_files and "ltx-2.3" in config.repo.lower(): + model_repo_arg = str(_prepare_ltx2_model_path(config.repo, output_path.parent)) cmd = [ python, "-m", entry, "--model-repo", - config.repo, + model_repo_arg, "--pipeline", pipeline_flag, "--prompt", diff --git a/backend_service/models/__init__.py b/backend_service/models/__init__.py index fe70463..a47fe80 100644 --- a/backend_service/models/__init__.py +++ b/backend_service/models/__init__.py @@ -195,6 +195,7 @@ class DeleteModelRequest(BaseModel): class DownloadModelRequest(BaseModel): repo: str = Field(min_length=3, max_length=256) + modelId: str | None = Field(default=None, min_length=1, max_length=256) class ImageGenerationRequest(BaseModel): diff --git a/backend_service/plugins/__init__.py b/backend_service/plugins/__init__.py index f218910..7d8f56d 100644 --- a/backend_service/plugins/__init__.py +++ b/backend_service/plugins/__init__.py @@ -9,6 +9,7 @@ from dataclasses import dataclass, field from enum import Enum from pathlib import Path +from threading import RLock from typing import Any import importlib import json @@ -38,28 +39,43 @@ class BasePlugin(ABC): def manifest(self) -> PluginManifest: ... 
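+# Builtins are registered lazily on first registry access (``ensure_builtins``),
+# so importing this module no longer eagerly imports every strategy and tool.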
class PluginRegistry: - def __init__(self): + def __init__(self, *, auto_register_builtins: bool = False): self._plugins: dict[str, tuple[PluginManifest, Any]] = {} + self._auto_register_builtins = auto_register_builtins + self._builtins_registered = False + self._lock = RLock() def register(self, manifest: PluginManifest, instance: Any = None): self._plugins[manifest.id] = (manifest, instance) + def ensure_builtins(self) -> None: + if not self._auto_register_builtins or self._builtins_registered: + return + with self._lock: + if not self._builtins_registered: + self.register_builtins() + def get(self, plugin_id: str) -> tuple[PluginManifest, Any] | None: + self.ensure_builtins() return self._plugins.get(plugin_id) def list_all(self) -> list[PluginManifest]: + self.ensure_builtins() return [m for m, _ in self._plugins.values()] def list_by_type(self, plugin_type: PluginType) -> list[tuple[PluginManifest, Any]]: + self.ensure_builtins() return [(m, i) for m, i in self._plugins.values() if m.plugin_type == plugin_type] def enable(self, plugin_id: str) -> bool: + self.ensure_builtins() if plugin_id in self._plugins: self._plugins[plugin_id][0].enabled = True return True return False def disable(self, plugin_id: str) -> bool: + self.ensure_builtins() if plugin_id in self._plugins: self._plugins[plugin_id][0].enabled = False return True @@ -89,7 +105,7 @@ def register_builtins(self): """Register all built-in components as plugins.""" # Cache strategies from cache_compression import registry as cache_registry - for strategy in cache_registry._strategies.values(): + for strategy in cache_registry.strategies(): manifest = PluginManifest( id=f"cache.{strategy.strategy_id}", name=strategy.name, @@ -110,7 +126,7 @@ def register_builtins(self): description=tool.description, ) self.register(manifest, tool) + self._builtins_registered = True # Module singleton -plugin_registry = PluginRegistry() -plugin_registry.register_builtins() +plugin_registry = PluginRegistry(auto_register_builtins=True) diff --git a/backend_service/routes/cache.py b/backend_service/routes/cache.py index 418b20e..1edd5ed 100644 --- a/backend_service/routes/cache.py +++ b/backend_service/routes/cache.py @@ -2,7 +2,7 @@ from typing import Any -from fastapi import APIRouter, Query +from fastapi import APIRouter, Query, Request from backend_service.app import _build_system_snapshot, compute_cache_preview @@ -11,6 +11,7 @@ @router.get("/api/cache/preview") def cache_preview( + request: Request, bits: int = Query(3, ge=0, le=8), fp16_layers: int = Query(4, ge=0, le=16), num_layers: int = Query(32, ge=1, le=160), @@ -21,7 +22,7 @@ def cache_preview( params_b: float = Query(7.0, ge=0.5, le=1000.0), strategy: str = Query("native"), ) -> dict[str, Any]: - system_stats = _build_system_snapshot() + system_stats = _build_system_snapshot(capabilities=request.app.state.chaosengine.runtime.capabilities) return compute_cache_preview( bits=bits, fp16_layers=fp16_layers, diff --git a/backend_service/routes/health.py b/backend_service/routes/health.py index 8ddf97e..8d40109 100644 --- a/backend_service/routes/health.py +++ b/backend_service/routes/health.py @@ -15,18 +15,16 @@ def health(request: Request) -> dict[str, Any]: state = request.app.state.chaosengine from backend_service.app import WORKSPACE_ROOT, app_version - runtime_status = state.runtime.status( - active_requests=state.active_requests, - requests_served=state.requests_served, - ) + capabilities = state.runtime.capabilities + loaded_model = state.runtime.loaded_model return { "status": 
"ok", "workspaceRoot": str(WORKSPACE_ROOT), - "runtime": _runtime_label(), + "runtime": _runtime_label(capabilities.to_dict()), "appVersion": app_version, - "engine": runtime_status["engine"], - "loadedModel": runtime_status["loadedModel"], - "nativeBackends": runtime_status["nativeBackends"], + "engine": state.runtime.engine.engine_name, + "loadedModel": loaded_model.to_dict() if loaded_model is not None else None, + "nativeBackends": capabilities.to_dict(), } diff --git a/backend_service/routes/images.py b/backend_service/routes/images.py index 9a741c5..7f81689 100644 --- a/backend_service/routes/images.py +++ b/backend_service/routes/images.py @@ -25,11 +25,53 @@ _find_image_output, _delete_image_output, ) -from backend_service.progress import GenerationCancelled, IMAGE_PROGRESS +from backend_service.progress import GenerationCancelled, IMAGE_PROGRESS, VIDEO_PROGRESS router = APIRouter() +def _unload_idle_video_runtime_for_image(request: Request, action: str) -> None: + """Free resident video diffusion weights before image work starts. + + Image and video pipelines live in separate managers, so loading an image + model no longer implicitly releases a previously-loaded video model. That + can leave tens of GB resident across Studio switches. If video generation + is actively running, fail fast instead of blocking the image request behind + a long render. + """ + state = request.app.state.chaosengine + if VIDEO_PROGRESS.snapshot().get("active"): + raise HTTPException( + status_code=409, + detail=( + "A video generation is still running. Wait for it to finish or cancel it " + "before loading an image model." + ), + ) + try: + runtime = state.video_runtime.capabilities() + except Exception: + return + loaded_repo = str(runtime.get("loadedModelRepo") or "") + if not loaded_repo: + return + try: + state.video_runtime.unload() + except Exception as exc: + state.add_log( + "images", + "warning", + f"Could not unload video model before {action}: {type(exc).__name__}: {exc}", + ) + return + state.add_log( + "images", + "info", + f"Unloaded video model {loaded_repo} before {action} to free memory.", + ) + state.add_activity("Video model unloaded", f"Freed memory for {action}") + + @router.get("/api/images/catalog") def image_catalog(request: Request) -> dict[str, Any]: state = request.app.state.chaosengine @@ -89,6 +131,7 @@ def preload_image_model(request: Request, body: ImageRuntimePreloadRequest) -> d validation_error = _image_download_validation_error(variant["repo"]) detail = validation_error or f"{variant['name']} is not installed locally yet." raise HTTPException(status_code=409, detail=detail) + _unload_idle_video_runtime_for_image(request, "image preload") try: runtime = state.image_runtime.preload(variant["repo"]) except RuntimeError as exc: @@ -185,6 +228,7 @@ def generate_image(request: Request, body: ImageGenerationRequest) -> dict[str, state.add_log("images", "error", f"Image model not found in catalog or tracked seeds: '{body.modelId}'") raise HTTPException(status_code=404, detail=f"Unknown image model '{body.modelId}'. 
The model isn't in the curated catalog or tracked seeds.") state.add_log("images", "info", f"Resolved variant: {variant.get('name')} (repo={variant.get('repo')})") + _unload_idle_video_runtime_for_image(request, "image generation") try: artifacts, runtime = _generate_image_artifacts(body, variant, state.image_runtime) except GenerationCancelled: diff --git a/backend_service/routes/setup.py b/backend_service/routes/setup.py index 413e333..dcdfd92 100644 --- a/backend_service/routes/setup.py +++ b/backend_service/routes/setup.py @@ -1,5 +1,6 @@ from __future__ import annotations +import importlib import os import platform import shutil @@ -210,6 +211,8 @@ def install_pip_package(request: Request, body: InstallPackageRequest) -> dict[s f"{', '.join(unique)}" ).strip() + importlib.invalidate_caches() + # Re-probe capabilities after install state.runtime.refresh_capabilities(force=True) caps = state.runtime.capabilities.to_dict() diff --git a/backend_service/routes/video.py b/backend_service/routes/video.py index 54485ec..c11a977 100644 --- a/backend_service/routes/video.py +++ b/backend_service/routes/video.py @@ -13,13 +13,17 @@ from fastapi.responses import FileResponse from backend_service.helpers.video import ( + _VIDEO_MLX_TEXT_ENCODER_ALLOW_PATTERNS, _find_video_variant, _find_video_variant_by_repo, + _is_video_download_repo, _is_video_repo, _video_download_repo_ids, _video_download_validation_error, _video_model_payloads, + _video_variant_missing_text_encoder_repo, _video_variant_available_locally, + _video_variant_validation_error, ) from backend_service.models import ( DownloadModelRequest, @@ -27,12 +31,47 @@ VideoRuntimePreloadRequest, VideoRuntimeUnloadRequest, ) -from backend_service.progress import GenerationCancelled, VIDEO_PROGRESS +from backend_service.progress import GenerationCancelled, IMAGE_PROGRESS, VIDEO_PROGRESS router = APIRouter() +def _unload_idle_image_runtime_for_video(request: Request, action: str) -> None: + """Free resident image diffusion weights before video work starts.""" + state = request.app.state.chaosengine + if IMAGE_PROGRESS.snapshot().get("active"): + raise HTTPException( + status_code=409, + detail=( + "An image generation is still running. Wait for it to finish or cancel it " + "before loading a video model." + ), + ) + try: + runtime = state.image_runtime.capabilities() + except Exception: + return + loaded_repo = str(runtime.get("loadedModelRepo") or "") + if not loaded_repo: + return + try: + state.image_runtime.unload() + except Exception as exc: + state.add_log( + "video", + "warning", + f"Could not unload image model before {action}: {type(exc).__name__}: {exc}", + ) + return + state.add_log( + "video", + "info", + f"Unloaded image model {loaded_repo} before {action} to free memory.", + ) + state.add_activity("Image model unloaded", f"Freed memory for {action}") + + @router.get("/api/video/catalog") def video_catalog(request: Request) -> dict[str, Any]: """Return the curated catalog of video generation models.""" @@ -114,10 +153,11 @@ def preload_video_model(request: Request, body: VideoRuntimePreloadRequest) -> d raise HTTPException(status_code=404, detail=f"Unknown video model '{body.modelId}'.") if not _video_variant_available_locally(variant): - validation_error = _video_download_validation_error(variant["repo"]) + validation_error = _video_variant_validation_error(variant) detail = validation_error or f"{variant['name']} is not installed locally yet." 
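+        # 409 rather than 404: the model is known to the catalog, it just
+        # is not fully present on disk yet.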
raise HTTPException(status_code=409, detail=detail) + _unload_idle_image_runtime_for_video(request, "video preload") try: runtime = state.video_runtime.preload(variant["repo"]) except RuntimeError as exc: @@ -257,10 +297,11 @@ def generate_video(request: Request, body: VideoGenerationRequest) -> dict[str, ) if not _video_variant_available_locally(variant): - validation_error = _video_download_validation_error(variant["repo"]) + validation_error = _video_variant_validation_error(variant) detail = validation_error or f"{variant['name']} is not installed locally yet." raise HTTPException(status_code=409, detail=detail) + _unload_idle_image_runtime_for_video(request, "video generation") try: artifact, runtime = _generate_video_artifact(body, variant, state.video_runtime) except GenerationCancelled: @@ -305,12 +346,47 @@ def download_video_model(request: Request, body: DownloadModelRequest) -> dict[s at an arbitrary model via the API. """ state = request.app.state.chaosengine + variant = _find_video_variant(body.modelId) if body.modelId else None + if body.modelId and variant is None: + raise HTTPException(status_code=404, detail=f"Unknown video model '{body.modelId}'.") + if variant is not None and variant.get("ggufFile"): + base_error = _video_download_validation_error(str(variant["repo"])) + if base_error: + label = variant["name"] + state.add_log("video", "info", f"Video download requested: {label} base ({variant['repo']})") + return {"download": state.start_download(str(variant["repo"]))} + gguf_repo = str(variant.get("ggufRepo") or "") + gguf_file = str(variant.get("ggufFile") or "") + if not gguf_repo or not gguf_file: + raise HTTPException(status_code=400, detail=f"GGUF metadata is incomplete for {variant['name']}.") + state.add_log("video", "info", f"Video download requested: {variant['name']} GGUF ({gguf_repo}/{gguf_file})") + return { + "download": state.start_download( + gguf_repo, + allow_patterns=[gguf_file, "*.md", "LICENSE*"], + ) + } + + if variant is not None: + text_encoder_repo = _video_variant_missing_text_encoder_repo(variant) + if text_encoder_repo: + state.add_log( + "video", + "info", + f"Video download requested: {variant['name']} shared text encoder ({text_encoder_repo})", + ) + return { + "download": state.start_download( + text_encoder_repo, + allow_patterns=list(_VIDEO_MLX_TEXT_ENCODER_ALLOW_PATTERNS), + ) + } + if not _is_video_repo(body.repo): raise HTTPException( status_code=404, detail=f"Repo '{body.repo}' is not in the curated video model catalog.", ) - variant = _find_video_variant_by_repo(body.repo) label = variant["name"] if variant else body.repo state.add_log("video", "info", f"Video download requested: {label} ({body.repo})") return {"download": state.start_download(body.repo)} @@ -332,7 +408,7 @@ def video_download_status(request: Request) -> dict[str, Any]: @router.post("/api/video/download/cancel") def cancel_video_download(request: Request, body: DownloadModelRequest) -> dict[str, Any]: state = request.app.state.chaosengine - if not _is_video_repo(body.repo): + if not _is_video_download_repo(body.repo): raise HTTPException( status_code=404, detail=f"Repo '{body.repo}' is not in the curated video model catalog.", @@ -343,7 +419,7 @@ def cancel_video_download(request: Request, body: DownloadModelRequest) -> dict[ @router.post("/api/video/download/delete") def delete_video_download(request: Request, body: DownloadModelRequest) -> dict[str, Any]: state = request.app.state.chaosengine - if not _is_video_repo(body.repo): + if not 
_is_video_download_repo(body.repo): raise HTTPException( status_code=404, detail=f"Repo '{body.repo}' is not in the curated video model catalog.", diff --git a/backend_service/state.py b/backend_service/state.py index 63582f9..67fcfa9 100644 --- a/backend_service/state.py +++ b/backend_service/state.py @@ -18,7 +18,6 @@ from fastapi import HTTPException from starlette.responses import StreamingResponse -from cache_compression import registry as cache_registry from backend_service.catalog import CATALOG from backend_service.inference import RuntimeController @@ -170,6 +169,7 @@ def __init__( benchmarks_path: Path | None = None, chat_sessions_path: Path | None = None, library_cache_path: Path | None = None, + background_capability_probe: bool = False, ) -> None: # Defer imports of module-level constants to avoid circular imports from backend_service.app import ( @@ -210,7 +210,7 @@ def __init__( self._library_scan_done.set() else: self._library_scan_done.set() - self.runtime = RuntimeController() + self.runtime = RuntimeController(background_probe=background_capability_probe) self._image_runtime: "ImageRuntimeManager | None" = None self._video_runtime: "VideoRuntimeManager | None" = None self._chat_sessions_path = chat_sessions_path if chat_sessions_path is not None else CHAT_SESSIONS_PATH @@ -419,10 +419,16 @@ def _settings_payload(self, library: list[dict[str, Any]]) -> dict[str, Any]: "hfCachePath": str(self.settings.get("hfCachePath") or ""), } + def _system_snapshot(self) -> dict[str, Any]: + try: + return self._system_snapshot_provider(capabilities=self.runtime.capabilities) + except TypeError: + return self._system_snapshot_provider() + def _bootstrap(self) -> None: from backend_service.app import app_version - system = self._system_snapshot_provider() + system = self._system_snapshot() recommendation = _best_fit_recommendation(system) self.add_log("chaosengine", "info", f"Workspace booted in {system['backendLabel']} mode.") self.add_log("chaosengine", "info", f"ChaosEngine v{app_version} detected.") @@ -494,6 +500,8 @@ def _native_cache_label() -> str: return "Native f16 cache" def _cache_label(self, *, cache_strategy: str, bits: int, fp16_layers: int) -> str: + from cache_compression import registry as cache_registry + strategy = cache_registry.get(cache_strategy) if strategy is not None: return strategy.label(bits, fp16_layers) @@ -853,6 +861,40 @@ def _default_session_model(self) -> dict[str, Any]: "treeBudget": model_info.treeBudget, } + # No model is currently loaded. Prefer a model the user actually has + # downloaded over a catalog default — surfacing a catalog-only entry + # (e.g. nvidia/NVIDIA-Nemotron-3-Nano-4B-GGUF) just produces a + # confusing "Failed to load … isn't downloaded on this machine" + # error when the user clicks Load. 
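+        # The first healthy text-capable entry wins; image/video entries and
+        # entries flagged ``broken`` are skipped.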
+ for entry in self._library(): + entry_type = entry.get("modelType") + if entry_type and entry_type != "text": + continue + if entry.get("broken"): + continue + return { + "model": entry["name"], + "modelRef": entry["name"], + "canonicalRepo": entry.get("canonicalRepo") or entry.get("repo"), + "modelSource": "library", + "modelPath": entry["path"], + "modelBackend": entry.get("backend", "auto"), + "cacheLabel": self._cache_label( + cache_strategy=str(launch_preferences["cacheStrategy"]), + bits=int(launch_preferences["cacheBits"]), + fp16_layers=int(launch_preferences["fp16Layers"]), + ), + "cacheStrategy": launch_preferences["cacheStrategy"], + "cacheBits": launch_preferences["cacheBits"], + "fp16Layers": launch_preferences["fp16Layers"], + "fusedAttention": launch_preferences["fusedAttention"], + "fitModelInMemory": launch_preferences["fitModelInMemory"], + "contextTokens": launch_preferences["contextTokens"], + "speculativeDecoding": launch_preferences.get("speculativeDecoding", False), + "dflashDraftModel": None, + "treeBudget": launch_preferences.get("treeBudget", 0), + } + default_variant = _default_chat_variant() return { "model": default_variant["name"], @@ -1087,6 +1129,7 @@ def update_settings(self, request: UpdateSettingsRequest) -> dict[str, Any]: next_settings["remoteProviders"] = normalized if request.huggingFaceToken is not None: + previous_token_value = str(next_settings.get("huggingFaceToken") or "") token_value = request.huggingFaceToken.strip() next_settings["huggingFaceToken"] = token_value if token_value: @@ -1095,6 +1138,12 @@ def update_settings(self, request: UpdateSettingsRequest) -> dict[str, Any]: else: os.environ.pop("HF_TOKEN", None) os.environ.pop("HUGGING_FACE_HUB_TOKEN", None) + if token_value != previous_token_value: + from backend_service.helpers.huggingface import _clear_huggingface_caches + from backend_service.helpers.images import _clear_image_discover_caches + + _clear_huggingface_caches() + _clear_image_discover_caches() # Output directory overrides. Empty string clears the override. # Anything non-empty must be absolute or ~-relative — same rule as @@ -1199,7 +1248,7 @@ def _conversion_details( fp16_layers=launch_preferences["fp16Layers"], context_tokens=launch_preferences["contextTokens"], params_b=params_b, - system_stats=self._system_snapshot_provider(), + system_stats=self._system_snapshot(), ) if params_b is not None else None @@ -1307,7 +1356,7 @@ def run_benchmark(self, request: BenchmarkRunRequest) -> dict[str, Any]: fp16_layers=request.fp16Layers, context_tokens=request.contextTokens, params_b=params_b, - system_stats=self._system_snapshot_provider(), + system_stats=self._system_snapshot(), ) use_compressed = request.cacheBits > 0 cache_gb = preview["optimizedCacheGb"] if use_compressed else preview["baselineCacheGb"] @@ -2428,7 +2477,7 @@ def _sse_stream(): headers={"Cache-Control": "no-cache", "Connection": "keep-alive", "X-Accel-Buffering": "no"}, ) - def start_download(self, repo: str) -> dict[str, Any]: + def start_download(self, repo: str, allow_patterns: list[str] | None = None) -> dict[str, Any]: from backend_service.helpers.huggingface import ( _friendly_hf_download_error, _hf_repo_downloaded_bytes, @@ -2535,7 +2584,7 @@ def _progress_worker() -> None: # allowlist so we skip legacy single-file checkpoints the # pipelines never load. Both helpers return None for repos # outside their catalog, so only one ever applies. 
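+        # An explicit ``allow_patterns`` argument (used by the GGUF and
+        # shared text-encoder download paths in routes/video.py) takes
+        # precedence over the catalog-derived allowlists below.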
- allow_patterns = ( + effective_allow_patterns = allow_patterns or ( _video_repo_allow_patterns(repo) or _image_repo_allow_patterns(repo) ) @@ -2543,7 +2592,7 @@ def _progress_worker() -> None: repo, env, process_log, - allow_patterns=allow_patterns, + allow_patterns=effective_allow_patterns, ) with self._lock: if self._download_tokens.get(repo) == download_token: @@ -2869,7 +2918,7 @@ def server_status(self) -> dict[str, Any]: def workspace(self) -> dict[str, Any]: from backend_service.app import compute_cache_preview - system_stats = self._system_snapshot_provider() + system_stats = self._system_snapshot() try: loaded_name = self.runtime.loaded_model.name if self.runtime.loaded_model else None loaded_engine = self.runtime.engine.engine_name if self.runtime.engine else None diff --git a/backend_service/video_runtime.py b/backend_service/video_runtime.py index e7426ce..f301294 100644 --- a/backend_service/video_runtime.py +++ b/backend_service/video_runtime.py @@ -32,7 +32,6 @@ from backend_service.helpers.gpu import nvidia_gpu_present from backend_service.image_runtime import validate_local_diffusers_snapshot -from cache_compression import apply_diffusion_cache_strategy from backend_service.progress import ( GenerationCancelled, PHASE_DECODING, @@ -540,15 +539,15 @@ def _enhance_prompt(repo: str, prompt: str) -> tuple[str, str | None]: # pressure. Numbers come from the catalog ``sizeGb`` estimates for the # stock variants; GGUF Q4/Q6/Q8 variants override at the call site. _VIDEO_MODEL_FOOTPRINT_BF16_GB: dict[str, float] = { - "Lightricks/LTX-Video": 14.0, + "Lightricks/LTX-Video": 10.0, "Wan-AI/Wan2.1-T2V-1.3B-Diffusers": 9.0, "Wan-AI/Wan2.1-T2V-14B-Diffusers": 28.0, "Wan-AI/Wan2.2-TI2V-5B-Diffusers": 11.0, "Wan-AI/Wan2.2-T2V-A14B-Diffusers": 28.0, "hunyuanvideo-community/HunyuanVideo": 26.0, - "genmo/mochi-1-preview": 20.0, - "THUDM/CogVideoX-2b": 10.0, - "THUDM/CogVideoX-5b": 18.0, + "genmo/mochi-1-preview": 22.0, + "THUDM/CogVideoX-2b": 19.0, + "THUDM/CogVideoX-5b": 33.0, } # GGUF quant level → multiplier vs the bf16 footprint. Keys are matched as @@ -985,6 +984,8 @@ def generate(self, config: VideoGenerationConfig) -> GeneratedVideo: # ~1.3–2× on Wan). NotImplementedError is swallowed by the # helper when the pipeline class has no vendored patch yet; # see FU-007 in CLAUDE.md. + from cache_compression import apply_diffusion_cache_strategy + apply_diffusion_cache_strategy( pipeline, strategy_id=config.cacheStrategy, @@ -1527,6 +1528,11 @@ def _ensure_pipeline( pipeline_kwargs["transformer"] = quantized_transformer if gguf_note: VIDEO_PROGRESS.set_phase(PHASE_LOADING, message=gguf_note) + if quantized_transformer is None: + raise RuntimeError( + gguf_note + or f"Could not load requested GGUF transformer {gguf_file}." + ) elif use_nf4: VIDEO_PROGRESS.set_phase( PHASE_LOADING, @@ -1635,9 +1641,10 @@ def _try_load_gguf_transformer( Mirrors the image-side loader: GGUF weights cover the DiT only; VAE and text encoders are loaded from the base ``repo`` snapshot. - All failure modes are non-fatal — a missing ``gguf`` package, an - old diffusers without ``GGUFQuantizationConfig``, or an HF cache - miss falls back to the standard fp16 / bf16 transformer path. + The helper itself only reports ``(None, note)`` on failure so tests + can exercise each missing-dependency path. ``_ensure_pipeline`` treats + a requested GGUF variant as strict and raises with that note rather + than silently loading the full fp16 / bf16 transformer. 
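+
+    Example: a missing ``gguf`` package makes this return ``(None, note)``;
+    ``_ensure_pipeline`` then raises ``RuntimeError(note)`` instead of
+    quietly building the pipeline with the bf16 transformer.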
""" if importlib.util.find_spec("gguf") is None: return None, ( diff --git a/cache_compression/__init__.py b/cache_compression/__init__.py index ad3cb81..1bcfa2c 100644 --- a/cache_compression/__init__.py +++ b/cache_compression/__init__.py @@ -10,6 +10,7 @@ from abc import ABC, abstractmethod import importlib import platform +from threading import RLock from typing import Any @@ -147,18 +148,27 @@ class CacheStrategyRegistry: def __init__(self) -> None: self._strategies: dict[str, CacheStrategy] = {} + self._discovered = False + self._lock = RLock() def register(self, strategy: CacheStrategy) -> None: self._strategies[strategy.strategy_id] = strategy def get(self, strategy_id: str) -> CacheStrategy | None: + self._ensure_discovered() return self._strategies.get(strategy_id) def default(self) -> CacheStrategy: + self._ensure_discovered() return self._strategies["native"] + def strategies(self) -> list[CacheStrategy]: + self._ensure_discovered() + return list(self._strategies.values()) + def available(self) -> list[dict[str, Any]]: """Return a JSON-friendly list for the frontend.""" + self._ensure_discovered() out: list[dict[str, Any]] = [] for s in self._strategies.values(): out.append({ @@ -176,11 +186,19 @@ def available(self) -> list[dict[str, Any]]: }) return out + def _ensure_discovered(self) -> None: + if self._discovered: + return + with self._lock: + if not self._discovered: + self.discover() + def discover(self) -> list[CacheStrategy]: """Import all known adapter modules and return available strategies.""" - self._strategies = {} + with self._lock: + self._strategies = {} - strategy_specs = [ + strategy_specs = [ { "id": "native", "name": "Native f16", @@ -248,31 +266,32 @@ def discover(self) -> list[CacheStrategy]: "supports_fp16_layers": False, "required_llama_binary": "standard", }, - ] - - for spec in strategy_specs: - try: - module = importlib.import_module(spec["module"]) - cls = getattr(module, spec["class_name"]) - instance = cls() - except Exception as exc: - if spec["id"] == "native": - raise - instance = _BrokenStrategy( - strategy_id=str(spec["id"]), - name=str(spec["name"]), - bit_range=spec["bit_range"], - default_bits=spec["default_bits"], - supports_fp16_layers=bool(spec["supports_fp16_layers"]), - required_llama_binary=str(spec.get("required_llama_binary", "standard")), - reason=( - f"{spec['name']} could not be loaded in this runtime. " - f"ChaosEngineAI kept the card visible so the UI does not silently collapse to Native f16 only. " - f"Import error: {exc}" - ), - ) - self.register(instance) - return list(self._strategies.values()) + ] + + for spec in strategy_specs: + try: + module = importlib.import_module(spec["module"]) + cls = getattr(module, spec["class_name"]) + instance = cls() + except Exception as exc: + if spec["id"] == "native": + raise + instance = _BrokenStrategy( + strategy_id=str(spec["id"]), + name=str(spec["name"]), + bit_range=spec["bit_range"], + default_bits=spec["default_bits"], + supports_fp16_layers=bool(spec["supports_fp16_layers"]), + required_llama_binary=str(spec.get("required_llama_binary", "standard")), + reason=( + f"{spec['name']} could not be loaded in this runtime. " + f"ChaosEngineAI kept the card visible so the UI does not silently collapse to Native f16 only. 
" + f"Import error: {exc}" + ), + ) + self.register(instance) + self._discovered = True + return list(self._strategies.values()) class _BrokenStrategy(CacheStrategy): @@ -330,7 +349,6 @@ def required_llama_binary(self) -> str: # Module-level singleton — import and use ``registry`` directly. registry = CacheStrategyRegistry() -registry.discover() def apply_diffusion_cache_strategy( diff --git a/cache_compression/chaosengine.py b/cache_compression/chaosengine.py index e088dfe..c8d9000 100644 --- a/cache_compression/chaosengine.py +++ b/cache_compression/chaosengine.py @@ -16,28 +16,16 @@ from __future__ import annotations -import importlib +import importlib.util from typing import Any from cache_compression import CacheStrategy -def _load_chaosengine() -> Any | None: - try: - return importlib.import_module("chaos_engine") - except ImportError: - return None - - def _chaosengine_available() -> bool: - mod = _load_chaosengine() - if mod is None: - return False - # Check for the core cache module try: - cache_mod = importlib.import_module("chaos_engine.cache") - return hasattr(cache_mod, "config") or True - except ImportError: + return importlib.util.find_spec("chaos_engine") is not None + except (ImportError, AttributeError, ValueError): return False diff --git a/cache_compression/triattention.py b/cache_compression/triattention.py index fe2d339..ef524ec 100644 --- a/cache_compression/triattention.py +++ b/cache_compression/triattention.py @@ -17,36 +17,23 @@ from __future__ import annotations +import importlib.util from typing import Any from cache_compression import CacheStrategy -_triattention = None -_vllm = None -_mlx_lm = None -try: - import triattention as _triattention # type: ignore[import-untyped] -except ImportError: - pass -try: - import vllm as _vllm # type: ignore[import-untyped] -except ImportError: - pass -try: - import mlx_lm as _mlx_lm # type: ignore[import-untyped] -except ImportError: - pass +def _module_available(module_name: str) -> bool: + try: + return importlib.util.find_spec(module_name) is not None + except (ImportError, AttributeError, ValueError): + return False def _has_mlx_entrypoint() -> bool: - if _triattention is None or _mlx_lm is None: - return False - try: - from triattention.mlx import apply_triattention_mlx # noqa: F401 - return True - except ImportError: - return False + # Keep availability checks side-effect free. Importing mlx_lm can touch + # MLX/Metal at module load and can abort in headless or sandboxed contexts. + return _module_available("triattention") and _module_available("mlx_lm") class TriAttentionStrategy(CacheStrategy): @@ -63,7 +50,7 @@ def has_mlx_backend(self) -> bool: return _has_mlx_entrypoint() def has_vllm_backend(self) -> bool: - return _triattention is not None and _vllm is not None + return _module_available("triattention") and _module_available("vllm") def is_available(self) -> bool: return self.has_mlx_backend() or self.has_vllm_backend() @@ -119,7 +106,7 @@ def apply_vllm_patches(self) -> None: Must be called BEFORE creating a ``vllm.LLM`` instance. 
""" - if _triattention is None: + if not _module_available("triattention"): raise RuntimeError("triattention is not installed.") try: from triattention.vllm.runtime.integration_monkeypatch import ( diff --git a/cache_compression/turboquant.py b/cache_compression/turboquant.py index 32797f4..52e8044 100644 --- a/cache_compression/turboquant.py +++ b/cache_compression/turboquant.py @@ -51,6 +51,22 @@ def _has_required_turboquant_mlx_hooks() -> bool: return all(any(hook in source for source in sources) for hook in _REQUIRED_HOOKS) +def _has_full_turboquant_mlx_package() -> bool: + if not _has_required_turboquant_mlx_hooks(): + return False + try: + module = importlib.import_module("turboquant_mlx") + except ImportError: + return False + checker = getattr(module, "_has_full_turboquant", None) + if not callable(checker): + return False + try: + return bool(checker()) + except Exception: + return False + + def _load_turboquant_mlx_hooks() -> tuple[Any | None, Any | None]: if not _has_required_turboquant_mlx_hooks(): return None, None @@ -72,10 +88,10 @@ def name(self) -> str: return "TurboQuant" def is_available(self) -> bool: - # Keep availability probing side-effect free. Some MLX packages touch - # Metal during import, so we only report ready when the expected hooks - # are present in the installed source tree. - return _has_required_turboquant_mlx_hooks() + # The in-tree adapter provides ChaosEngineAI's stable hooks, while + # turboquant-mlx-full provides the actual TurboQuantKVCache. Report + # "Ready" only when both are visible to the backend runtime. + return _has_full_turboquant_mlx_package() def availability_badge(self) -> str: return "Ready" if self.is_available() else "Experimental" @@ -86,6 +102,11 @@ def availability_tone(self) -> str: def availability_reason(self) -> str | None: if self.is_available(): return None + if not _has_required_turboquant_mlx_hooks(): + return ( + "ChaosEngineAI's TurboQuant MLX adapter is not available in " + "this runtime. Rebuild or update the app, then retry." + ) return ( "Install turboquant-mlx (arozanov fork; PyPI name " "``turboquant-mlx-full``) into ChaosEngineAI's backend runtime: " diff --git a/pyproject.toml b/pyproject.toml index 479aec4..6e93ee3 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -69,4 +69,4 @@ testpaths = ["tests"] addopts = "--tb=short -q" [tool.setuptools.packages.find] -include = ["backend_service*", "cache_compression*", "dflash*"] +include = ["backend_service*", "cache_compression*", "dflash*", "turboquant_mlx*"] diff --git a/scripts/stage-runtime.mjs b/scripts/stage-runtime.mjs index 714e63d..bded9c9 100644 --- a/scripts/stage-runtime.mjs +++ b/scripts/stage-runtime.mjs @@ -61,7 +61,7 @@ function main() { pruneBundledProjectArtifacts(); ensureDir(backendDest); - for (const relativePath of ["backend_service", "cache_compression"]) { + for (const relativePath of ["backend_service", "cache_compression", "turboquant_mlx"]) { copyTree(path.join(workspaceRoot, relativePath), path.join(backendDest, relativePath)); } for (const relativeFile of ["README.md", "pyproject.toml"]) { diff --git a/src-tauri/src/lib.rs b/src-tauri/src/lib.rs index a46edc2..4f29137 100644 --- a/src-tauri/src/lib.rs +++ b/src-tauri/src/lib.rs @@ -636,12 +636,15 @@ fn apply_embedded_runtime_env(command: &mut Command, runtime: &EmbeddedRuntime) .env("PYTHONNOUSERSITE", "1") .env("CHAOSENGINE_EMBEDDED_RUNTIME", "1"); - // Prepend the user-local extras dir to PYTHONPATH so packages installed - // at runtime (CUDA torch, diffusers, etc. 
via /api/setup/install-gpu-bundle)
-    // shadow anything in the bundled site-packages. The extras dir lives
-    // outside the ephemeral %TEMP% runtime extraction so it survives app
-    // updates — the installer re-extracts the bundled runtime from scratch
-    // on each launch, but never touches the extras tree.
+    // Insert the user-local extras dir after the app backend but before
+    // bundled site-packages. Runtime-installed packages (CUDA torch,
+    // diffusers, etc.) still shadow bundled third-party wheels, while
+    // app-owned adapter modules in backend/ keep priority over same-named
+    // upstream packages installed into extras.
+    //
+    // The extras dir lives outside the ephemeral %TEMP% runtime extraction
+    // so it survives app updates — the installer re-extracts the bundled
+    // runtime from scratch on each launch, but never touches the extras tree.
    // (CHAOSENGINE_EXTRAS_SITE_PACKAGES is already set by the caller so
    // the backend can target it for pip --target installs.)
    let extras_dir = chaosengine_extras_site_packages_for_python(
@@ -650,10 +653,13 @@
    )
    .filter(|path| path.is_dir());
    let mut python_path_entries: Vec<PathBuf> = Vec::with_capacity(runtime.python_path.len() + 1);
+    if let Some(first) = runtime.python_path.first() {
+        python_path_entries.push(first.clone());
+    }
    if let Some(extras) = extras_dir.as_ref() {
        python_path_entries.push(extras.clone());
    }
-    python_path_entries.extend(runtime.python_path.iter().cloned());
+    python_path_entries.extend(runtime.python_path.iter().skip(1).cloned());
    if let Some(python_path) = join_paths(&python_path_entries) {
        command.env("PYTHONPATH", python_path);
    }
diff --git a/src/App.tsx b/src/App.tsx
index 877691a..20c2555 100644
--- a/src/App.tsx
+++ b/src/App.tsx
@@ -1,4 +1,4 @@
-import { useEffect, useRef, useState } from "react";
+import { useEffect, useMemo, useRef, useState } from "react";
 import {
   checkBackend,
   convertModel,
@@ -67,6 +67,7 @@
   libraryItemBackend,
   libraryItemSourceKind,
   inferHfRepoFromLocalPath,
+  isChatLibraryItem,
   downloadProgressLabel,
   syncRuntime,
   settingsDraftFromWorkspace,
@@ -174,6 +175,7 @@
    systemPrompt, setSystemPrompt,
    serverModelKey, setServerModelKey,
    installingPackage,
+    installLogs,
    updateLaunchSetting,
    updateConversionDraft,
    handleAddDirectory,
@@ -230,17 +232,18 @@
  // ── Library state ──────────────────────────────────────────
  const [librarySearchInput, setLibrarySearchInput] = useState("");
-  const [selectedLibraryPath, setSelectedLibraryPath] = useState(workspace.library[0]?.path ?? "");
+  const [selectedLibraryPath, setSelectedLibraryPath] = useState(workspace.library.find(isChatLibraryItem)?.path ?? 
""); const [expandedLibraryPath, setExpandedLibraryPath] = useState(null); const [librarySortKey, setLibrarySortKey] = useState<"name" | "format" | "backend" | "size" | "ram" | "compressed" | "modified" | "context">("modified"); const [librarySortDir, setLibrarySortDir] = useState<"asc" | "desc">("desc"); const [libraryCapFilter, setLibraryCapFilter] = useState(null); const [libraryFormatFilter, setLibraryFormatFilter] = useState(null); const [libraryBackendFilter, setLibraryBackendFilter] = useState(null); + const chatLibrary = useMemo(() => workspace.library.filter(isChatLibraryItem), [workspace.library]); // Library search sync useEffect(() => { - const nextFilteredLibrary = workspace.library + const nextFilteredLibrary = chatLibrary .filter((item) => { const haystack = `${item.name} ${item.path} ${item.format} ${item.directoryLabel ?? ""}`.toLowerCase(); return haystack.includes(librarySearchInput.trim().toLowerCase()); @@ -253,10 +256,10 @@ export default function App() { setSelectedLibraryPath((current) => nextFilteredLibrary.some((item) => item.path === current) ? current : nextFilteredLibrary[0].path, ); - }, [workspace.library, librarySearchInput]); + }, [chatLibrary, librarySearchInput]); // Library rows - const libraryRows = workspace.library.map((item) => { + const libraryRows = chatLibrary.map((item) => { const matchedVariant = findCatalogVariantForLibraryItem(workspace.featuredModels, item); return { item, @@ -314,7 +317,6 @@ export default function App() { }; }); const filteredLibraryRows = [...libraryRows, ...syntheticDownloadRows] - .filter(({ item }) => item.modelType === "text" || (!item.modelType)) .filter(({ item, displayFormat, displayQuantization, displayBackend, sourceKind }) => { const haystack = `${item.name} ${item.path} ${displayFormat} ${displayQuantization ?? ""} ${displayBackend} ${sourceKind} ${item.directoryLabel ?? ""}`.toLowerCase(); return haystack.includes(librarySearchInput.trim().toLowerCase()); @@ -337,28 +339,11 @@ export default function App() { const selectedLibraryVariant = selectedLibraryRow?.matchedVariant ?? null; // ── Chat model options ───────────────────────────────────── - const catalogChatOptions: ChatModelOption[] = allFeaturedVariants - .filter((variant) => variant.launchMode === "direct") - .map((variant) => ({ - key: `catalog:${variant.id}`, - label: variant.name, - detail: `${variant.format} / ${variant.quantization}`, - group: "Catalog", - model: variant.name, - modelRef: variant.id, - canonicalRepo: variant.repo, - source: "catalog", - backend: variant.backend, - paramsB: variant.paramsB, - sizeGb: variant.sizeGb, - contextWindow: variant.contextWindow, - format: variant.format, - quantization: variant.quantization, - maxContext: variant.maxContext ?? null, - })); - - const libraryChatOptions: ChatModelOption[] = workspace.library - .filter((item) => (item.modelType === "text" || (!item.modelType)) && !item.broken) + // Only list models present in the local library — catalog-only entries + // would let the user pick a model that isn't downloaded yet, which then + // 500s on Load. Discover tab is the place to pull a new model. 
+ const libraryChatOptions: ChatModelOption[] = chatLibrary + .filter((item) => !item.broken) .map((item) => { const matched = findCatalogVariantForLibraryItem(workspace.featuredModels, item); const displayFormat = libraryItemFormat(item, matched); @@ -383,7 +368,7 @@ export default function App() { }; }); - const threadModelOptions = [...catalogChatOptions, ...libraryChatOptions]; + const threadModelOptions = libraryChatOptions; // ── Cache labels (needed early by useChat) ────────────────── const currentCacheLabel = launchSettings.cacheStrategy === "native" @@ -639,7 +624,7 @@ export default function App() { const previewSavings = Math.max(0, preview.baselineCacheGb - preview.optimizedCacheGb); const conversionReady = Boolean(nativeBackends?.converterAvailable ?? workspace.system.mlxLmAvailable); const enabledDirectoryCount = (workspace.settings?.modelDirectories ?? []).filter((directory) => directory.enabled).length; - const libraryTotalSizeGb = workspace.library.reduce((sum, item) => sum + item.sizeGb, 0); + const libraryTotalSizeGb = chatLibrary.reduce((sum, item) => sum + item.sizeGb, 0); const localVariantCount = allFeaturedVariants.filter((variant) => variant.availableLocally).length; const fileRevealLabel = workspace.system.platform === "Darwin" ? "Show in Finder" : @@ -664,11 +649,11 @@ export default function App() { if (!selectedServerOptionBase || selectedServerOptionBase.source !== "catalog") return selectedServerOptionBase; const variant = findVariantForReference(workspace.featuredModels, selectedServerOptionBase.modelRef, selectedServerOptionBase.model); if (!variant) return selectedServerOptionBase; - const localItem = findLibraryItemForVariant(workspace.library, variant); + const localItem = findLibraryItemForVariant(chatLibrary, variant); if (!localItem) return selectedServerOptionBase; return libraryChatOptions.find((option) => option.path === localItem.path) ?? selectedServerOptionBase; })(); - const convertibleLibrary = workspace.library.filter((item) => libraryItemFormat(item) !== "MLX"); + const convertibleLibrary = chatLibrary.filter((item) => libraryItemFormat(item) !== "MLX"); const conversionSource = convertibleLibrary.find((item) => item.path === conversionDraft.path) ?? null; const conversionVariant = (conversionSource ? findCatalogVariantForLibraryItem(workspace.featuredModels, conversionSource) : null) ?? @@ -777,12 +762,12 @@ export default function App() { if (!threadModelOptions.length) { setBenchmarkModelKey(""); return; } setBenchmarkModelKey((current) => { if (threadModelOptions.some((option) => option.key === current)) return current; - const firstHealthy = workspace.library.find((item) => !item.broken); + const firstHealthy = chatLibrary.find((item) => !item.broken); if (firstHealthy) return `library:${firstHealthy.path}`; - if (workspace.library.length > 0) return `library:${workspace.library[0].path}`; + if (chatLibrary.length > 0) return `library:${chatLibrary[0].path}`; return activeThreadOption?.key ?? loadedModelOption?.key ?? 
threadModelOptions[0].key; }); - }, [activeThreadOption?.key, loadedModelOption?.key, serverOptionKeySignature, workspace.library, setBenchmarkModelKey]); + }, [activeThreadOption?.key, chatLibrary, loadedModelOption?.key, serverOptionKeySignature, setBenchmarkModelKey]); // Sync benchmarkDraft model fields useEffect(() => { @@ -1022,7 +1007,7 @@ export default function App() { } function loadPayloadFromVariant(variant: ModelVariant, nextTab?: TabId) { - const localItem = findLibraryItemForVariant(workspace.library, variant); + const localItem = findLibraryItemForVariant(chatLibrary, variant); if (localItem) { return { modelRef: localItem.name, @@ -1050,7 +1035,7 @@ export default function App() { | "cacheStrategy" | "cacheBits" | "fp16Layers" | "fusedAttention" | "fitModelInMemory" | "contextTokens" | "speculativeDecoding" | "dflashDraftModel" | "treeBudget" > { - const localItem = findLibraryItemForVariant(workspace.library, variant); + const localItem = findLibraryItemForVariant(chatLibrary, variant); const modelRef = localItem?.name ?? variant.id; const modelName = localItem?.name ?? variant.name; const modelBackend = localItem ? libraryItemBackend(localItem, variant) : variant.backend; @@ -1124,7 +1109,7 @@ export default function App() { if (normalizedKey?.startsWith("catalog:")) { const modelRef = normalizedKey.slice("catalog:".length); const variant = findVariantForReference(workspace.featuredModels, modelRef, undefined); - const localItem = variant ? findLibraryItemForVariant(workspace.library, variant) : null; + const localItem = variant ? findLibraryItemForVariant(chatLibrary, variant) : null; if (localItem) normalizedKey = `library:${localItem.path}`; } // If no key given, or the key references a model no longer in the options @@ -1276,7 +1261,7 @@ export default function App() { expandedVariantId={expandedVariantId} onExpandedVariantIdChange={setExpandedVariantId} onDetailFamilyIdChange={setDetailFamilyId} - library={workspace.library} + library={chatLibrary} activeDownloads={activeDownloads} onDownloadModel={(repo) => void handleDownloadModel(repo)} onCancelModelDownload={(repo) => void handleCancelModelDownload(repo)} @@ -1491,7 +1476,7 @@ export default function App() { longLiveJob={videoState.longLiveJob} onActiveTabChange={setActiveTab} onOpenVideoStudio={videoState.openVideoStudio} - onVideoDownload={(repo) => void videoState.handleVideoDownload(repo)} + onVideoDownload={(repo, modelId) => void videoState.handleVideoDownload(repo, modelId)} onCancelVideoDownload={(repo) => void videoState.handleCancelVideoDownload(repo)} onDeleteVideoDownload={(repo) => void videoState.handleDeleteVideoDownload(repo)} onOpenExternalUrl={(url) => void handleOpenExternalUrl(url)} @@ -1513,7 +1498,7 @@ export default function App() { fileRevealLabel={fileRevealLabel} onActiveTabChange={setActiveTab} onOpenVideoStudio={videoState.openVideoStudio} - onVideoDownload={(repo) => void videoState.handleVideoDownload(repo)} + onVideoDownload={(repo, modelId) => void videoState.handleVideoDownload(repo, modelId)} onCancelVideoDownload={(repo) => void videoState.handleCancelVideoDownload(repo)} onDeleteVideoDownload={(repo) => void videoState.handleDeleteVideoDownload(repo)} onPreloadVideoModel={(variant) => void videoState.handlePreloadVideoModel(variant)} @@ -1573,7 +1558,7 @@ export default function App() { onActiveTabChange={setActiveTab} onPreloadVideoModel={(variant) => void videoState.handlePreloadVideoModel(variant)} onUnloadVideoModel={(variant) => void 
videoState.handleUnloadVideoModel(variant)} - onVideoDownload={(repo) => void videoState.handleVideoDownload(repo)} + onVideoDownload={(repo, modelId) => void videoState.handleVideoDownload(repo, modelId)} onGenerateVideo={() => void videoState.handleVideoGenerate()} onOpenExternalUrl={(url) => void handleOpenExternalUrl(url)} onRestartServer={() => void handleRestartServer()} @@ -1613,7 +1598,7 @@ export default function App() { convertibleLibrary={convertibleLibrary} nativeBackends={nativeBackends} preview={preview} - workspace={{ system: workspace.system, library: workspace.library }} + workspace={{ system: workspace.system, library: chatLibrary }} launchCacheLabel={launchCacheLabel} busy={busy} busyAction={busyAction} @@ -1730,7 +1715,7 @@ export default function App() { ) : null; @@ -1982,6 +1969,7 @@ export default function App() { availableCacheStrategies={workspace.system.availableCacheStrategies} dflashInfo={workspace.system.dflash} installingPackage={installingPackage} + installLogs={installLogs} turboInstalled={Boolean(workspace.system.llamaServerTurboPath)} onPendingLaunchChange={setPendingLaunch} onLaunchModelSearchChange={setLaunchModelSearch} @@ -2056,7 +2044,7 @@ export default function App() {
Variants ({family.variants.length}) {family.variants.map((variant) => { - const matchedLocal = findLibraryItemForVariant(workspace.library, variant); + const matchedLocal = findLibraryItemForVariant(chatLibrary, variant); const downloadState = activeDownloads[variant.repo]; const isDownloading = downloadState?.state === "downloading"; const isDownloadPaused = downloadState?.state === "cancelled"; diff --git a/src/api.ts b/src/api.ts index 1741f99..1881b06 100644 --- a/src/api.ts +++ b/src/api.ts @@ -678,8 +678,8 @@ export async function unloadImageModel(modelId?: string): Promise { -export async function downloadVideoModel(repo: string): Promise<DownloadStatus> { - const result = await postJson<{ download: DownloadStatus }>("/api/video/download", { repo }); +export async function downloadVideoModel(repo: string, modelId?: string): Promise<DownloadStatus> { + const result = await postJson<{ download: DownloadStatus }>("/api/video/download", { repo, modelId }); return result.download; } diff --git a/src/components/LatestImageDiscoverCard.tsx b/src/components/LatestImageDiscoverCard.tsx deleted file mode 100644 index 982e2c3..0000000 --- a/src/components/LatestImageDiscoverCard.tsx +++ /dev/null @@ -1,172 +0,0 @@ -import type { ImageModelVariant } from "../types"; -import type { DownloadStatus } from "../api"; -import { - imagePrimarySizeLabel, - imageSecondarySizeLabel, - formatImageLicenseLabel, - formatImageAccessError, - formatReleaseLabel, - isGatedImageAccessError, -} from "../utils/format"; -import { downloadProgressLabel, downloadSizeTooltip } from "../utils/downloads"; - -export interface LatestImageDiscoverCardProps { - variant: ImageModelVariant; - downloadState?: DownloadStatus; - fileRevealLabel?: string; - onDownload: (repo: string) => void; - onCancelDownload: (repo: string) => void; - onDeleteDownload: (repo: string) => void; - onOpenExternalUrl: (url: string) => void; - onNavigateSettings: () => void; - onRevealPath?: (path: string) => void; -} - -export function LatestImageDiscoverCard({ - variant, - downloadState, - fileRevealLabel, - onDownload, - onCancelDownload, - onDeleteDownload, - onOpenExternalUrl, - onNavigateSettings, - onRevealPath, -}: LatestImageDiscoverCardProps) { - const isDownloadPaused = downloadState?.state === "cancelled"; - const isDownloadComplete = downloadState?.state === "completed"; - const isDownloadFailed = downloadState?.state === "failed"; - const hasLocalData = Boolean(variant.hasLocalData || isDownloadComplete || isDownloadPaused || isDownloadFailed); - const friendlyDownloadError = formatImageAccessError(downloadState?.error, variant); - const needsGatedAccess = isGatedImageAccessError(downloadState?.error); - return ( -
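The widened download endpoint above threads an optional modelId through to the backend so multi-variant repos can route to a specific catalog entry. A minimal calling sketch, assuming only the DownloadStatus states that appear elsewhere in this diff (repo and modelId values are hypothetical):

async function startVideoDownload(): Promise<void> {
  // modelId is optional; omitting it preserves the old repo-only behaviour.
  const status = await downloadVideoModel("SomeOrg/some-video-model", "some-variant-id");
  // DownloadStatus.state values observed in this diff:
  // "downloading" | "cancelled" (paused) | "completed" | "failed"
  if (status.state === "failed") {
    console.error(status.error);
  }
}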
-
-
-
-

{variant.name}

- {variant.provider} - {!variant.availableLocally && isDownloadComplete ? Downloaded : null} - {isDownloadPaused ? Paused : null} - {isDownloadFailed ? Download Failed : null} -
-

{variant.note}

-
- {variant.updatedLabel ?? "Recently updated"} -
- -
- {imagePrimarySizeLabel(variant)} - {imageSecondarySizeLabel(variant) ? {imageSecondarySizeLabel(variant)} : null} - {variant.recommendedResolution} - {variant.pipelineTag ? {variant.pipelineTag} : null} -
- -
- {formatReleaseLabel(variant.releaseLabel, variant.releaseDate ?? variant.createdAt) ? ( - {formatReleaseLabel(variant.releaseLabel, variant.releaseDate ?? variant.createdAt)} - ) : null} - {variant.downloadsLabel ? {variant.downloadsLabel} : null} - {variant.likesLabel ? {variant.likesLabel} : null} - {variant.license ? {formatImageLicenseLabel(variant.license)} : null} - {typeof variant.gated === "boolean" ? {variant.gated ? "Gated access" : "Open access"} : null} -
- -
- {variant.taskSupport.map((task) => ( - {task} - ))} - {variant.styleTags.map((tag) => ( - {tag} - ))} -
- - {isDownloadFailed && downloadState?.error ? ( -
-

{friendlyDownloadError}

- {needsGatedAccess ? ( -
- - -
- ) : null} - {friendlyDownloadError !== downloadState.error ? ( -
- Technical details -

{downloadState.error}

-
- ) : null} -
- ) : null} - -
- {variant.availableLocally ? ( - Installed - ) : downloadState?.state === "downloading" ? ( - <> - {downloadProgressLabel(downloadState)} - - - - ) : isDownloadPaused ? ( - <> - {downloadProgressLabel(downloadState)} - - - - ) : isDownloadFailed ? ( - <> - - - - ) : isDownloadComplete ? ( - Download complete - ) : ( - <> - - {hasLocalData ? ( - - ) : null} - - )} - {variant.localPath && onRevealPath ? ( - - ) : null} - -
-
- ); -} diff --git a/src/components/LaunchModal.tsx b/src/components/LaunchModal.tsx index b89d5ab..ba0d7a5 100644 --- a/src/components/LaunchModal.tsx +++ b/src/components/LaunchModal.tsx @@ -1,5 +1,5 @@ import { ModelLaunchModal } from "./ModelLaunchModal"; -import type { LaunchPreferences, PreviewMetrics, SystemStats } from "../types"; +import type { LaunchPreferences, PreviewMetrics, StrategyInstallLog, SystemStats } from "../types"; import type { ChatModelOption } from "../types/chat"; export interface PendingLaunch { @@ -19,6 +19,7 @@ export interface LaunchModalProps { availableCacheStrategies: SystemStats["availableCacheStrategies"] | undefined; dflashInfo?: SystemStats["dflash"]; installingPackage: string | null; + installLogs?: Record; turboInstalled?: boolean; onPendingLaunchChange: (value: PendingLaunch | null | ((prev: PendingLaunch | null) => PendingLaunch | null)) => void; onLaunchModelSearchChange: (value: string) => void; @@ -39,6 +40,7 @@ export function LaunchModal({ availableCacheStrategies, dflashInfo, installingPackage, + installLogs, turboInstalled, onPendingLaunchChange, onLaunchModelSearchChange, @@ -76,6 +78,7 @@ export function LaunchModal({ availableCacheStrategies={availableCacheStrategies} dflashInfo={dflashInfo} installingPackage={installingPackage} + installLogs={installLogs} turboInstalled={turboInstalled} onSelectedKeyChange={setSelectedLaunchKey} onSearchChange={onLaunchModelSearchChange} diff --git a/src/components/ModelActionIcons.tsx b/src/components/ModelActionIcons.tsx new file mode 100644 index 0000000..7a2329e --- /dev/null +++ b/src/components/ModelActionIcons.tsx @@ -0,0 +1,256 @@ +import type { ButtonHTMLAttributes, ReactNode } from "react"; + +export type ActionIconName = + | "cancel" + | "chat" + | "convert" + | "delete" + | "download" + | "generate" + | "huggingFace" + | "install" + | "modelCard" + | "pause" + | "resume" + | "retry" + | "reveal" + | "server"; + +export type ModelStatusKind = + | "downloaded" + | "downloading" + | "failed" + | "incomplete" + | "installed" + | "loaded" + | "paused"; + +type IconProps = { + name: ActionIconName | ModelStatusKind; + className?: string; +}; + +function Svg({ children, className }: { children: ReactNode; className?: string }) { + return ( + + ); +} + +export function ModelActionIcon({ name, className }: IconProps) { + switch (name) { + case "cancel": + case "failed": + return ( + + + + + + ); + case "chat": + return ( + + + + + + ); + case "convert": + return ( + + + + + + + ); + case "delete": + return ( + + + + + + + + ); + case "download": + case "downloading": + return ( + + + + + + ); + case "generate": + return ( + + + + + + + ); + case "huggingFace": + return ( + + + + + + + + + + + + ); + case "install": + return ( + + + + + + ); + case "modelCard": + return ( + + + + + + + + + ); + case "pause": + case "paused": + return ( + + + + + + ); + case "resume": + return ( + + + + ); + case "retry": + return ( + + + + + ); + case "reveal": + return ( + + + + + + ); + case "server": + return ( + + + + + + + + + ); + case "downloaded": + case "installed": + return ( + + + + + ); + case "loaded": + return ( + + + + + ); + case "incomplete": + default: + return ( + + + + + ); + } +} + +type IconActionButtonProps = ButtonHTMLAttributes & { + icon: ActionIconName; + label: string; + buttonStyle?: "primary" | "secondary"; + danger?: boolean; +}; + +export function IconActionButton({ + icon, + label, + buttonStyle = "secondary", + danger = false, + className = "", + title, + type = "button", + ...props 
+}: IconActionButtonProps) { + return ( + + ); +} + +export function StatusIcon({ + status, + label, + detail, +}: { + status: ModelStatusKind; + label: string; + detail?: string | null; +}) { + const title = detail ? `${label}: ${detail}` : label; + return ( + + + {title} + + ); +} diff --git a/src/components/ModelLaunchModal.tsx b/src/components/ModelLaunchModal.tsx index db8ff73..432ce6c 100644 --- a/src/components/ModelLaunchModal.tsx +++ b/src/components/ModelLaunchModal.tsx @@ -1,7 +1,7 @@ import { useEffect, useState } from "react"; import { RuntimeControls } from "./RuntimeControls"; import { number, sizeLabel } from "../utils"; -import type { LaunchPreferences, PreviewMetrics, SystemStats } from "../types"; +import type { LaunchPreferences, PreviewMetrics, StrategyInstallLog, SystemStats } from "../types"; import type { ChatModelOption } from "../types/chat"; export interface ModelLaunchModalProps { @@ -19,6 +19,7 @@ export interface ModelLaunchModalProps { availableCacheStrategies: SystemStats["availableCacheStrategies"] | undefined; dflashInfo?: SystemStats["dflash"]; installingPackage: string | null; + installLogs?: Record; turboInstalled?: boolean; onSelectedKeyChange: (key: string) => void; onSearchChange: (value: string) => void; @@ -43,6 +44,7 @@ export function ModelLaunchModal({ availableCacheStrategies, dflashInfo, installingPackage, + installLogs, turboInstalled, onSelectedKeyChange, onSearchChange, @@ -161,6 +163,7 @@ export function ModelLaunchModal({ availableCacheStrategies={availableCacheStrategies} onInstallPackage={onInstallPackage} installingPackage={installingPackage} + installLogs={installLogs} dflashInfo={dflashInfo} selectedBackend={selectedOption?.backend} selectedModelRef={selectedOption?.modelRef} diff --git a/src/components/PerformancePreview.tsx b/src/components/PerformancePreview.tsx index e7ee592..80e51a8 100644 --- a/src/components/PerformancePreview.tsx +++ b/src/components/PerformancePreview.tsx @@ -1,5 +1,6 @@ import type { PreviewMetrics } from "../types"; import { ProgressRow } from "./ProgressRow"; +import { getCacheFitStatus } from "../utils/cache"; interface PerformancePreviewProps { preview: PreviewMetrics; @@ -13,48 +14,6 @@ function fmt(value: number, digits = 1): string { return value.toFixed(digits); } -interface FitStatus { - label: string; - className: string; - /** Human-readable explanation of the dominant lever when things don't - * fit. Only populated for the "May not fit" tier — the other tiers are - * self-explanatory. */ - advice: string | null; -} - -function getFitStatus( - optimizedCacheGb: number, - diskSizeGb: number, - totalGb: number, - bits: number, -): FitStatus { - // Use total system memory since loading a new model unloads the previous one. - const totalNeeded = optimizedCacheGb + diskSizeGb; - // Reserve ~20% for OS and other apps - const usable = totalGb * 0.80; - const ratio = usable > 0 ? totalNeeded / usable : 1; - if (ratio < 0.7) return { label: "Fits easily", className: "success", advice: null }; - if (ratio < 0.95) return { label: "Tight fit", className: "warning", advice: null }; - - // "May not fit" — pick the most useful lever to show the user. When the - // cache pool dwarfs the weights (classic "256K context on a 26B model" - // situation), the right fix is context + strategy, not model size. When - // the weights themselves are the problem, no context lever will help. 
- const cacheDominates = optimizedCacheGb > diskSizeGb * 1.5; - let advice: string; - if (!cacheDominates) { - advice = - "Model weights alone exceed available RAM. Pick a smaller model or a more aggressive quantisation."; - } else if (bits <= 0) { - advice = - "Native f16 cache grows with context — at this setting it's bigger than RAM. Lower the context slider, or pick a compressed strategy (RotorQuant / TriAttention)."; - } else { - advice = - "Compressed cache still exceeds RAM at this context. Lower the context slider or reduce FP16 layers."; - } - return { label: "May not fit", className: "warning", advice }; -} - function getSpeedLabel(tokS: number): { label: string; className: string } | null { if (tokS < 5) return { label: "Slow", className: "perf-preview__speed-label--slow" }; if (tokS < 15) return { label: "Good", className: "perf-preview__speed-label--good" }; @@ -64,7 +23,7 @@ function getSpeedLabel(tokS: number): { label: string; className: string } | nul export function PerformancePreview({ preview, availableMemoryGb, totalMemoryGb, compact, actualDiskSizeGb }: PerformancePreviewProps) { const diskGb = actualDiskSizeGb ?? preview.diskSizeGb; - const fitStatus = getFitStatus(preview.optimizedCacheGb, diskGb, totalMemoryGb, preview.bits); + const fitStatus = getCacheFitStatus(preview.optimizedCacheGb, diskGb, totalMemoryGb, preview.bits); const cacheDelta = preview.baselineCacheGb - preview.optimizedCacheGb; const qualityDelta = preview.qualityPercent - 100; const cacheMax = Math.max(preview.baselineCacheGb, totalMemoryGb * 0.6, 1); diff --git a/src/components/RuntimeControls.tsx b/src/components/RuntimeControls.tsx index 1d0b98c..9480fcb 100644 --- a/src/components/RuntimeControls.tsx +++ b/src/components/RuntimeControls.tsx @@ -1,5 +1,5 @@ import { useEffect, useState } from "react"; -import type { LaunchPreferences, PreviewMetrics } from "../types"; +import type { LaunchPreferences, PreviewMetrics, StrategyInstallLog } from "../types"; import { SliderField } from "./SliderField"; import { PerformancePreview } from "./PerformancePreview"; import { @@ -121,6 +121,7 @@ interface RuntimeControlsProps { availableCacheStrategies?: CacheStrategyOption[]; onInstallPackage?: (strategyId: string) => void; installingPackage?: string | null; + installLogs?: Record; dflashInfo?: DFlashInfo; /** Backend of the selected model (e.g. "mlx", "gguf", "vllm", "auto"). Used for compatibility validation. */ selectedBackend?: string | null; @@ -133,6 +134,77 @@ interface RuntimeControlsProps { turboUpdateAvailable?: boolean; } +function StrategyInstallTerminal({ + label, + log, +}: { + label: string; + log?: StrategyInstallLog; +}) { + const status = log?.status ?? "idle"; + const summaryStatus = + status === "running" ? "running" : + status === "success" ? "complete" : + status === "failed" ? "failed" : + "ready"; + const lines = log?.steps.length + ? log.steps.map((step) => [ + `$ ${step.command}`, + `[${step.status.toUpperCase()}] ${step.label}`, + formatStrategyInstallOutput(step.output, step.status), + ].join("\n")).join("\n\n") + : "No install output yet. Run the installer to capture stdout and stderr here."; + + return ( +
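A worked example of the extracted fit heuristic, assuming getCacheFitStatus keeps the signature PerformancePreview calls it with (optimizedCacheGb, diskSizeGb, totalGb, bits):

import { getCacheFitStatus } from "../utils/cache";

// 64 GB machine: usable = 64 * 0.80 = 51.2 GB.
// 26 GB of weights + 30 GB of optimized cache gives 56 / 51.2 ≈ 1.09 ≥ 0.95,
// so the tier is "May not fit". The cache (30 GB) does not exceed 1.5x the
// weights (39 GB), so the advice targets model size rather than the context slider.
const fit = getCacheFitStatus(30, 26, 64, 4);
console.log(fit.label);  // "May not fit"
console.log(fit.advice); // the weights-focused advice string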
+ + {label} install terminal + + {summaryStatus} + + +
+ {log?.startedAt ? Started {log.startedAt} : Collapsed by default. Open after an install attempt to inspect failures.} + {log?.finishedAt ? Finished {log.finishedAt} : null} +
+
{lines}
+
+ ); +} + +function formatStrategyInstallOutput(output: string, status: string): string { + const trimmed = output.trim(); + if (!trimmed || status !== "success") return trimmed || "(no output)"; + + const lines = trimmed.split(/\r?\n/); + const filtered: string[] = []; + let omittedResolverWarning = false; + let inResolverWarning = false; + for (const line of lines) { + const text = line.trim(); + if (/^ERROR: pip's dependency resolver does not currently take into account/i.test(text)) { + omittedResolverWarning = true; + inResolverWarning = true; + continue; + } + if (inResolverWarning) { + if ( + text === "" || + /^\S+\s+\S+\s+requires\s+.+which is not installed\.$/i.test(text) || + /^\S+\s+\S+\s+requires\s+.+but you have .+ which is incompatible\.$/i.test(text) + ) { + continue; + } + inResolverWarning = false; + } + filtered.push(line); + } + if (omittedResolverWarning) { + filtered.push("[pip resolver warnings omitted; install command exited successfully]"); + } + return filtered.join("\n").trim() || "(no output)"; +} + export function RuntimeControls({ settings, onChange, @@ -147,6 +219,7 @@ export function RuntimeControls({ availableCacheStrategies, onInstallPackage, installingPackage, + installLogs, dflashInfo, selectedBackend, selectedModelRef, @@ -173,6 +246,8 @@ export function RuntimeControls({ const dflashUnavailableReason = dflashSupport.reason; const ddtreeAvailable = dflashSupport.ddtreeAvailable; const canInstallDflashForModel = dflashSupport.modelSupported === true; + const dflashInstallLog = installLogs?.["dflash-mlx"] ?? installLogs?.dflash; + const showDflashInstallTerminal = Boolean(dflashInstallLog || (!dflashInstalled && !isGgufBackend && canInstallDflashForModel && onInstallPackage)); const specActive = settings.speculativeDecoding && dflashAvailable; const strategies = (availableCacheStrategies ?? [{id: "native", name: "Native f16", available: true, bitRange: null, defaultBits: null, supportsFp16Layers: false}]) .filter((s) => !s.appliesTo || s.appliesTo.length === 0 || s.appliesTo.includes("text")); @@ -180,6 +255,13 @@ export function RuntimeControls({ const selectedStrategy = strategies.find(s => s.id === settings.cacheStrategy) ?? strategies[0]; const fp16LayersSupported = Boolean(selectedStrategy?.supportsFp16Layers) && !isGgufBackend; const [expandedInfo, setExpandedInfo] = useState(null); + const isStrategyRuntimeAvailable = (strategy: CacheStrategyOption) => { + if (strategy.requiredLlamaBinary === "turbo" && isGgufBackend) { + return Boolean(turboInstalled); + } + return strategy.available; + }; + const selectedStrategyRuntimeAvailable = selectedStrategy ? 
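For reference, an input/output sketch of the resolver-warning filter above (package names and pip wording are illustrative):

const raw = [
  "Successfully installed rotorquant-0.3.1",
  "ERROR: pip's dependency resolver does not currently take into account all the packages that are installed.",
  "somepkg 1.0 requires oldlib<2.0, but you have oldlib 3.0 which is incompatible.",
].join("\n");

// Success: the resolver block is dropped and a one-line note is appended.
formatStrategyInstallOutput(raw, "success");
// → "Successfully installed rotorquant-0.3.1\n[pip resolver warnings omitted; install command exited successfully]"

// Any other status returns the trimmed output untouched.
formatStrategyInstallOutput(raw, "failed"); // → raw, trimmed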
isStrategyRuntimeAvailable(selectedStrategy) : false; useEffect(() => { if (isGgufBackend && settings.fp16Layers !== 0) { @@ -189,7 +271,7 @@ export function RuntimeControls({ useEffect(() => { if (settings.cacheStrategy === "native") return; - if (hasSelectedStrategy && selectedStrategy?.available && isStrategyCompatible(settings.cacheStrategy, selectedBackend)) return; + if (hasSelectedStrategy && selectedStrategyRuntimeAvailable && isStrategyCompatible(settings.cacheStrategy, selectedBackend)) return; onChange("cacheStrategy", "native"); if (settings.cacheBits !== 0) onChange("cacheBits", 0); if (settings.fp16Layers !== 0) onChange("fp16Layers", 0); @@ -197,7 +279,7 @@ export function RuntimeControls({ hasSelectedStrategy, onChange, selectedBackend, - selectedStrategy?.available, + selectedStrategyRuntimeAvailable, settings.cacheBits, settings.cacheStrategy, settings.fp16Layers, @@ -253,7 +335,7 @@ export function RuntimeControls({ } function selectStrategy(strategy: CacheStrategyOption) { - if (!strategy.available || !isStrategyCompatible(strategy.id, selectedBackend)) return; + if (!isStrategyRuntimeAvailable(strategy) || !isStrategyCompatible(strategy.id, selectedBackend)) return; onChange("cacheStrategy", strategy.id); if (strategy.defaultBits != null) { onChange("cacheBits", strategy.defaultBits); @@ -285,8 +367,9 @@ export function RuntimeControls({ const incompatReason = strategyIncompatReason(strategy.id, selectedBackend); const isIncompat = incompatReason != null; const needsTurbo = strategy.requiredLlamaBinary === "turbo"; - const turboMissing = needsTurbo && isGgufBackend && turboInstalled === false; - const isDisabled = !strategy.available || (specActive && strategy.id !== "native") || isIncompat || turboMissing; + const turboMissing = needsTurbo && isGgufBackend && !turboInstalled; + const runtimeAvailable = isStrategyRuntimeAvailable(strategy); + const isDisabled = !runtimeAvailable || (specActive && strategy.id !== "native") || isIncompat || turboMissing; return (
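The availability override above keeps catalog flags authoritative except for turbo-gated strategies on GGUF backends, where the installed turbo binary becomes the source of truth. A condensed restatement (strategy fields abbreviated, the id is hypothetical):

// requiredLlamaBinary === "turbo" on a GGUF backend → track turboInstalled;
// every other case falls through to the catalog's own `available` flag.
const strategy = { id: "rotorquant", available: false, requiredLlamaBinary: "turbo" };
// isGgufBackend && turboInstalled  → true  ("Ready")
// isGgufBackend && !turboInstalled → false ("No turbo binary" badge)
// non-GGUF backend                 → strategy.available (false → "Install")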
@@ -301,10 +384,10 @@ export function RuntimeControls({ {strategy.name} - {isIncompat ? "N/A" : turboMissing ? "No turbo binary" : strategy.available ? "Ready" : strategy.availabilityBadge ?? "Install"} + {isIncompat ? "N/A" : turboMissing ? "No turbo binary" : runtimeAvailable ? "Ready" : strategy.availabilityBadge ?? "Install"} {info ? ( @@ -321,7 +404,7 @@ export function RuntimeControls({ {isExpanded && info ? (

{info.description}

- {!strategy.available && strategy.availabilityReason ? ( + {!runtimeAvailable && strategy.availabilityReason ? (

{strategy.availabilityReason}

) : null}
@@ -332,7 +415,7 @@ export function RuntimeControls({
Install: {info.install} - {info.autoInstallPackage && onInstallPackage && !strategy.available ? ( + {info.autoInstallPackage && onInstallPackage && !runtimeAvailable ? (
) : null}
@@ -524,6 +613,9 @@ export function RuntimeControls({ ) : null}
) : null} + {showDflashInstallTerminal ? ( + + ) : null} {settings.speculativeDecoding && dflashAvailable ? (
) : null} @@ -408,6 +407,17 @@ export function OnlineModelsTab({ const isDownloadPaused = downloadState?.state === "cancelled"; const isDownloadFailed = downloadState?.state === "failed"; const isDownloadComplete = downloadState?.state === "completed"; + const hubStatus: { kind: ModelStatusKind; label: string; detail?: string | null } | null = model.availableLocally + ? { kind: "installed", label: "Installed" } + : isDownloadComplete + ? { kind: "downloaded", label: "Download complete" } + : isDownloading && downloadState + ? { kind: "downloading", label: "Downloading", detail: downloadProgressLabel(downloadState) } + : isDownloadPaused && downloadState + ? { kind: "paused", label: "Paused", detail: downloadProgressLabel(downloadState) } + : isDownloadFailed && downloadState + ? { kind: "failed", label: "Failed", detail: downloadState.error ?? "Download failed" } + : null; return (
{model.name} {model.provider} {model.format} - {model.availableLocally ? Downloaded : null} - {!model.availableLocally && isDownloadComplete ? Download complete : null} - {!model.availableLocally && isDownloading ? ( - {downloadProgressLabel(downloadState)} - ) : null} - {!model.availableLocally && isDownloadPaused ? ( - {downloadProgressLabel(downloadState)} - ) : null} - {!model.availableLocally && isDownloadFailed ? ( - Download failed - ) : null} + {hubStatus ? <StatusIcon status={hubStatus.kind} label={hubStatus.label} detail={hubStatus.detail} /> : null}
{formatReleaseLabel(model.releaseLabel, model.createdAt) ? ( @@ -554,66 +554,30 @@ export function OnlineModelsTab({
{model.availableLocally ? ( <> - - + onOpenModelSelector("thread")} /> + onOpenModelSelector("server")} /> ) : isDownloading ? ( <> - {downloadProgressLabel(downloadState)} - - + onCancelModelDownload(model.repo)} /> + onDeleteModelDownload(model.repo)} /> ) : isDownloadPaused ? ( <> - {downloadProgressLabel(downloadState)} - - + onDownloadModel(model.repo)} /> + onDeleteModelDownload(model.repo)} /> ) : isDownloadFailed ? ( <> - Download failed - - + onDownloadModel(model.repo)} /> + onDeleteModelDownload(model.repo)} /> ) : isDownloadComplete ? ( - Download complete + ) : ( - + onDownloadModel(model.repo)} /> )} - { - event.preventDefault(); - onOpenExternalUrl(model.link); - }} - > - Open on HuggingFace ↗ - + onOpenExternalUrl(model.link)} />
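The old text buttons collapse into the shared icon components; a small usage sketch of the contract declared in ModelActionIcons.tsx (the progress detail string is illustrative):

import { IconActionButton, StatusIcon } from "../../components/ModelActionIcons";

function ExampleActions({ repo, onDownload }: { repo: string; onDownload: (repo: string) => void }) {
  return (
    <>
      {/* Renders a button with the named SVG icon; `label` supplies its accessible text. */}
      <IconActionButton icon="download" label="Download" onClick={() => onDownload(repo)} />
      {/* Renders a status badge; the tooltip reads "label" or "label: detail". */}
      <StatusIcon status="downloading" label="Downloading" detail="3.1 GB / 7.4 GB" />
    </>
  );
}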
) : null} diff --git a/src/features/video/VideoDiscoverTab.tsx b/src/features/video/VideoDiscoverTab.tsx index 475bdb3..383b6aa 100644 --- a/src/features/video/VideoDiscoverTab.tsx +++ b/src/features/video/VideoDiscoverTab.tsx @@ -1,5 +1,6 @@ -import { useEffect } from "react"; +import { useEffect, useMemo, useState } from "react"; import { InstallLogPanel } from "../../components/InstallLogPanel"; +import { IconActionButton, StatusIcon } from "../../components/ModelActionIcons"; import { Panel } from "../../components/Panel"; import type { DownloadStatus, InstallResult, LongLiveJobState } from "../../api"; import type { @@ -10,21 +11,27 @@ import type { import type { DiscoverSort } from "../../types/image"; import type { VideoDiscoverTaskFilter } from "../../types/video"; import { + compactModelSizeLabel, + compactReleaseLabel, downloadProgressLabel, downloadSizeTooltip, formatReleaseLabel, - number, + videoDiscoverMemoryEstimate, + videoDeleteLabelForRepo, + videoDeleteRepoForVariant, + videoDownloadStatusForVariant, videoPrimarySizeLabel, videoSecondarySizeLabel, } from "../../utils"; +type MediaStatusFilter = "all" | "installed" | "not-installed" | "downloading" | "paused" | "failed" | "incomplete"; +type SortDir = "asc" | "desc"; + // LongLive ships via a dedicated Python installer (isolated venv + GitHub // clone + HF weights at Efficient-Large-Model/LongLive-1.3B), not via // snapshot_download. The catalog repo id ``NVlabs/LongLive-1.3B`` is the // GitHub org and intentionally does not resolve on Hugging Face — we use -// it purely as a routing key. Detect LongLive here so the Discover card -// can swap the Download button for an Install LongLive CTA that matches -// the Studio tab's existing install affordance. +// it purely as a routing key. function isLongLiveRepo(repo: string | undefined): boolean { return repo?.startsWith("NVlabs/LongLive") ?? false; } @@ -44,13 +51,10 @@ export interface VideoDiscoverTabProps { fileRevealLabel: string; longLiveStatus: VideoRuntimeStatus | null; installingLongLive: boolean; - // Live LongLive install job — same async-poll job as VideoStudioTab so - // either tab's "Install LongLive" button drives the same backend - // worker and renders the same per-phase terminal output. longLiveJob: LongLiveJobState | null; onActiveTabChange: (tab: TabId) => void; onOpenVideoStudio: (modelId?: string) => void; - onVideoDownload: (repo: string) => void; + onVideoDownload: (repo: string, modelId?: string) => void; onCancelVideoDownload: (repo: string) => void; onDeleteVideoDownload: (repo: string) => void; onOpenExternalUrl: (url: string) => void; @@ -59,6 +63,106 @@ export interface VideoDiscoverTabProps { onInstallLongLive: () => Promise; } +function videoDiscoverSortLabel(sort: DiscoverSort): string { + if (sort === "name") return "name"; + if (sort === "provider") return "provider"; + if (sort === "tasks") return "tasks"; + if (sort === "size") return "largest size first"; + if (sort === "ram") return "highest RAM/VRAM first"; + if (sort === "likes") return "most liked first"; + if (sort === "downloads") return "most downloads first"; + if (sort === "status") return "status"; + return "newest released first"; +} + +function sortIndicator(activeSort: DiscoverSort, sortDir: SortDir, key: DiscoverSort): string { + if (activeSort !== key) return ""; + return sortDir === "asc" ? " \u25B2" : " \u25BC"; +} + +function defaultSortDir(sort: DiscoverSort): SortDir { + return sort === "name" || sort === "provider" || sort === "tasks" ? 
"asc" : "desc"; +} + +function releaseSortKey(variant: VideoModelVariant): string { + return variant.releaseDate ?? variant.createdAt ?? variant.lastModified ?? ""; +} + +function sizeSortKey(variant: VideoModelVariant): number | null { + const candidates = [variant.onDiskGb, variant.coreWeightsGb, variant.repoSizeGb, variant.sizeGb]; + for (const value of candidates) { + if (typeof value === "number" && Number.isFinite(value) && value > 0) return value; + } + return null; +} + +function compareNullableNumberDesc(left: number | null, right: number | null): number { + const leftKnown = typeof left === "number" && Number.isFinite(left); + const rightKnown = typeof right === "number" && Number.isFinite(right); + if (leftKnown && rightKnown) return (right as number) - (left as number); + if (leftKnown) return -1; + if (rightKnown) return 1; + return 0; +} + +function compareNullableNumber(left: number | null, right: number | null, dir: SortDir): number { + const desc = compareNullableNumberDesc(left, right); + return dir === "desc" ? desc : -desc; +} + +function statusSortKey(status: MediaStatusFilter): number { + if (status === "installed") return 0; + if (status === "downloading") return 1; + if (status === "paused") return 2; + if (status === "failed") return 3; + if (status === "incomplete") return 4; + if (status === "not-installed") return 5; + return 6; +} + +function memoryParts(label: string | null | undefined): { primary: string; secondary: string | null } { + if (!label) return { primary: "pending", secondary: null }; + const [primary, secondary] = label.split(" @ "); + if (!secondary) return { primary, secondary: null }; + return { primary: `${primary} @`, secondary }; +} + +function videoVariantStatus( + variant: VideoModelVariant, + downloadState: DownloadStatus | undefined, + longLiveReady: boolean, + installingLongLive: boolean, +): MediaStatusFilter { + if (isLongLiveRepo(variant.repo)) { + if (longLiveReady) return "installed"; + if (installingLongLive) return "downloading"; + return "not-installed"; + } + if (variant.availableLocally || downloadState?.state === "completed") return "installed"; + if (downloadState?.state === "downloading") return "downloading"; + if (downloadState?.state === "cancelled") return "paused"; + if (downloadState?.state === "failed") return "failed"; + if (variant.hasLocalData) return "incomplete"; + return "not-installed"; +} + +function statusBadge(status: MediaStatusFilter, downloadState?: DownloadStatus, longLiveInstalling = false) { + const downloadDetail = downloadState + ? [downloadProgressLabel(downloadState), downloadSizeTooltip(downloadState)].filter(Boolean).join(" / ") + : null; + if (status === "installed") return ; + if (longLiveInstalling) return ; + if (status === "downloading" && downloadState) { + return ; + } + if (status === "paused" && downloadState) { + return ; + } + if (status === "failed") return ; + if (status === "incomplete") return ; + return ; +} + export function VideoDiscoverTab({ combinedVideoDiscoverResults, videoDiscoverSearchInput, @@ -85,22 +189,85 @@ export function VideoDiscoverTab({ onRefreshLongLiveStatus, onInstallLongLive, }: VideoDiscoverTabProps) { - // Probe LongLive install state whenever the results include a LongLive - // variant so the card can render "Installed" vs "Install LongLive" - // without the user having to open the Studio tab first. Mirrors the - // same effect in VideoStudioTab. 
const hasLongLiveVariant = combinedVideoDiscoverResults.some((variant) => isLongLiveRepo(variant.repo), ); useEffect(() => { if (hasLongLiveVariant) onRefreshLongLiveStatus(); }, [hasLongLiveVariant, onRefreshLongLiveStatus]); + + const [statusFilter, setStatusFilter] = useState("all"); + const [sortDir, setSortDir] = useState(defaultSortDir(videoDiscoverSort)); const longLiveReady = longLiveStatus?.realGenerationAvailable ?? false; + const filteredResults = useMemo( + () => + combinedVideoDiscoverResults + .map((variant) => { + const downloadState = videoDownloadStatusForVariant(activeVideoDownloads, variant); + const status = videoVariantStatus(variant, downloadState, longLiveReady, installingLongLive); + const memoryEstimate = videoDiscoverMemoryEstimate(variant); + return { variant, status, memoryEstimate }; + }) + .filter(({ status }) => statusFilter === "all" || status === statusFilter) + .sort((left, right) => { + if (videoDiscoverSort === "name") { + const diff = left.variant.name.localeCompare(right.variant.name); + return sortDir === "asc" ? diff : -diff; + } + if (videoDiscoverSort === "provider") { + const diff = left.variant.provider.localeCompare(right.variant.provider); + if (diff !== 0) return sortDir === "asc" ? diff : -diff; + } + if (videoDiscoverSort === "tasks") { + const diff = left.variant.taskSupport.join(" ").localeCompare(right.variant.taskSupport.join(" ")); + if (diff !== 0) return sortDir === "asc" ? diff : -diff; + } + if (videoDiscoverSort === "size") { + const diff = compareNullableNumber(sizeSortKey(left.variant), sizeSortKey(right.variant), sortDir); + if (diff !== 0) return diff; + } else if (videoDiscoverSort === "ram") { + const diff = compareNullableNumber(left.memoryEstimate?.estimatedPeakGb ?? null, right.memoryEstimate?.estimatedPeakGb ?? null, sortDir); + if (diff !== 0) return diff; + } else if (videoDiscoverSort === "status") { + const diff = statusSortKey(left.status) - statusSortKey(right.status); + if (diff !== 0) return sortDir === "asc" ? diff : -diff; + } else if (videoDiscoverSort === "likes") { + const diff = compareNullableNumber(left.variant.likes ?? null, right.variant.likes ?? null, sortDir); + if (diff !== 0) return diff; + } else if (videoDiscoverSort === "downloads") { + const diff = compareNullableNumber(left.variant.downloads ?? null, right.variant.downloads ?? null, sortDir); + if (diff !== 0) return diff; + } + const dateDiff = releaseSortKey(right.variant).localeCompare(releaseSortKey(left.variant)); + if (dateDiff !== 0) return sortDir === "desc" ? dateDiff : -dateDiff; + return left.variant.name.localeCompare(right.variant.name); + }), + [ + activeVideoDownloads, + combinedVideoDiscoverResults, + installingLongLive, + longLiveReady, + sortDir, + statusFilter, + videoDiscoverSort, + ], + ); + const hasActiveFilters = videoDiscoverHasActiveFilters || statusFilter !== "all"; + + function applySort(nextSort: DiscoverSort) { + if (videoDiscoverSort === nextSort) { + setSortDir(sortDir === "asc" ? "desc" : "asc"); + } else { + onVideoDiscoverSortChange(nextSort); + setSortDir(defaultSortDir(nextSort)); + } + } + return (
@@ -143,16 +310,42 @@ export function VideoDiscoverTab({ +
@@ -162,8 +355,11 @@ export function VideoDiscoverTab({ onClick={() => { onVideoDiscoverSearchInputChange(""); onVideoDiscoverTaskFilterChange("all"); + setStatusFilter("all"); + onVideoDiscoverSortChange("release"); + setSortDir("desc"); }} - disabled={!videoDiscoverHasActiveFilters} + disabled={!hasActiveFilters} > Clear Filters @@ -172,12 +368,7 @@ export function VideoDiscoverTab({
- {combinedVideoDiscoverResults.length} model{combinedVideoDiscoverResults.length !== 1 ? "s" : ""} ·{" "} - {videoDiscoverSort === "likes" - ? "most liked first" - : videoDiscoverSort === "downloads" - ? "most downloads first" - : "newest released first"} + {filteredResults.length} model{filteredResults.length !== 1 ? "s" : ""} · {videoDiscoverSortLabel(videoDiscoverSort)} {videoDiscoverSearchQuery ? ( Search: {videoDiscoverSearchInput.trim()} @@ -185,152 +376,142 @@ export function VideoDiscoverTab({ {videoDiscoverTaskFilter !== "all" ? ( Task: {videoDiscoverTaskFilter} ) : null} + {statusFilter !== "all" ? Status: {statusFilter} : null}
- {combinedVideoDiscoverResults.length === 0 ? ( + {filteredResults.length === 0 ? (

Try broadening the filters or search terms.

) : ( -
- {combinedVideoDiscoverResults.map((variant) => { - const isLongLive = isLongLiveRepo(variant.repo); - const downloadState = activeVideoDownloads[variant.repo]; - const isDownloading = downloadState?.state === "downloading"; - const isPaused = downloadState?.state === "cancelled"; - const isDownloadComplete = downloadState?.state === "completed"; - // LongLive never goes through the HF download pipeline — stale - // failure states from a prior mis-routed Download click would - // otherwise keep rendering "Download Failed" even after we - // offer the correct install CTA. - const isDownloadFailed = - !isLongLive && downloadState?.state === "failed"; - const isComplete = isLongLive - ? longLiveReady - : variant.availableLocally || isDownloadComplete; - const isPartial = !isLongLive && !isComplete && variant.hasLocalData; - const canDeleteLocalData = isLongLive - ? false - : Boolean( - isComplete || isDownloadComplete || isPaused || isDownloadFailed || isPartial, - ); - return ( -
-
-
-

{variant.name}

-

{variant.familyName ?? variant.provider}

-
- {isComplete ? ( - Installed - ) : isLongLive ? ( - installingLongLive ? ( - Installing… - ) : ( - Not installed - ) - ) : isDownloading ? ( - - {downloadProgressLabel(downloadState)} +
+
+ + + + + + + + +
+
+ {filteredResults.map(({ variant, status, memoryEstimate }) => { + const isLongLive = isLongLiveRepo(variant.repo); + const downloadState = videoDownloadStatusForVariant(activeVideoDownloads, variant); + const isComplete = status === "installed"; + const isDownloading = status === "downloading"; + const isPaused = status === "paused"; + const isDownloadFailed = status === "failed"; + const isPartial = status === "incomplete"; + const isDownloadComplete = downloadState?.state === "completed"; + const canDeleteLocalData = isLongLive + ? false + : Boolean(isComplete || isDownloadComplete || isPaused || isDownloadFailed || isPartial); + const localStatusReason = !isComplete && !isDownloading ? variant.localStatusReason : null; + const secondarySize = videoSecondarySizeLabel(variant); + const releaseLabel = compactReleaseLabel(formatReleaseLabel(variant.releaseLabel, variant.releaseDate ?? variant.createdAt)); + const primarySizeLabel = videoPrimarySizeLabel(variant); + const sizeTitle = [primarySizeLabel, secondarySize].filter(Boolean).join(" / "); + const memory = memoryParts(memoryEstimate?.label); + const deleteRepo = videoDeleteRepoForVariant(variant, downloadState); + const deleteLabel = isDownloading + ? "Cancel download" + : videoDeleteLabelForRepo(variant, deleteRepo, "Delete model"); + return ( +
+
+
+ {variant.name} + {variant.note} +
+ {variant.styleTags.slice(0, 4).map((tag) => ( + {tag} + ))} +
+
+ {variant.provider} +
+ {variant.taskSupport.map((task) => ( + {task} + ))} +
+ + {compactModelSizeLabel(primarySizeLabel)} - ) : isPaused ? ( - {downloadProgressLabel(downloadState)} - ) : isDownloadFailed ? ( - Download Failed - ) : isPartial ? ( - Incomplete - ) : null} -
-
- {videoPrimarySizeLabel(variant)} - {videoSecondarySizeLabel(variant) ? {videoSecondarySizeLabel(variant)} : null} - {variant.recommendedResolution} - {number(variant.defaultDurationSeconds)}s clip - {formatReleaseLabel(variant.releaseLabel, variant.releaseDate) ? ( - {formatReleaseLabel(variant.releaseLabel, variant.releaseDate)} - ) : null} - {variant.downloadsLabel ? {variant.downloadsLabel} : null} - {variant.likesLabel ? {variant.likesLabel} : null} - {variant.styleTags.slice(0, 3).map((tag) => ( - {tag} - ))} -
-

{variant.note}

- {isLongLive && !isComplete ? ( -

- LongLive installs into an isolated venv at{" "} - ~/.chaosengine/longlive. CUDA only, 5–15 min - depending on network. -

- ) : null} - {isDownloadFailed && downloadState?.error ? ( -

{downloadState.error}

- ) : null} -
- {isLongLive ? ( - isComplete ? ( - - ) : ( - <> - - - - ) - ) : isComplete ? ( - - ) : isDownloading ? ( - - ) : isPaused ? ( - - ) : ( - - )} - {!isLongLive && (isDownloading || canDeleteLocalData) ? ( - - ) : null} - {variant.localPath ? ( - + + {memory.primary} + {memory.secondary ? {memory.secondary} : null} + + + {releaseLabel ?? "Unknown"} + {variant.downloadsLabel ? {variant.downloadsLabel} : null} + {variant.likesLabel ? {variant.likesLabel} : null} + + {statusBadge(status, downloadState, isLongLive && installingLongLive && !longLiveReady)} +
+ {isLongLive ? ( + isComplete ? ( + onOpenVideoStudio(variant.id)} /> + ) : ( + <> + void onInstallLongLive()} disabled={installingLongLive} /> + + + ) + ) : isComplete ? ( + onOpenVideoStudio(variant.id)} /> + ) : isDownloading ? ( + <> + onCancelVideoDownload(downloadState?.repo ?? variant.repo)} /> + onDeleteVideoDownload(deleteRepo)} /> + + ) : isPaused ? ( + <> + onVideoDownload(variant.repo, variant.id)} /> + onDeleteVideoDownload(deleteRepo)} /> + + ) : ( + onVideoDownload(variant.repo, variant.id)} /> + )} + {!isLongLive && !isDownloading && !isPaused && canDeleteLocalData ? ( + onDeleteVideoDownload(deleteRepo)} /> + ) : null} + {variant.localPath ? ( + onRevealPath(variant.localPath as string)} /> + ) : null} + onOpenExternalUrl(variant.link)} /> +
+
+ {isLongLive && !isComplete ? ( +
+

+ LongLive installs into an isolated venv at ~/.chaosengine/longlive. + CUDA only, 5-15 min depending on network. +

+
+ ) : isDownloadFailed && downloadState?.error ? ( +
+

{downloadState.error}

+
+ ) : localStatusReason ? ( +
+

{localStatusReason}

+
) : null} -
-
- ); - })} + ); + })} +
)}
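Between the two media tabs the header-click behaviour is identical; a self-contained sketch of the toggle logic both applySort implementations share:

type SortDir = "asc" | "desc";
let sort = "release";
let dir: SortDir = "desc";

function applySortSketch(next: string): void {
  if (sort === next) {
    dir = dir === "asc" ? "desc" : "asc"; // same column: flip direction
  } else {
    sort = next;                          // new column: reset to its default
    dir = ["name", "provider", "tasks"].includes(next) ? "asc" : "desc";
  }
}

applySortSketch("name"); // name ascending (text columns default to A-Z)
applySortSketch("name"); // name descending
applySortSketch("size"); // size descending (numeric columns default to largest first)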
diff --git a/src/features/video/VideoModelsTab.tsx b/src/features/video/VideoModelsTab.tsx index 83760b3..c6ab00f 100644 --- a/src/features/video/VideoModelsTab.tsx +++ b/src/features/video/VideoModelsTab.tsx @@ -1,4 +1,6 @@ +import { useMemo, useState } from "react"; import { Panel } from "../../components/Panel"; +import { IconActionButton, StatusIcon } from "../../components/ModelActionIcons"; import type { DownloadStatus } from "../../api"; import type { TabId, @@ -6,7 +8,22 @@ import type { VideoModelVariant, VideoRuntimeStatus, } from "../../types"; -import { downloadProgressLabel, formatReleaseLabel, number, videoPrimarySizeLabel } from "../../utils"; +import { + compactModelSizeLabel, + compactReleaseLabel, + downloadProgressLabel, + formatReleaseLabel, + videoDiscoverMemoryEstimate, + videoDeleteLabelForRepo, + videoDeleteRepoForVariant, + videoDownloadStatusForVariant, + videoPrimarySizeLabel, + videoSecondarySizeLabel, +} from "../../utils"; + +type InstalledVideoSort = "name" | "provider" | "tasks" | "size" | "ram" | "date" | "status"; +type SortDir = "asc" | "desc"; +type InstalledVideoStatusFilter = "all" | "loaded" | "installed" | "incomplete" | "downloading" | "paused" | "failed"; export interface VideoModelsTabProps { installedVideoVariants: VideoModelVariant[]; @@ -19,7 +36,7 @@ export interface VideoModelsTabProps { fileRevealLabel: string; onActiveTabChange: (tab: TabId) => void; onOpenVideoStudio: (modelId?: string) => void; - onVideoDownload: (repo: string) => void; + onVideoDownload: (repo: string, modelId?: string) => void; onCancelVideoDownload: (repo: string) => void; onDeleteVideoDownload: (repo: string) => void; onPreloadVideoModel: (variant: VideoModelVariant) => void; @@ -28,6 +45,91 @@ export interface VideoModelsTabProps { onRevealPath: (path: string) => void; } +function releaseSortKey(variant: VideoModelVariant): string { + return variant.releaseDate ?? variant.createdAt ?? variant.lastModified ?? ""; +} + +function sizeSortKey(variant: VideoModelVariant): number | null { + const candidates = [variant.onDiskGb, variant.coreWeightsGb, variant.repoSizeGb, variant.sizeGb]; + for (const value of candidates) { + if (typeof value === "number" && Number.isFinite(value) && value > 0) return value; + } + return null; +} + +function compareNullableNumberDesc(left: number | null, right: number | null): number { + const leftKnown = typeof left === "number" && Number.isFinite(left); + const rightKnown = typeof right === "number" && Number.isFinite(right); + if (leftKnown && rightKnown) return (right as number) - (left as number); + if (leftKnown) return -1; + if (rightKnown) return 1; + return 0; +} + +function compareNullableNumber(left: number | null, right: number | null, dir: SortDir): number { + const desc = compareNullableNumberDesc(left, right); + return dir === "desc" ? desc : -desc; +} + +function statusSortKey(status: InstalledVideoStatusFilter): number { + if (status === "loaded") return 0; + if (status === "installed") return 1; + if (status === "downloading") return 2; + if (status === "paused") return 3; + if (status === "failed") return 4; + if (status === "incomplete") return 5; + return 6; +} + +function defaultSortDir(sort: InstalledVideoSort): SortDir { + return sort === "name" || sort === "provider" || sort === "tasks" ? 
"asc" : "desc"; +} + +function videoStatus( + variant: VideoModelVariant, + downloadState: DownloadStatus | undefined, + loadedVideoVariant: VideoModelVariant | null, +): InstalledVideoStatusFilter { + if (loadedVideoVariant?.id === variant.id) return "loaded"; + if (downloadState?.state === "downloading") return "downloading"; + if (downloadState?.state === "cancelled") return "paused"; + if (downloadState?.state === "failed") return "failed"; + if (variant.availableLocally || downloadState?.state === "completed") return "installed"; + return "incomplete"; +} + +function statusBadge(status: InstalledVideoStatusFilter, downloadState?: DownloadStatus) { + if (status === "loaded") return ; + if (status === "installed") return ; + if (status === "downloading" && downloadState) return ; + if (status === "paused" && downloadState) return ; + if (status === "failed") return ; + return ; +} + +function sortIndicator(activeSort: InstalledVideoSort, sortDir: SortDir, key: InstalledVideoSort): string { + if (activeSort !== key) return ""; + return sortDir === "asc" ? " \u25B2" : " \u25BC"; +} + +function sortLabel(sort: InstalledVideoSort, sortDir: SortDir): string { + const direction = sortDir === "asc" ? "ascending" : "descending"; + if (sort === "provider") return `provider ${direction}`; + if (sort === "tasks") return `tasks ${direction}`; + if (sort === "size") return sortDir === "desc" ? "largest size first" : "smallest size first"; + if (sort === "ram") return sortDir === "desc" ? "highest RAM/VRAM first" : "lowest RAM/VRAM first"; + if (sort === "status") return `status ${direction}`; + if (sort === "name") return sortDir === "asc" ? "name A-Z" : "name Z-A"; + return sortDir === "desc" ? "newest released first" : "oldest released first"; +} + +function memoryParts(label: string | null | undefined): { primary: string; secondary: string | null } { + if (!label) return { primary: "pending", secondary: null }; + const [primary, secondary] = label.split(" @ "); + if (!secondary) return { primary, secondary: null }; + return { primary: `${primary} @`, secondary }; +} + export function VideoModelsTab({ installedVideoVariants, videoCatalog, @@ -47,12 +149,86 @@ export function VideoModelsTab({ onOpenExternalUrl, onRevealPath, }: VideoModelsTabProps) { + const [searchInput, setSearchInput] = useState(""); + const [taskFilter, setTaskFilter] = useState<"all" | VideoModelVariant["taskSupport"][number]>("all"); + const [statusFilter, setStatusFilter] = useState("all"); + const [sort, setSort] = useState("date"); + const [sortDir, setSortDir] = useState("desc"); + const normalizedSearch = searchInput.trim().toLowerCase(); + const hasActiveFilters = + normalizedSearch.length > 0 || taskFilter !== "all" || statusFilter !== "all" || sort !== "date" || sortDir !== "desc"; + + function applySort(nextSort: InstalledVideoSort) { + if (sort === nextSort) { + setSortDir(sortDir === "asc" ? 
"desc" : "asc"); + } else { + setSort(nextSort); + setSortDir(defaultSortDir(nextSort)); + } + } + + const rows = useMemo(() => { + return installedVideoVariants + .map((variant) => { + const family = videoCatalog.find((item) => + item.variants.some((candidate) => candidate.id === variant.id), + ); + const downloadState = videoDownloadStatusForVariant(activeVideoDownloads, variant); + const status = videoStatus(variant, downloadState, loadedVideoVariant); + const memoryEstimate = videoDiscoverMemoryEstimate(variant); + return { variant, family, downloadState, status, memoryEstimate }; + }) + .filter(({ variant, family, status }) => { + if (taskFilter !== "all" && !variant.taskSupport.includes(taskFilter)) return false; + if (statusFilter !== "all" && status !== statusFilter) return false; + if (!normalizedSearch) return true; + const haystack = [ + variant.name, + variant.provider, + variant.repo, + variant.runtime, + family?.name ?? "", + variant.recommendedResolution, + variant.styleTags.join(" "), + variant.taskSupport.join(" "), + ].join(" ").toLowerCase(); + return haystack.includes(normalizedSearch); + }) + .sort((left, right) => { + if (sort === "name") { + const diff = left.variant.name.localeCompare(right.variant.name); + return sortDir === "asc" ? diff : -diff; + } + if (sort === "provider") { + const diff = left.variant.provider.localeCompare(right.variant.provider); + if (diff !== 0) return sortDir === "asc" ? diff : -diff; + } + if (sort === "tasks") { + const diff = left.variant.taskSupport.join(" ").localeCompare(right.variant.taskSupport.join(" ")); + if (diff !== 0) return sortDir === "asc" ? diff : -diff; + } + if (sort === "size") { + const diff = compareNullableNumber(sizeSortKey(left.variant), sizeSortKey(right.variant), sortDir); + if (diff !== 0) return diff; + } else if (sort === "ram") { + const diff = compareNullableNumber(left.memoryEstimate?.estimatedPeakGb ?? null, right.memoryEstimate?.estimatedPeakGb ?? null, sortDir); + if (diff !== 0) return diff; + } else if (sort === "status") { + const diff = statusSortKey(left.status) - statusSortKey(right.status); + if (diff !== 0) return sortDir === "asc" ? diff : -diff; + } + const dateDiff = releaseSortKey(right.variant).localeCompare(releaseSortKey(left.variant)); + if (dateDiff !== 0) return sortDir === "desc" ? dateDiff : -dateDiff; + return left.variant.name.localeCompare(right.variant.name); + }); + }, [activeVideoDownloads, installedVideoVariants, loadedVideoVariant, normalizedSearch, sort, sortDir, statusFilter, taskFilter, videoCatalog]); + return (
<Panel title={installedVideoVariants.length > 0 - ? `${installedVideoVariants.length} model${installedVideoVariants.length !== 1 ? "s" : ""} with local data` + ? `${rows.length} of ${installedVideoVariants.length} model${installedVideoVariants.length !== 1 ? "s" : ""} with local data` : "No video models detected locally yet"} className="span-2" actions={

Download a video model from Video Discover to get started.

) : ( -
- {installedVideoVariants.map((variant) => { - const family = videoCatalog.find((item) => - item.variants.some((candidate) => candidate.id === variant.id), - ); - const isComplete = variant.availableLocally; - const isPartial = !isComplete && variant.hasLocalData; - const downloadState = activeVideoDownloads[variant.repo]; - const isDownloading = downloadState?.state === "downloading"; - const isPaused = downloadState?.state === "cancelled"; - const isDownloadComplete = downloadState?.state === "completed"; - const isDownloadFailed = downloadState?.state === "failed"; - const canDeleteLocalData = Boolean( - isComplete || isDownloadComplete || isPaused || isDownloadFailed || isPartial, - ); - const isLoadedInMemory = loadedVideoVariant?.id === variant.id; - const canPreload = isComplete && videoRuntimeStatus.realGenerationAvailable && !isLoadedInMemory; - return ( -
-
-
-

{variant.name}

-

{family?.name ?? variant.provider}

-
- {isLoadedInMemory ? ( - In Memory - ) : isComplete || isDownloadComplete ? ( - Installed - ) : isDownloading ? ( - {downloadProgressLabel(downloadState)} - ) : isPaused ? ( - {downloadProgressLabel(downloadState)} - ) : isDownloadFailed ? ( - Download Failed - ) : isPartial ? ( - Incomplete - ) : null} -
-
- {videoPrimarySizeLabel(variant)} - {variant.recommendedResolution} - {number(variant.defaultDurationSeconds)}s clip - {formatReleaseLabel(variant.releaseLabel, variant.releaseDate) ? ( - {formatReleaseLabel(variant.releaseLabel, variant.releaseDate)} - ) : null} - {variant.styleTags.slice(0, 3).map((tag) => ( - {tag} - ))} -
- {isDownloadFailed && downloadState?.error ? ( -

{downloadState.error}

- ) : null} -
- {isComplete || isDownloadComplete ? ( - - ) : isDownloading ? ( - - ) : isPaused ? ( - - ) : ( - - )} - {canPreload ? ( - - ) : null} - {isLoadedInMemory ? ( - - ) : null} - {isDownloading || canDeleteLocalData ? ( - - ) : null} - {variant.localPath ? ( - - ) : null} - -
-
- ); - })} -
+ <> +
+ + + + +
+ +
+
+
+ {rows.length} model{rows.length !== 1 ? "s" : ""} · {sortLabel(sort, sortDir)} + {normalizedSearch ? Search: {searchInput.trim()} : null} + {taskFilter !== "all" ? Task: {taskFilter} : null} + {statusFilter !== "all" ? Status: {statusFilter} : null} +
+ {rows.length === 0 ? ( +
+

No installed video models match the current filters.

+
+ ) : ( +
+
+ + + + + + + + +
+
+ {rows.map(({ variant, family, downloadState, status, memoryEstimate }) => { + const isLoadedInMemory = status === "loaded"; + const isComplete = status === "loaded" || status === "installed"; + const isDownloading = status === "downloading"; + const isPaused = status === "paused"; + const isDownloadFailed = status === "failed"; + const isPartial = status === "incomplete"; + const canDeleteLocalData = Boolean(isComplete || isPaused || isDownloadFailed || isPartial); + const localStatusReason = !isComplete && !isDownloading ? variant.localStatusReason : null; + const secondarySize = videoSecondarySizeLabel(variant); + const releaseLabel = compactReleaseLabel(formatReleaseLabel(variant.releaseLabel, variant.releaseDate ?? variant.createdAt)); + const primarySizeLabel = videoPrimarySizeLabel(variant); + const sizeTitle = [primarySizeLabel, secondarySize].filter(Boolean).join(" / "); + const memory = memoryParts(memoryEstimate?.label); + const deleteRepo = videoDeleteRepoForVariant(variant, downloadState); + const deleteLabel = isDownloading + ? "Cancel download" + : videoDeleteLabelForRepo(variant, deleteRepo, "Delete model"); + return ( +
+
+
+ {variant.name} + {family?.name ?? variant.provider} +
+ {variant.styleTags.slice(0, 4).map((tag) => ( + {tag} + ))} +
+
+ {variant.provider} +
+ {variant.taskSupport.map((task) => ( + {task} + ))} +
+ + {compactModelSizeLabel(primarySizeLabel)} + + + {memory.primary} + {memory.secondary ? {memory.secondary} : null} + + {releaseLabel ?? "Unknown"} + {statusBadge(status, downloadState)} +
+ {isComplete ? ( + onOpenVideoStudio(variant.id)} /> + ) : isDownloading ? ( + onCancelVideoDownload(downloadState?.repo ?? variant.repo)} /> + ) : ( + onVideoDownload(variant.repo, variant.id)} /> + )} + {isDownloading || canDeleteLocalData ? ( + onDeleteVideoDownload(deleteRepo)} /> + ) : null} + {variant.localPath ? ( + onRevealPath(variant.localPath as string)} /> + ) : null} + onOpenExternalUrl(variant.link)} /> +
+
+ {isDownloadFailed && downloadState?.error ? ( +
+

{downloadState.error}

+
+ ) : localStatusReason ? ( +
+

{localStatusReason}

+
+ ) : null} +
+ ); + })} +
+
+ )} + )}
diff --git a/src/features/video/VideoStudioTab.tsx b/src/features/video/VideoStudioTab.tsx index 26448ed..9eb6cbf 100644 --- a/src/features/video/VideoStudioTab.tsx +++ b/src/features/video/VideoStudioTab.tsx @@ -15,6 +15,7 @@ import { defaultVideoVariantForFamily, downloadProgressLabel, number, + videoDownloadStatusForVariant, videoPrimarySizeLabel, videoSecondarySizeLabel, } from "../../utils"; @@ -68,7 +69,7 @@ export interface VideoStudioTabProps { onActiveTabChange: (tab: TabId) => void; onPreloadVideoModel: (variant: VideoModelVariant) => void; onUnloadVideoModel: (variant?: VideoModelVariant) => void; - onVideoDownload: (repo: string) => void; + onVideoDownload: (repo: string, modelId?: string) => void; onGenerateVideo: () => void; onOpenExternalUrl: (url: string) => void; onRestartServer: () => void; @@ -285,6 +286,7 @@ export function VideoStudioTab({ const mp4EncoderMissing = missingDependencies.some( (dep) => dep === "imageio" || dep === "imageio-ffmpeg", ); + const gpuBundleRestartRequired = gpuBundleJob?.phase === "done" && gpuBundleJob.requiresRestart; // Tokenizer / text-encoder packages individual pipelines need lazily — // tiktoken for LTX-Video, sentencepiece for Wan / HunyuanVideo / CogVideoX // / Mochi, plus the protobuf + ftfy support libs. We list them out as a @@ -343,7 +345,7 @@ export function VideoStudioTab({ variants: family.variants.filter((variant) => { if (variant.availableLocally) return true; if (variant.hasLocalData) return true; - const downloadState = activeVideoDownloads[variant.repo]; + const downloadState = videoDownloadStatusForVariant(activeVideoDownloads, variant); return downloadState?.state === "downloading" || downloadState?.state === "completed"; }), })) @@ -426,7 +428,7 @@ export function VideoStudioTab({ && !(mlxVideoStatus.missingDependencies ?? []).includes("mlx-video"); const downloadState = useMemo( - () => (selectedVideoVariant ? activeVideoDownloads[selectedVideoVariant.repo] : undefined), + () => (selectedVideoVariant ? videoDownloadStatusForVariant(activeVideoDownloads, selectedVideoVariant) : undefined), [activeVideoDownloads, selectedVideoVariant], ); const isDownloading = downloadState?.state === "downloading"; @@ -457,6 +459,8 @@ export function VideoStudioTab({ ? "Choose a video model first." : !isDownloaded ? `${selectedVideoVariant.name} is not installed locally yet.` + : gpuBundleRestartRequired + ? "Restart the backend to activate the newly installed GPU runtime before generating." : !selectedVideoRuntimeStatus.realGenerationAvailable ? (selectedVideoRuntimeStatus.message || "Video runtime is not ready.") : !hasPrompt @@ -490,6 +494,9 @@ export function VideoStudioTab({ deviceMemoryGb: selectedVideoRuntimeStatus.deviceMemoryGb, baseModelFootprintGb: selectedVideoVariant?.sizeGb, runtimeFootprintGb: selectedVideoVariant?.runtimeFootprintGb, + runtimeFootprintMpsGb: selectedVideoVariant?.runtimeFootprintMpsGb, + runtimeFootprintCudaGb: selectedVideoVariant?.runtimeFootprintCudaGb, + runtimeFootprintCpuGb: selectedVideoVariant?.runtimeFootprintCpuGb, }), [ videoWidth, @@ -499,6 +506,9 @@ export function VideoStudioTab({ selectedVideoRuntimeStatus.deviceMemoryGb, selectedVideoVariant?.sizeGb, selectedVideoVariant?.runtimeFootprintGb, + selectedVideoVariant?.runtimeFootprintMpsGb, + selectedVideoVariant?.runtimeFootprintCudaGb, + selectedVideoVariant?.runtimeFootprintCpuGb, ], ); @@ -599,6 +609,9 @@ export function VideoStudioTab({ {videoRuntimeStatus.realGenerationAvailable ? 
"Real engine ready" : "Fallback active"} + {gpuBundleRestartRequired ? ( + Restart required + ) : null} Engine: {videoRuntimeStatus.activeEngine} {/* Prefer the actual-loaded device; fall back to the predicted * expectedDevice computed via nvidia-smi + find_spec (no torch @@ -733,36 +746,31 @@ export function VideoStudioTab({
) : null} - {!videoRuntimeStatus.realGenerationAvailable ? ( + {gpuBundleRestartRequired ? ( + <> +
+

+ GPU runtime installed to{" "} + {gpuBundleJob.targetDir ?? "extras"}. The running backend + still has its old import cache — click Restart Backend to activate the + new runtime; video generation will then use it.

+
+ +
+
+ + + ) : !videoRuntimeStatus.realGenerationAvailable ? ( <>
- {/* Same post-install-awaiting-restart branch Image Studio - * uses. After a successful GPU bundle install, the - * running backend still can't see the new torch in - * extras (PYTHONPATH is snapshotted at spawn). Nudge - * the user toward Restart Backend instead of asking - * them to install again. */} - {gpuBundleJob?.phase === "done" && gpuBundleJob.requiresRestart ? ( - <> -

- GPU runtime installed to{" "} - {gpuBundleJob.targetDir ?? "extras"}. The running backend - still has its old import cache — click Restart Backend to activate the - new runtime, then video generation will use your GPU. -

-
- -
- - ) : ( - <>

Video generation needs the GPU runtime bundle (torch + diffusers + tokenizers, ~2.5 GB). Install it once — it writes to a persistent user-local directory so @@ -781,8 +789,6 @@ export function VideoStudioTab({ {busyAction === "Restarting server..." ? "Restarting..." : "Restart Backend"}

- - )}
@@ -800,7 +806,7 @@ export function VideoStudioTab({ > {studioFamilies.flatMap((family) => family.variants.map((variant) => { - const downloadState = activeVideoDownloads[variant.repo]; + const downloadState = videoDownloadStatusForVariant(activeVideoDownloads, variant); const isDownloadingVariant = downloadState?.state === "downloading"; const suffix = variant.availableLocally ? " (installed)" @@ -846,7 +852,9 @@ export function VideoStudioTab({ ) : isDownloading ? ( {downloadProgressLabel(downloadState)} ) : ( - Not downloaded + + {selectedVideoVariant.hasLocalData ? "Incomplete" : "Not downloaded"} + )} {selectedVideoLoaded ? In Memory : null} {videoRuntimeLoadedDifferentModel && loadedVideoVariant ? ( @@ -855,6 +863,12 @@ export function VideoStudioTab({
) : null} + {selectedVideoVariant?.localStatusReason && !isDownloaded && !isDownloading ? ( +

+ {selectedVideoVariant.localStatusReason} +

+ ) : null} +
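A condensed sketch of the generate-button preflight after this change; the first failing check wins, and the new restart gate sits between the local-install check and the runtime-readiness check (the prompt message is hypothetical, since the diff truncates there):

function generateDisabledReason(s: {
  modelName: string | null;
  isDownloaded: boolean;
  gpuBundleRestartRequired: boolean;
  runtimeReady: boolean;
  runtimeMessage: string | null;
  hasPrompt: boolean;
}): string | null {
  if (!s.modelName) return "Choose a video model first.";
  if (!s.isDownloaded) return `${s.modelName} is not installed locally yet.`;
  if (s.gpuBundleRestartRequired) {
    return "Restart the backend to activate the newly installed GPU runtime before generating.";
  }
  if (!s.runtimeReady) return s.runtimeMessage || "Video runtime is not ready.";
  if (!s.hasPrompt) return "Enter a prompt first."; // wording hypothetical
  return null;
}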