From 243c2bc773979ffc17fd606bb63c906ceaed9601 Mon Sep 17 00:00:00 2001
From: Cursor Agent <cursoragent@cursor.com>
Date: Sun, 3 May 2026 03:04:11 +0000
Subject: [PATCH 1/4] fix(onboarding): use catalog-resolved alias for outbound
 requests
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The background 'Hello World' batch and the Run-Now handler were both
reading from a single `modelAlias` value that fell back to a hard-coded
`medgemma-4b` while the catalog query was still loading. Because the
background effect fired immediately after auth resolved (well before
`useModels` returned), the visible payload would later re-render with
the catalog alias (e.g. 'deepseek') while the backend received
'medgemma-4b' — producing 'Model medgemma-4b has not been configured or
is not available to user' on every onboarding load in environments
without that model.

Split the alias into two values:

  - displayModelAlias: always populated (real alias or placeholder) and
    used only for rendering code samples so the UI is never blank.
  - runnableModelAlias: undefined while the catalog is loading and when
    the user has no accessible chat model. Used for outbound requests.

The background batch now waits for the catalog to resolve and bails
silently (no toast, no request) when there's no entitled chat model.
Run Now applies the same guard just before its IIFE: it skips the doomed
network call but still schedules the simulated success timer.

Co-authored-by: aschkanAH <aschkanAH@users.noreply.github.com>
---
 .../onboarding/Onboarding/Onboarding.tsx      | 104 +++++++++++++-----
 1 file changed, 74 insertions(+), 30 deletions(-)

diff --git a/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx b/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
index 5c7b150ab..0a2038a0d 100644
--- a/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
+++ b/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
@@ -39,11 +39,13 @@ import { AppSidebar } from "../../../layout/Sidebar/AppSidebar";
 const INVITE_WEBHOOK_URL: string | undefined =
   import.meta.env.VITE_INVITE_WEBHOOK_URL;
 
-// Default catalog model used in the visible code samples. We swap this with the
-// first available chat model alias from the user's catalog when one is found,
-// but keep medgemma-4b as a fallback so the snippet always renders something
-// concrete even before /models loads.
-const FALLBACK_MODEL_ALIAS = "medgemma-4b";
+// Placeholder alias used purely for rendering the code samples while the
+// catalog query is in flight or empty. We deliberately do NOT use this for
+// outbound API calls — the user almost certainly isn't entitled to it on
+// every deployment, so firing real requests against it produces 4xx errors
+// (see "Model 'medgemma-4b' has not been configured…"). Real requests are
+// gated on a catalog-resolved alias (see `runnableModelAlias` below).
+const FALLBACK_DISPLAY_MODEL_ALIAS = "medgemma-4b";
 
 const SUCCESS_REDIRECT_DELAY_MS = 2000;
 const RUN_NOW_SIMULATED_DELAY_MS = 2500;
@@ -209,16 +211,31 @@ export function Onboarding() {
   const uploadFile = useUploadFileWithProgress();
 
   // Pull the first chat model alias from the catalog so the rendered code
-  // samples reference something that will actually work for the user. Falls
-  // back to a hard-coded alias when the catalog query is still loading or
-  // empty.
-  const { data: modelsData } = useModels({ accessible: true, limit: 50 });
-  const modelAlias = useMemo(() => {
+  // samples reference something that will actually work for the user.
+  //
+  // We expose two values intentionally:
+  //   - runnableModelAlias: undefined while the catalog is still loading and
+  //     when the user has no accessible chat model. Used for outbound
+  //     requests (background batch, Run Now) so we never fire batches against
+  //     a hard-coded model the user isn't entitled to. The earlier behaviour
+  //     of falling back to "medgemma-4b" silently caused a divergence between
+  //     the rendered payload (e.g. "deepseek") and the model actually sent to
+  //     the backend, producing "Model 'medgemma-4b' has not been configured"
+  //     errors in environments where that model isn't available.
+  //   - displayModelAlias: always resolved (real alias when available, hard-
+  //     coded placeholder otherwise) so the rendered code samples are never
+  //     blank.
+  const { data: modelsData, isLoading: modelsLoading } = useModels({
+    accessible: true,
+    limit: 50,
+  });
+  const runnableModelAlias = useMemo<string | undefined>(() => {
     const chat = modelsData?.data?.find(
       (m) => (m.model_type ?? "CHAT") === "CHAT",
     );
-    return chat?.alias ?? FALLBACK_MODEL_ALIAS;
+    return chat?.alias;
   }, [modelsData]);
+  const displayModelAlias = runnableModelAlias ?? FALLBACK_DISPLAY_MODEL_ALIAS;
 
   // Mint a live API key on mount so step 1 has something concrete to show.
   // We only do this once per visit and only when the user is authenticated.
@@ -250,14 +267,21 @@ export function Onboarding() {
       });
   }, [authLoading, isAuthenticated, currentUser, createApiKey]);
 
-  // Fire the "Hello World" sample batch in the background on mount. This is
-  // best-effort: if the catalog has no chat model or the upload fails, we
-  // swallow the error and just hide the toast. The toast is shown
-  // optimistically so the user sees activity even if the model catalog is
-  // slow to load.
+  // Fire the "Hello World" sample batch in the background once we know which
+  // model to send it to. We deliberately wait for the catalog query so the
+  // outbound payload uses the same alias the visible code samples render
+  // (otherwise the user sees e.g. `deepseek` in the UI but the backend
+  // receives `medgemma-4b`). If the catalog has no accessible chat model we
+  // skip the background batch and the toast entirely — there's no plausible
+  // model to demo with, and a doomed POST would just spam the console.
   useEffect(() => {
     if (sampleBatchRequestedRef.current) return;
     if (authLoading || !isAuthenticated) return;
+    if (modelsLoading) return;
+    if (!runnableModelAlias) {
+      sampleBatchRequestedRef.current = true;
+      return;
+    }
     sampleBatchRequestedRef.current = true;
 
     toast("Sample Batch Started", {
@@ -267,12 +291,19 @@ export function Onboarding() {
       icon: <Sparkles className="w-4 h-4 text-doubleword-primary" />,
     });
 
+    const aliasForRequest = runnableModelAlias;
     void (async () => {
       try {
-        // Wait one tick for the models query to resolve. If it hasn't, the
-        // fallback alias is fine — the batch creation will just fail silently
-        // server-side which is acceptable for this background "demo" job.
-        const helloPayload = `{"custom_id": "hello-1", "method": "POST", "url": "/v1/chat/completions", "body": {"model": "${modelAlias}", "messages": [{"role": "user", "content": "Say hello."}]}}\n`;
+        const helloRow = {
+          custom_id: "hello-1",
+          method: "POST",
+          url: "/v1/chat/completions",
+          body: {
+            model: aliasForRequest,
+            messages: [{ role: "user", content: "Say hello." }],
+          },
+        };
+        const helloPayload = `${JSON.stringify(helloRow)}\n`;
         const blob = new Blob([helloPayload], { type: "application/jsonl" });
         const file = new File([blob], `onboarding-hello-${Date.now()}.jsonl`, {
           type: "application/jsonl",
@@ -292,10 +323,12 @@ export function Onboarding() {
         console.warn("Background Hello World batch failed:", err);
       }
     })();
-    // We intentionally only run this once after auth is resolved; modelAlias
-    // is read inside the IIFE so we don't need it as a dep.
+    // The other values read here are mutation handles whose identities may
+    // churn between renders; listing them as deps would only re-run this
+    // effect needlessly. The idempotency ref above is the single source of
+    // truth for whether the batch has already been requested.
     // eslint-disable-next-line react-hooks/exhaustive-deps
-  }, [authLoading, isAuthenticated]);
+  }, [authLoading, isAuthenticated, modelsLoading, runnableModelAlias]);
 
   const goToDashboard = useCallback(() => {
     navigate("/models");
@@ -311,15 +344,18 @@ export function Onboarding() {
     return () => clearTimeout(timer);
   }, [runState, listenerState, goToDashboard]);
 
+  // Visible code samples always render against the display alias so the UI
+  // is never blank; outbound requests use runnableModelAlias and bail out
+  // when undefined.
   const snippets = useMemo(
-    () => buildSnippets(apiKey ?? "<your-api-key>", modelAlias),
-    [apiKey, modelAlias],
+    () => buildSnippets(apiKey ?? "<your-api-key>", displayModelAlias),
+    [apiKey, displayModelAlias],
   );
 
   const browserPayload =
     workloadType === "batch"
-      ? buildJsonlPayload(modelAlias)
-      : buildAsyncPayload(modelAlias);
+      ? buildJsonlPayload(displayModelAlias)
+      : buildAsyncPayload(displayModelAlias);
   const cliSnippet = snippets[workloadType][language];
 
   const handleCopyKey = async () => {
@@ -348,7 +384,15 @@ export function Onboarding() {
     // success/failure to the run state machine since the spec asks for a
     // simulated 2.5s "running" → "success" cycle that gives the user a
     // predictable redirect experience, regardless of how fast the API
-    // responds.
+    // responds. If we have no catalog-resolved alias we skip the network
+    // call entirely rather than firing against the placeholder display
+    // alias (which the user is unlikely to be entitled to).
+    const aliasForRequest = runnableModelAlias;
+    if (!aliasForRequest) {
+      setTimeout(() => setRunState("success"), RUN_NOW_SIMULATED_DELAY_MS);
+      return;
+    }
+
     void (async () => {
       try {
         // Always build the JSONL via the object helpers so we never round-
@@ -358,12 +402,12 @@ export function Onboarding() {
         // still flipped the UI to "success".
         const payload =
           workloadType === "batch"
-            ? buildJsonlPayload(modelAlias)
+            ? buildJsonlPayload(aliasForRequest)
             : `${JSON.stringify({
                 custom_id: "row-1",
                 method: "POST",
                 url: "/v1/chat/completions",
-                body: buildAsyncPayloadObject(modelAlias),
+                body: buildAsyncPayloadObject(aliasForRequest),
               })}\n`;
         const blob = new Blob([payload], { type: "application/jsonl" });
         const file = new File(

From f7e7f470f9cc3a6fec39b43ac31a6b7e24b4f7e7 Mon Sep 17 00:00:00 2001
From: Cursor Agent <cursoragent@cursor.com>
Date: Sun, 3 May 2026 03:27:40 +0000
Subject: [PATCH 2/4] fix(onboarding): drop medgemma fallback, gate Run Now on
 catalog
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

The previous split of displayModelAlias / runnableModelAlias still left
'medgemma-4b' visible in the rendered code samples for the brief window
between mount and the useModels query resolving. Anyone reading the
payload during that window would reasonably expect medgemma to be the
model the backend is asked to run — exactly the divergence we set out
to remove.

Replace the hard-coded fallback with an obviously-non-runnable
'<your-model-alias>' placeholder, and disable the Run Now button until
runnableModelAlias is populated. The visible payload and the outbound
payload now share a single source of truth: when there's a real alias,
both reference it; when there isn't, the placeholder is shown and the
button is disabled.

Co-authored-by: aschkanAH <aschkanAH@users.noreply.github.com>
---
 .../onboarding/Onboarding/Onboarding.tsx      | 78 +++++++++----------
 1 file changed, 38 insertions(+), 40 deletions(-)

diff --git a/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx b/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
index 0a2038a0d..853722c06 100644
--- a/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
+++ b/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
@@ -39,13 +39,13 @@ import { AppSidebar } from "../../../layout/Sidebar/AppSidebar";
 const INVITE_WEBHOOK_URL: string | undefined =
   import.meta.env.VITE_INVITE_WEBHOOK_URL;
 
-// Placeholder alias used purely for rendering the code samples while the
-// catalog query is in flight or empty. We deliberately do NOT use this for
-// outbound API calls — the user almost certainly isn't entitled to it on
-// every deployment, so firing real requests against it produces 4xx errors
-// (see "Model 'medgemma-4b' has not been configured…"). Real requests are
-// gated on a catalog-resolved alias (see `runnableModelAlias` below).
-const FALLBACK_DISPLAY_MODEL_ALIAS = "medgemma-4b";
+// Placeholder shown in the rendered code samples ONLY while the catalog
+// query is in flight or empty. Deliberately not a real model alias so it
+// can't be mistaken for one and so the visible payload never references a
+// model the user might or might not be entitled to. Outbound requests are
+// blocked entirely until a real catalog-resolved alias is available — see
+// `runnableModelAlias` and the disabled state on the Run Now button.
+const PLACEHOLDER_MODEL_ALIAS = "<your-model-alias>";
 
 const SUCCESS_REDIRECT_DELAY_MS = 2000;
 const RUN_NOW_SIMULATED_DELAY_MS = 2500;
@@ -210,21 +210,11 @@ export function Onboarding() {
   const createBatch = useCreateBatch();
   const uploadFile = useUploadFileWithProgress();
 
-  // Pull the first chat model alias from the catalog so the rendered code
-  // samples reference something that will actually work for the user.
-  //
-  // We expose two values intentionally:
-  //   - runnableModelAlias: undefined while the catalog is still loading and
-  //     when the user has no accessible chat model. Used for outbound
-  //     requests (background batch, Run Now) so we never fire batches against
-  //     a hard-coded model the user isn't entitled to. The earlier behaviour
-  //     of falling back to "medgemma-4b" silently caused a divergence between
-  //     the rendered payload (e.g. "deepseek") and the model actually sent to
-  //     the backend, producing "Model 'medgemma-4b' has not been configured"
-  //     errors in environments where that model isn't available.
-  //   - displayModelAlias: always resolved (real alias when available, hard-
-  //     coded placeholder otherwise) so the rendered code samples are never
-  //     blank.
+  // Pull the first accessible chat model alias from the catalog. Outbound
+  // requests are gated on this resolving to a concrete value; the rendered
+  // payload uses an obviously-non-runnable placeholder until then so the
+  // visible payload can never reference a model the backend isn't being
+  // asked to run.
   const { data: modelsData, isLoading: modelsLoading } = useModels({
     accessible: true,
     limit: 50,
@@ -235,7 +225,11 @@ export function Onboarding() {
     );
     return chat?.alias;
   }, [modelsData]);
-  const displayModelAlias = runnableModelAlias ?? FALLBACK_DISPLAY_MODEL_ALIAS;
+  // Single alias used for both rendering and outbound requests when
+  // available; otherwise an obviously-non-runnable placeholder for the UI
+  // (and the Run Now button is disabled, see below). This collapse ensures
+  // the visible payload and the outbound payload can never diverge.
+  const displayModelAlias = runnableModelAlias ?? PLACEHOLDER_MODEL_ALIAS;
 
   // Mint a live API key on mount so step 1 has something concrete to show.
   // We only do this once per visit and only when the user is authenticated.
@@ -267,13 +261,12 @@ export function Onboarding() {
       });
   }, [authLoading, isAuthenticated, currentUser, createApiKey]);
 
-  // Fire the "Hello World" sample batch in the background once we know which
-  // model to send it to. We deliberately wait for the catalog query so the
-  // outbound payload uses the same alias the visible code samples render
-  // (otherwise the user sees e.g. `deepseek` in the UI but the backend
-  // receives `medgemma-4b`). If the catalog has no accessible chat model we
-  // skip the background batch and the toast entirely — there's no plausible
-  // model to demo with, and a doomed POST would just spam the console.
+  // Fire the "Hello World" sample batch in the background once we know
+  // which model to send it to. We wait for the catalog query so the
+  // outbound payload uses the same alias the visible code samples render.
+  // If the catalog has no accessible chat model we skip the background
+  // batch and the toast entirely — there's no plausible model to demo
+  // with, and a doomed POST would just spam the console.
   useEffect(() => {
     if (sampleBatchRequestedRef.current) return;
     if (authLoading || !isAuthenticated) return;
@@ -378,21 +371,21 @@ export function Onboarding() {
 
   const handleRunNow = async () => {
     if (runState !== "idle") return;
+    // The button is disabled without a runnable alias; this guard is
+    // defensive in case the disabled prop is bypassed (e.g. via assistive
+    // tech or a stale render). We deliberately don't kick the simulated
+    // success state in that case — silently succeeding without a real
+    // request would re-introduce the visible-vs-actual divergence we just
+    // fixed.
+    const aliasForRequest = runnableModelAlias;
+    if (!aliasForRequest) return;
     setRunState("running");
 
     // Fire the real batch creation in the background. We don't surface its
     // success/failure to the run state machine since the spec asks for a
     // simulated 2.5s "running" → "success" cycle that gives the user a
     // predictable redirect experience, regardless of how fast the API
-    // responds. If we have no catalog-resolved alias we skip the network
-    // call entirely rather than firing against the placeholder display
-    // alias (which the user is unlikely to be entitled to).
-    const aliasForRequest = runnableModelAlias;
-    if (!aliasForRequest) {
-      setTimeout(() => setRunState("success"), RUN_NOW_SIMULATED_DELAY_MS);
-      return;
-    }
-
+    // responds.
     void (async () => {
       try {
         // Always build the JSONL via the object helpers so we never round-
@@ -700,7 +693,12 @@ export function Onboarding() {
                       </div>
                       <Button
                         onClick={handleRunNow}
-                        disabled={runState !== "idle"}
+                        disabled={runState !== "idle" || !runnableModelAlias}
+                        title={
+                          !runnableModelAlias
+                            ? "Loading available models…"
+                            : undefined
+                        }
                         className={`w-full whitespace-nowrap sm:w-auto ${
                           runState === "running"
                             ? "bg-amber-100 text-amber-700 hover:bg-amber-100"

From f134ea929a2df33e0c185d84a941d7f3564fcb81 Mon Sep 17 00:00:00 2001
From: Cursor Agent <cursoragent@cursor.com>
Date: Sun, 3 May 2026 04:35:27 +0000
Subject: [PATCH 3/4] feat(onboarding): redirect to job route after successful
 run
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Previously the post-success auto-redirect always landed users on
/models — fine as a generic 'where would you like to go next' but it
hides the workload they just queued. Send them instead to the route
that will surface their job:

  - /async when workloadType is 'async'
  - /batches when workloadType is 'batch'

Both routes are config-gated by batches.enabled (and async further
gated by batches.async_requests.enabled), so we consult
useAuthorization().canAccessRoute and fall back to /models when the
preferred destination isn't accessible on this deployment, to avoid
ProtectedRoute bouncing the user mid-redirect.

The 'Skip to Dashboard' header button still lands on /models per the
original spec. The CLI listener path also stays on /models — that path
is the 'click to continue' simulation, not an actual workload, so
there's no specific job for the user to view.

Inline success-strip copy now reflects the destination ('Taking you to
your batch/async request…') so the redirect isn't surprising.

Co-authored-by: aschkanAH <aschkanAH@users.noreply.github.com>
---
 .../onboarding/Onboarding/Onboarding.tsx      | 36 ++++++++++++++++---
 1 file changed, 31 insertions(+), 5 deletions(-)

diff --git a/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx b/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
index 853722c06..f30d6cadf 100644
--- a/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
+++ b/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
@@ -29,6 +29,7 @@ import {
   useUser,
 } from "@/api/control-layer/hooks";
 import { copyToClipboard as copyToClipboardUtil } from "@/utils/clipboard";
+import { useAuthorization } from "@/utils/authorization";
 import { AppSidebar } from "../../../layout/Sidebar/AppSidebar";
 
 // Webhook used by the "invite a teammate" form. Configured per-environment
@@ -184,6 +185,7 @@ export function Onboarding() {
   const navigate = useNavigate();
   const { isAuthenticated, isLoading: authLoading } = useAuth();
   const { data: currentUser } = useUser("current");
+  const { canAccessRoute } = useAuthorization();
 
   const [apiKey, setApiKey] = useState<string | null>(null);
   const [apiKeyError, setApiKeyError] = useState<string | null>(null);
@@ -323,19 +325,40 @@ export function Onboarding() {
     // eslint-disable-next-line react-hooks/exhaustive-deps
   }, [authLoading, isAuthenticated, modelsLoading, runnableModelAlias]);
 
+  // "Skip to Dashboard" header button always lands on /models per the spec.
   const goToDashboard = useCallback(() => {
     navigate("/models");
   }, [navigate]);
 
-  // Auto-redirect after success in both browser and CLI modes.
+  // Where to land the user after they successfully run a workload from the
+  // browser tab. We send them to the route that will show the job they just
+  // queued (/async for async tier, /batches for batch tier) so they see
+  // their output instead of a generic models list.
+  //
+  // Both routes share the `batches` permission and are config-gated by
+  // `batches.enabled` / `batches.async_requests.enabled`. If the resolved
+  // route isn't accessible on this deployment we fall back to /models so
+  // ProtectedRoute doesn't bounce the user mid-redirect.
+  const browserSuccessRoute = useMemo(() => {
+    const preferred = workloadType === "batch" ? "/batches" : "/async";
+    return canAccessRoute(preferred) ? preferred : "/models";
+  }, [workloadType, canAccessRoute]);
+
+  // Auto-redirect after success in both browser and CLI modes. The CLI
+  // listener path doesn't run an actual workload (it's a "click to
+  // continue" simulation), so we keep that path on /models — there's no
+  // job for the user to view. The browser run-now path goes to the
+  // job-specific route.
   useEffect(() => {
     const succeeded =
       runState === "success" || listenerState === "success";
     if (!succeeded || redirectScheduledRef.current) return;
     redirectScheduledRef.current = true;
-    const timer = setTimeout(goToDashboard, SUCCESS_REDIRECT_DELAY_MS);
+    const destination =
+      runState === "success" ? browserSuccessRoute : "/models";
+    const timer = setTimeout(() => navigate(destination), SUCCESS_REDIRECT_DELAY_MS);
     return () => clearTimeout(timer);
-  }, [runState, listenerState, goToDashboard]);
+  }, [runState, listenerState, browserSuccessRoute, navigate]);
 
   // Visible code samples always render against the display alias so the UI
   // is never blank; outbound requests use runnableModelAlias and bail out
@@ -742,8 +765,11 @@ export function Onboarding() {
                       <div className="flex items-center justify-between p-4">
                         <span className="flex items-center gap-2 text-sm font-medium text-emerald-800">
                           <Sparkles className="h-4 w-4" />
-                          Workload successfully received! Redirecting to
-                          dashboard…
+                          {browserSuccessRoute === "/batches"
+                            ? "Workload successfully received! Taking you to your batch…"
+                            : browserSuccessRoute === "/async"
+                              ? "Workload successfully received! Taking you to your async request…"
+                              : "Workload successfully received! Redirecting to dashboard…"}
                         </span>
                       </div>
                     </div>

From 807b26fe9aa16161b215616daaee225d353abbf0 Mon Sep 17 00:00:00 2001
From: Cursor Agent <cursoragent@cursor.com>
Date: Sun, 3 May 2026 09:12:11 +0000
Subject: [PATCH 4/4] fix(onboarding): redirect ref decouples timer from
 churn-prone deps
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Including browserSuccessRoute in the auto-redirect effect's deps caused
a lost-redirect bug: if the value's identity changed during the 2s
window (workloadType toggle, useAuthorization refetch race, config
invalidation, …) the cleanup function ran clearTimeout, the effect
re-ran, and the idempotency ref short-circuited it before a new timer
could be scheduled. The user would see 'Taking you to your batch…'
indefinitely without ever navigating.

Move the destination into a ref that's updated on every render so the
timer callback reads the latest value when it fires, without the effect
declaring it as a dep. Deps are now only the success triggers + navigate,
so churn in browserSuccessRoute can no longer clear the pending timer.
Note that a change to runState or listenerState inside the 2s window
would still run the cleanup and cancel the timer.

Co-authored-by: aschkanAH <aschkanAH@users.noreply.github.com>
---
 .../onboarding/Onboarding/Onboarding.tsx      | 30 ++++++++++++++++---
 1 file changed, 26 insertions(+), 4 deletions(-)

diff --git a/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx b/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
index f30d6cadf..39f5cda98 100644
--- a/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
+++ b/dashboard/src/components/features/onboarding/Onboarding/Onboarding.tsx
@@ -339,26 +339,48 @@ export function Onboarding() {
   // `batches.enabled` / `batches.async_requests.enabled`. If the resolved
   // route isn't accessible on this deployment we fall back to /models so
   // ProtectedRoute doesn't bounce the user mid-redirect.
+  //
+  // This is exposed for rendering the success-strip copy. The actual
+  // navigation reads a ref that is refreshed on every render (see below)
+  // when the timer fires, so the redirect can't be lost when this value
+  // churns (workloadType toggle, canAccessRoute refetch race, etc.)
+  // during the 2s redirect window.
   const browserSuccessRoute = useMemo(() => {
     const preferred = workloadType === "batch" ? "/batches" : "/async";
     return canAccessRoute(preferred) ? preferred : "/models";
   }, [workloadType, canAccessRoute]);
 
+  // Destination for the auto-redirect timer. Reassigned on every render
+  // so the timer callback reads the latest value at the moment it fires,
+  // without the effect having browserSuccessRoute as a dep (which would
+  // cause cleanup-then-skip races that lose the redirect).
+  const pendingRedirectRouteRef = useRef<string>("/models");
+  pendingRedirectRouteRef.current =
+    runState === "success" ? browserSuccessRoute : "/models";
+
   // Auto-redirect after success in both browser and CLI modes. The CLI
   // listener path doesn't run an actual workload (it's a "click to
   // continue" simulation), so we keep that path on /models — there's no
   // job for the user to view. The browser run-now path goes to the
   // job-specific route.
+  //
+  // Deps are deliberately limited to the success triggers and `navigate`
+  // (stable in practice). browserSuccessRoute is intentionally NOT a dep:
+  // including it caused a lost-redirect bug where toggling workloadType
+  // (or any churn in canAccessRoute) during the 2s window cleared the
+  // pending timer and the re-run of the effect short-circuited on the
+  // idempotency ref.
   useEffect(() => {
     const succeeded =
       runState === "success" || listenerState === "success";
     if (!succeeded || redirectScheduledRef.current) return;
     redirectScheduledRef.current = true;
-    const destination =
-      runState === "success" ? browserSuccessRoute : "/models";
-    const timer = setTimeout(() => navigate(destination), SUCCESS_REDIRECT_DELAY_MS);
+    const timer = setTimeout(
+      () => navigate(pendingRedirectRouteRef.current),
+      SUCCESS_REDIRECT_DELAY_MS,
+    );
     return () => clearTimeout(timer);
-  }, [runState, listenerState, browserSuccessRoute, navigate]);
+  }, [runState, listenerState, navigate]);
 
   // Visible code samples always render against the display alias so the UI
   // is never blank; outbound requests use runnableModelAlias and bail out