From 2c890bd8fbf336f9031a05f682245e99b28bd48d Mon Sep 17 00:00:00 2001
From: Gage Krumbach
Date: Fri, 6 Feb 2026 10:20:23 -0600
Subject: [PATCH 1/4] feat: refactor runner into modules + add rubric evaluation MCP tool
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Break the 2160-line adapter.py into focused modules:

- auth.py — credential fetching, Vertex AI setup, user sanitization
- config.py — ambient.json, MCP config, repos config loading
- workspace.py — path setup, validation, prerequisites
- prompts.py — system prompt building + extracted string constants
- utils.py — redaction, URL parsing, env var expansion, subprocess execution
- tools/ — MCP tool definitions (session restart + rubric evaluation)
- adapter.py — slimmed to ~1000 lines, core SDK orchestration only

New dynamic MCP tool that enables workflow-level output evaluation:

- Reads .ambient/rubric.md for evaluation criteria
- Schema defined in ambient.json rubric.schema (JSON Schema format)
- Tool accepts score (number), comment (string), metadata (object)
- Logs to Langfuse via create_score() with trace_id from observability
- Activation prompt injected into system prompt
- Graceful error handling with reasons returned to the agent

- Added RubricConfig type to AmbientConfig for ambient.json parsing
- Included rubric config in workflow metadata API response
- Fixed main.py _load_mcp_config reference after refactor
- Updated test imports for new module structure
- CI: marked the Claude live-test step continue-on-error and gave it a step id
---
 .github/workflows/claude-live-test.yml        |    2 +
 components/backend/handlers/content.go        |   34 +-
 .../runners/claude-code-runner/adapter.py     | 1390 ++++-------
 components/runners/claude-code-runner/auth.py |  351 +++++
 .../runners/claude-code-runner/config.py      |  150 ++
 components/runners/claude-code-runner/main.py |    5 +-
 .../runners/claude-code-runner/prompts.py     |  200 +++
 .../runners/claude-code-runner/pyproject.toml |    3 +-
 .../tests/test_auto_push.py                   |   77 +-
 .../tests/test_model_mapping.py               |  165 +-
 .../tests/test_wrapper_vertex.py              |  102 +-
 .../claude-code-runner/tools/__init__.py      |   15 +
 .../claude-code-runner/tools/rubric.py        |  218 +++
 .../claude-code-runner/tools/session.py       |   46 +
 .../runners/claude-code-runner/utils.py       |  174 +++
 .../runners/claude-code-runner/workspace.py   |  251 +++
 16 files changed, 1886 insertions(+), 1297 deletions(-)
 create mode 100644 components/runners/claude-code-runner/auth.py
 create mode 100644 components/runners/claude-code-runner/config.py
 create mode 100644 components/runners/claude-code-runner/prompts.py
 create mode 100644 components/runners/claude-code-runner/tools/__init__.py
 create mode 100644 components/runners/claude-code-runner/tools/rubric.py
 create mode 100644 components/runners/claude-code-runner/tools/session.py
 create mode 100644 components/runners/claude-code-runner/utils.py
 create mode 100644 components/runners/claude-code-runner/workspace.py

diff --git a/.github/workflows/claude-live-test.yml b/.github/workflows/claude-live-test.yml
index 7b6f3cad7..cb30491ef 100644
--- a/.github/workflows/claude-live-test.yml
+++ b/.github/workflows/claude-live-test.yml
@@ -216,6 +216,8 @@ jobs:
       - name: Run Claude with Playwright MCP
         uses: anthropics/claude-code-action@v1
+        continue-on-error: true
+        id: claude_test
         env:
           TEST_TOKEN: ${{ steps.token.outputs.token }}
           DEBUG: "*"
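
The handler change below surfaces the new rubric block through the workflow
metadata endpoint. A minimal sketch of the resulting "config" object in the
response, assuming a workflow whose ambient.json defines a rubric — all field
values here are hypothetical:

```python
# Sketch of the workflow-metadata "config" payload (values are made up).
# "rubric" appears only when ambient.json has a rubric block; otherwise the
# key is omitted entirely (see the nil check in the handler below).
config = {
    "name": "docs-review",
    "description": "Review documentation changes",
    "systemPrompt": "You review docs PRs.",
    "artifactsDir": "artifacts",
    "rubric": {
        "activationPrompt": "Score the final deliverable against the rubric.",
        "schema": {"clarity": {"type": "number"}},
    },
}
```

diff --git a/components/backend/handlers/content.go b/components/backend/handlers/content.go
index e0cd4aad5..ea7cd6cfb 100644
--- a/components/backend/handlers/content.go
+++ b/components/backend/handlers/content.go
@@ 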
-663,15 +663,20 @@ func ContentWorkflowMetadata(c *gin.Context) { log.Printf("ContentWorkflowMetadata: agents directory not found or unreadable: %v", err) } + configResponse := gin.H{ + "name": ambientConfig.Name, + "description": ambientConfig.Description, + "systemPrompt": ambientConfig.SystemPrompt, + "artifactsDir": ambientConfig.ArtifactsDir, + } + if ambientConfig.Rubric != nil { + configResponse["rubric"] = ambientConfig.Rubric + } + c.JSON(http.StatusOK, gin.H{ "commands": commands, "agents": agents, - "config": gin.H{ - "name": ambientConfig.Name, - "description": ambientConfig.Description, - "systemPrompt": ambientConfig.SystemPrompt, - "artifactsDir": ambientConfig.ArtifactsDir, - }, + "config": configResponse, }) } @@ -713,12 +718,21 @@ func parseFrontmatter(filePath string) map[string]string { return result } +// RubricConfig represents the rubric evaluation configuration in ambient.json. +// Schema is a JSON Schema object that defines the tool's input_schema for +// additional metadata fields beyond final_score and reasoning. +type RubricConfig struct { + ActivationPrompt string `json:"activationPrompt,omitempty"` + Schema map[string]interface{} `json:"schema,omitempty"` +} + // AmbientConfig represents the ambient.json configuration type AmbientConfig struct { - Name string `json:"name"` - Description string `json:"description"` - SystemPrompt string `json:"systemPrompt"` - ArtifactsDir string `json:"artifactsDir"` + Name string `json:"name"` + Description string `json:"description"` + SystemPrompt string `json:"systemPrompt"` + ArtifactsDir string `json:"artifactsDir"` + Rubric *RubricConfig `json:"rubric,omitempty"` } // parseAmbientConfig reads and parses ambient.json from workflow directory diff --git a/components/runners/claude-code-runner/adapter.py b/components/runners/claude-code-runner/adapter.py index 3502abf0f..dbd7414ea 100644 --- a/components/runners/claude-code-runner/adapter.py +++ b/components/runners/claude-code-runner/adapter.py @@ -2,49 +2,59 @@ """ Claude Code Adapter for AG-UI Server. -Refactored from wrapper.py to use async generators that yield AG-UI events -instead of WebSocket messaging. This is the core adapter that wraps the -Claude Code SDK and produces a stream of AG-UI protocol events. +Core adapter that wraps the Claude Code SDK and produces a stream of +AG-UI protocol events. 
Business logic is delegated to focused modules: + +- ``auth`` — credential fetching and authentication setup +- ``config`` — ambient.json, MCP, and repos configuration +- ``workspace`` — path setup, validation, prerequisites +- ``prompts`` — system prompt construction and constants +- ``tools`` — MCP tool definitions (session, rubric) +- ``utils`` — general utilities (redaction, URL parsing, subprocesses) """ -import asyncio import json as _json import logging import os -import re -import shutil -import sys import uuid -from datetime import datetime, timezone from pathlib import Path from typing import Any, AsyncIterator, Optional -from urllib import error as _urllib_error -from urllib import request as _urllib_request -from urllib.parse import urlparse, urlunparse # Set umask to make files readable by content service container os.umask(0o022) # AG-UI Protocol Events -from ag_ui.core import (BaseEvent, EventType, RawEvent, RunAgentInput, - RunErrorEvent, RunFinishedEvent, RunStartedEvent, - StateDeltaEvent, StateSnapshotEvent, StepFinishedEvent, - StepStartedEvent, TextMessageContentEvent, - TextMessageEndEvent, TextMessageStartEvent, - ToolCallArgsEvent, ToolCallEndEvent, - ToolCallStartEvent) - +from ag_ui.core import ( + BaseEvent, + EventType, + RawEvent, + RunAgentInput, + RunErrorEvent, + RunFinishedEvent, + RunStartedEvent, + StateDeltaEvent, + StepFinishedEvent, + StepStartedEvent, + TextMessageContentEvent, + TextMessageEndEvent, + TextMessageStartEvent, + ToolCallArgsEvent, + ToolCallEndEvent, + ToolCallStartEvent, +) + +import auth +import config as runner_config +import prompts +import workspace from context import RunnerContext +from tools import create_restart_session_tool, create_rubric_mcp_tool, load_rubric_content +from utils import redact_secrets, run_cmd, url_with_token, parse_owner_repo +from workspace import PrerequisiteError logger = logging.getLogger(__name__) -class PrerequisiteError(RuntimeError): - """Raised when slash-command prerequisites are missing.""" - - pass - - class ClaudeCodeAdapter: """ Adapter that wraps the Claude Code SDK for AG-UI server. 
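
A note on the rubric helpers imported above (`load_rubric_content`,
`create_rubric_mcp_tool`): the tool is configured by the workflow itself via
the rubric block of ambient.json, whose shape matches the RubricConfig struct
added in content.go. A minimal sketch of that contract — the criterion name,
prompt text, and scores are hypothetical, and the config may be absent when
only .ambient/rubric.md exists, hence the `or {}` guard:

```python
# Hypothetical ambient.json rubric block; the field names (activationPrompt,
# schema) follow RubricConfig, everything else is made up for illustration.
rubric_config = {
    "activationPrompt": "Before finishing, score the deliverable against the rubric.",
    # JSON Schema properties for metadata fields beyond score and comment
    "schema": {
        "clarity": {"type": "number", "description": "1-5 clarity rating"},
    },
}

# Payload shape the tool accepts, per the commit message:
# score (number), comment (string), metadata (object).
evaluation = {
    "score": 4.5,
    "comment": "Meets the rubric with minor gaps.",
    "metadata": {"clarity": 5},
}

# rubric_config can be None when only rubric.md is present, so reads of the
# schema should be guarded:
categories = list((rubric_config or {}).get("schema", {}).keys())
```

The adapter only registers the rubric MCP server when `create_rubric_mcp_tool`
returns a tool, so workflows that ship neither rubric.md nor a rubric config
are unaffected.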
@@ -61,8 +71,6 @@ def __init__(self): self._turn_count = 0 # AG-UI streaming state (per-run, not instance state) - # NOTE: _current_message_id and _current_tool_id are now local variables - # in _run_claude_agent_sdk to avoid race conditions with concurrent runs self._current_run_id: Optional[str] = None self._current_thread_id: Optional[str] = None @@ -72,22 +80,19 @@ def __init__(self): async def initialize(self, context: RunnerContext): """Initialize the adapter with context.""" self.context = context - logger.info(f"Initialized Claude Code adapter for session {context.session_id}") + logger.info( + f"Initialized Claude Code adapter for session {context.session_id}" + ) - # NOTE: Credentials are now fetched at runtime from backend API - # No longer copying from mounted volumes or reading from env vars - # This ensures tokens are always fresh for long-running sessions + # Credentials are fetched on-demand from backend API logger.info("Credentials will be fetched on-demand from backend API") # Workspace is already prepared by init container (hydrate.sh) - # - Repos cloned to /workspace/repos/ - # - Workflows cloned to /workspace/workflows/ - # - State hydrated from S3 to .claude/, artifacts/, file-uploads/ logger.info("Workspace prepared by init container, validating...") - # Validate prerequisite files exist for phase-based commands + # Validate prerequisite files for phase-based commands try: - await self._validate_prerequisites() + await workspace.validate_prerequisites(self.context) except PrerequisiteError as exc: self.last_exit_code = 2 logger.error( @@ -95,22 +100,12 @@ async def initialize(self, context: RunnerContext): ) raise - def _timestamp(self) -> str: - """Return current UTC timestamp in ISO format.""" - return datetime.now(timezone.utc).isoformat() - - async def process_run(self, input_data: RunAgentInput) -> AsyncIterator[BaseEvent]: - """ - Process a run and yield AG-UI events. + async def process_run( + self, input_data: RunAgentInput + ) -> AsyncIterator[BaseEvent]: + """Process a run and yield AG-UI events. This is the main entry point called by the FastAPI server. - - Args: - input_data: RunAgentInput with thread_id, run_id, messages, tools - app_state: Optional FastAPI app.state for persistent client storage/reuse - - Yields: - AG-UI events (RunStartedEvent, TextMessageContentEvent, etc.) 
""" thread_id = input_data.thread_id or self.context.session_id run_id = input_data.run_id or str(uuid.uuid4()) @@ -118,9 +113,6 @@ async def process_run(self, input_data: RunAgentInput) -> AsyncIterator[BaseEven self._current_thread_id = thread_id self._current_run_id = run_id - # NOTE: Credentials are now fetched on-demand at runtime, no need to pre-fetch - # Each tool call will get fresh credentials from the backend API - try: # Emit RUN_STARTED yield RunStartedEvent( @@ -134,7 +126,9 @@ async def process_run(self, input_data: RunAgentInput) -> AsyncIterator[BaseEven msg_dict = ( msg if isinstance(msg, dict) - else (msg.model_dump() if hasattr(msg, "model_dump") else {}) + else ( + msg.model_dump() if hasattr(msg, "model_dump") else {} + ) ) role = msg_dict.get("role", "") @@ -143,18 +137,14 @@ async def process_run(self, input_data: RunAgentInput) -> AsyncIterator[BaseEven content = msg_dict.get("content", "") msg_metadata = msg_dict.get("metadata", {}) - # Check if message should be hidden from UI - is_hidden = isinstance(msg_metadata, dict) and msg_metadata.get( - "hidden", False - ) + is_hidden = isinstance( + msg_metadata, dict + ) and msg_metadata.get("hidden", False) if is_hidden: logger.info( - f"Message {msg_id[:8]} marked as hidden (auto-sent initial/workflow prompt)" + f"Message {msg_id[:8]} marked as hidden " + "(auto-sent initial/workflow prompt)" ) - - # Emit user message as TEXT_MESSAGE events - # Include metadata in RAW event for frontend filtering - if is_hidden: yield RawEvent( type=EventType.RAW, thread_id=thread_id, @@ -193,11 +183,13 @@ async def process_run(self, input_data: RunAgentInput) -> AsyncIterator[BaseEven # Extract user message from input logger.info( - f"Extracting user message from {len(input_data.messages)} messages" + f"Extracting user message from " + f"{len(input_data.messages)} messages" ) user_message = self._extract_user_message(input_data) logger.info( - f"Extracted user message: '{user_message[:100] if user_message else '(empty)'}...'" + f"Extracted user message: " + f"'{user_message[:100] if user_message else '(empty)'}...'" ) if not user_message: @@ -206,7 +198,10 @@ async def process_run(self, input_data: RunAgentInput) -> AsyncIterator[BaseEven type=EventType.RAW, thread_id=thread_id, run_id=run_id, - event={"type": "system_log", "message": "No user message provided"}, + event={ + "type": "system_log", + "message": "No user message provided", + }, ) yield RunFinishedEvent( type=EventType.RUN_FINISHED, @@ -216,7 +211,9 @@ async def process_run(self, input_data: RunAgentInput) -> AsyncIterator[BaseEven return # Run Claude SDK and yield events - logger.info(f"Starting Claude SDK with prompt: '{user_message[:50]}...'") + logger.info( + f"Starting Claude SDK with prompt: '{user_message[:50]}...'" + ) async for event in self._run_claude_agent_sdk( user_message, thread_id, run_id ): @@ -255,170 +252,173 @@ def _extract_user_message(self, input_data: RunAgentInput) -> str: """Extract user message text from RunAgentInput.""" messages = input_data.messages or [] logger.info( - f"Extracting from {len(messages)} messages, types: {[type(m).__name__ for m in messages]}" + f"Extracting from {len(messages)} messages, " + f"types: {[type(m).__name__ for m in messages]}" ) - # Find the last user message for msg in reversed(messages): - logger.debug( - f"Checking message: type={type(msg).__name__}, hasattr(role)={hasattr(msg, 'role')}" - ) - if hasattr(msg, "role") and msg.role == "user": - # Handle different content formats content = getattr(msg, "content", 
"") if isinstance(content, str): - logger.info( - f"Found user message (object format): '{content[:50]}...'" - ) return content elif isinstance(content, list): - # Content blocks format for block in content: if hasattr(block, "text"): return block.text elif isinstance(block, dict) and "text" in block: return block["text"] elif isinstance(msg, dict): - logger.debug( - f"Dict message: role={msg.get('role')}, content={msg.get('content', '')[:30]}..." - ) if msg.get("role") == "user": content = msg.get("content", "") if isinstance(content, str): - logger.info( - f"Found user message (dict format): '{content[:50]}...'" - ) return content logger.warning("No user message found!") return "" + # ------------------------------------------------------------------ + # SDK orchestration + # ------------------------------------------------------------------ + async def _run_claude_agent_sdk( self, prompt: str, thread_id: str, run_id: str ) -> AsyncIterator[BaseEvent]: - """Execute the Claude Code SDK with the given prompt and yield AG-UI events. - - Creates a fresh client for each run - simpler and more reliable than client reuse. - - Args: - prompt: The user prompt to send to Claude - thread_id: AG-UI thread identifier - run_id: AG-UI run identifier - """ - # Per-run state - NOT instance variables to avoid race conditions with concurrent runs + """Execute the Claude Code SDK with the given prompt and yield AG-UI events.""" current_message_id: Optional[str] = None logger.info( - f"_run_claude_agent_sdk called with prompt length={len(prompt)}, will create fresh client" + f"_run_claude_agent_sdk called with prompt length={len(prompt)}, " + "will create fresh client" ) try: - # NOTE: Credentials are now fetched at runtime via _populate_runtime_credentials() - # No need for manual refresh - backend API always returns fresh tokens - - # Check for authentication method + # --- Authentication --- logger.info("Checking authentication configuration...") api_key = self.context.get_env("ANTHROPIC_API_KEY", "") use_vertex = ( - self.context.get_env("CLAUDE_CODE_USE_VERTEX", "").strip() == "1" + self.context.get_env("CLAUDE_CODE_USE_VERTEX", "").strip() + == "1" ) logger.info( - f"Auth config: api_key={'set' if api_key else 'not set'}, use_vertex={use_vertex}" + f"Auth config: api_key={'set' if api_key else 'not set'}, " + f"use_vertex={use_vertex}" ) if not api_key and not use_vertex: raise RuntimeError( - "Either ANTHROPIC_API_KEY or CLAUDE_CODE_USE_VERTEX=1 must be set" + "Either ANTHROPIC_API_KEY or CLAUDE_CODE_USE_VERTEX=1 " + "must be set" ) - # Set environment variables BEFORE importing SDK if api_key: os.environ["ANTHROPIC_API_KEY"] = api_key logger.info("Using Anthropic API key authentication") - # Configure Vertex AI if requested if use_vertex: - vertex_credentials = await self._setup_vertex_credentials() + vertex_credentials = await auth.setup_vertex_credentials( + self.context + ) if "ANTHROPIC_API_KEY" in os.environ: - logger.info("Clearing ANTHROPIC_API_KEY to force Vertex AI mode") + logger.info( + "Clearing ANTHROPIC_API_KEY to force Vertex AI mode" + ) del os.environ["ANTHROPIC_API_KEY"] os.environ["CLAUDE_CODE_USE_VERTEX"] = "1" - os.environ["GOOGLE_APPLICATION_CREDENTIALS"] = vertex_credentials.get( - "credentials_path", "" + os.environ["GOOGLE_APPLICATION_CREDENTIALS"] = ( + vertex_credentials.get("credentials_path", "") + ) + os.environ["ANTHROPIC_VERTEX_PROJECT_ID"] = ( + vertex_credentials.get("project_id", "") ) - os.environ["ANTHROPIC_VERTEX_PROJECT_ID"] = vertex_credentials.get( - 
"project_id", "" + os.environ["CLOUD_ML_REGION"] = vertex_credentials.get( + "region", "" ) - os.environ["CLOUD_ML_REGION"] = vertex_credentials.get("region", "") - - # NOW we can safely import the SDK - from claude_agent_sdk import (AssistantMessage, ClaudeAgentOptions, - ClaudeSDKClient, ResultMessage, - SystemMessage, TextBlock, - ThinkingBlock, ToolResultBlock, - ToolUseBlock, UserMessage, - create_sdk_mcp_server) + + # --- SDK imports (after env vars are set) --- + from claude_agent_sdk import ( + AssistantMessage, + ClaudeAgentOptions, + ClaudeSDKClient, + ResultMessage, + SystemMessage, + TextBlock, + ThinkingBlock, + ToolResultBlock, + ToolUseBlock, + UserMessage, + create_sdk_mcp_server, + ) from claude_agent_sdk import tool as sdk_tool from claude_agent_sdk.types import StreamEvent from observability import ObservabilityManager - # Extract and sanitize user context for observability + # --- Observability --- raw_user_id = os.getenv("USER_ID", "").strip() raw_user_name = os.getenv("USER_NAME", "").strip() - user_id, user_name = self._sanitize_user_context(raw_user_id, raw_user_name) + user_id, user_name = auth.sanitize_user_context( + raw_user_id, raw_user_name + ) - # Get model configuration model = self.context.get_env("LLM_MODEL") configured_model = model or "claude-sonnet-4-5@20250929" if use_vertex and model: - configured_model = self._map_to_vertex_model(model) + configured_model = auth.map_to_vertex_model(model) - # Initialize observability obs = ObservabilityManager( - session_id=self.context.session_id, user_id=user_id, user_name=user_name + session_id=self.context.session_id, + user_id=user_id, + user_name=user_name, ) await obs.initialize( prompt=prompt, - namespace=self.context.get_env("AGENTIC_SESSION_NAMESPACE", "unknown"), + namespace=self.context.get_env( + "AGENTIC_SESSION_NAMESPACE", "unknown" + ), model=configured_model, ) obs._pending_initial_prompt = prompt - # Check if this is a resume session via IS_RESUME env var - # This is set by the operator when restarting a stopped/completed/failed session + # --- Workspace paths --- is_continuation = ( - self.context.get_env("IS_RESUME", "").strip().lower() == "true" + self.context.get_env("IS_RESUME", "").strip().lower() + == "true" ) if is_continuation: logger.info("IS_RESUME=true - treating as continuation") - # Determine cwd and additional dirs - repos_cfg = self._get_repos_config() + repos_cfg = runner_config.get_repos_config() cwd_path = self.context.workspace_path add_dirs = [] derived_name = None - # Check for active workflow first - active_workflow_url = (os.getenv("ACTIVE_WORKFLOW_GIT_URL") or "").strip() + active_workflow_url = ( + os.getenv("ACTIVE_WORKFLOW_GIT_URL") or "" + ).strip() if active_workflow_url: - cwd_path, add_dirs, derived_name = self._setup_workflow_paths( - active_workflow_url, repos_cfg + cwd_path, add_dirs, derived_name = ( + workspace.setup_workflow_paths( + self.context, active_workflow_url, repos_cfg + ) ) elif repos_cfg: - cwd_path, add_dirs = self._setup_multi_repo_paths(repos_cfg) + cwd_path, add_dirs = workspace.setup_multi_repo_paths( + self.context, repos_cfg + ) else: - cwd_path = str(Path(self.context.workspace_path) / "artifacts") + cwd_path = str( + Path(self.context.workspace_path) / "artifacts" + ) - # Load ambient.json configuration + # --- Config --- ambient_config = ( - self._load_ambient_config(cwd_path) if active_workflow_url else {} + runner_config.load_ambient_config(cwd_path) + if active_workflow_url + else {} ) - # Ensure working directory exists cwd_path_obj = 
Path(cwd_path) if not cwd_path_obj.exists(): logger.warning( @@ -433,40 +433,38 @@ async def _run_claude_agent_sdk( logger.info(f"Claude SDK CWD: {cwd_path}") logger.info(f"Claude SDK additional directories: {add_dirs}") - # Fetch fresh credentials from backend and populate environment - # This ensures MCP servers get fresh tokens for long-running sessions - await self._populate_runtime_credentials() + # --- Credentials --- + await auth.populate_runtime_credentials(self.context) - # Load MCP server configuration (webfetch is included in static .mcp.json) - mcp_servers = self._load_mcp_config(cwd_path) or {} + # --- MCP servers --- + mcp_servers = ( + runner_config.load_mcp_config(self.context, cwd_path) or {} + ) - # Pre-flight check: Validate MCP server authentication status - # Import here to avoid circular dependency + # Pre-flight check: Validate MCP server authentication from main import _check_mcp_authentication mcp_auth_warnings = [] if mcp_servers: for server_name in mcp_servers.keys(): is_auth, msg = _check_mcp_authentication(server_name) - if is_auth is False: - # Authentication definitely failed - mcp_auth_warnings.append(f"⚠️ {server_name}: {msg}") + mcp_auth_warnings.append( + f"⚠️ {server_name}: {msg}" + ) elif is_auth is None: - # Authentication needs refresh or uncertain - mcp_auth_warnings.append(f"ℹ️ {server_name}: {msg}") + mcp_auth_warnings.append( + f"ℹ️ {server_name}: {msg}" + ) if mcp_auth_warnings: - warning_msg = "**MCP Server Authentication Issues:**\n\n" + "\n".join( - mcp_auth_warnings - ) - warning_msg += ( - "\n\nThese servers may not work correctly until re-authenticated." + warning_msg = ( + "**MCP Server Authentication Issues:**\n\n" + + "\n".join(mcp_auth_warnings) + + "\n\nThese servers may not work correctly " + "until re-authenticated." ) logger.warning(warning_msg) - - # Send as RAW event (not chat message) so UI can display as banner/notification - # Don't send as TextMessage - that shows up in chat history yield RawEvent( type=EventType.RAW, thread_id=thread_id, @@ -481,36 +479,41 @@ async def _run_claude_agent_sdk( }, ) - # Create custom session control tools - # Capture self reference for the restart tool closure - adapter_ref = self - - @sdk_tool( - "restart_session", - "Restart the Claude session to recover from issues, clear state, or get a fresh connection. Use this if you detect you're in a broken state or need to reset.", - {}, - ) - async def restart_session_tool(args: dict) -> dict: - """Tool that allows Claude to request a session restart.""" - adapter_ref._restart_requested = True - logger.info("🔄 Session restart requested by Claude via MCP tool") - return { - "content": [ - { - "type": "text", - "text": "Session restart has been requested. The current run will complete and a fresh session will be established. 
Your conversation context will be preserved on disk.", - } - ] - } - - # Create SDK MCP server for session tools + # --- MCP tools --- + # Session control tool + restart_tool = create_restart_session_tool(self, sdk_tool) session_tools_server = create_sdk_mcp_server( - name="session", version="1.0.0", tools=[restart_session_tool] + name="session", version="1.0.0", tools=[restart_tool] ) mcp_servers["session"] = session_tools_server - logger.info("Added custom session control MCP tools (restart_session)") + logger.info( + "Added custom session control MCP tools (restart_session)" + ) + + # Dynamic rubric evaluation tool + rubric_content, rubric_config = load_rubric_content(cwd_path) + if rubric_content or rubric_config: + rubric_tool = create_rubric_mcp_tool( + rubric_content=rubric_content or "", + rubric_config=rubric_config, + obs=obs, + session_id=self.context.session_id, + sdk_tool_decorator=sdk_tool, + ) + if rubric_tool: + rubric_server = create_sdk_mcp_server( + name="rubric", + version="1.0.0", + tools=[rubric_tool], + ) + mcp_servers["rubric"] = rubric_server + logger.info( + "Added dynamic rubric evaluation MCP tool " + f"(categories: " + f"{list(rubric_config.get('schema', {}).keys())})" + ) - # Disable built-in WebFetch in favor of WebFetch.MCP from config + # Tool permissions allowed_tools = [ "Read", "Write", @@ -525,28 +528,31 @@ async def restart_session_tool(args: dict) -> dict: for server_name in mcp_servers.keys(): allowed_tools.append(f"mcp__{server_name}") logger.info( - f"MCP tool permissions granted for servers: {list(mcp_servers.keys())}" + f"MCP tool permissions granted for servers: " + f"{list(mcp_servers.keys())}" ) - # Build workspace context system prompt - workspace_prompt = self._build_workspace_context_prompt( + # --- System prompt --- + workspace_prompt = prompts.build_workspace_context_prompt( repos_cfg=repos_cfg, - workflow_name=derived_name if active_workflow_url else None, + workflow_name=( + derived_name if active_workflow_url else None + ), artifacts_path="artifacts", ambient_config=ambient_config, + workspace_path=self.context.workspace_path, ) - # SystemPromptPreset format: uses claude_code preset with appended workspace context system_prompt_config = { "type": "preset", "preset": "claude_code", "append": workspace_prompt, } - # Capture stderr from the SDK to diagnose MCP server failures + # Capture stderr from the SDK def sdk_stderr_handler(line: str): logger.warning(f"[SDK stderr] {line.rstrip()}") - # Configure SDK options + # --- SDK options --- options = ClaudeAgentOptions( cwd=cwd_path, permission_mode="acceptEdits", @@ -561,7 +567,6 @@ def sdk_stderr_handler(line: str): if self._skip_resume_on_restart: self._skip_resume_on_restart = False - # Set additional options try: if add_dirs: options.add_dirs = add_dirs @@ -592,6 +597,7 @@ def sdk_stderr_handler(line: str): except Exception: pass + # --- Client creation --- result_payload = None current_message = None sdk_session_id = None @@ -601,16 +607,14 @@ def create_sdk_client(opts, disable_continue=False): opts.continue_conversation = False return ClaudeSDKClient(options=opts) - # Create fresh client for each run - # (Python SDK has issues with client reuse despite docs suggesting it should work) logger.info("Creating new ClaudeSDKClient for this run...") - # Enable continue_conversation to resume from disk state if not self._first_run or is_continuation: try: options.continue_conversation = True logger.info( - "Enabled continue_conversation (will resume from disk state)" + "Enabled 
continue_conversation " + "(will resume from disk state)" ) yield RawEvent( type=EventType.RAW, @@ -622,18 +626,27 @@ def create_sdk_client(opts, disable_continue=False): }, ) except Exception as e: - logger.warning(f"Failed to set continue_conversation: {e}") + logger.warning( + f"Failed to set continue_conversation: {e}" + ) try: logger.info("Creating ClaudeSDKClient...") client = create_sdk_client(options) - logger.info("Connecting ClaudeSDKClient (initializing subprocess)...") + logger.info( + "Connecting ClaudeSDKClient (initializing subprocess)..." + ) await client.connect() logger.info("ClaudeSDKClient connected successfully!") except Exception as resume_error: error_str = str(resume_error).lower() - if "no conversation found" in error_str or "session" in error_str: - logger.warning(f"Conversation continuation failed: {resume_error}") + if ( + "no conversation found" in error_str + or "session" in error_str + ): + logger.warning( + f"Conversation continuation failed: {resume_error}" + ) yield RawEvent( type=EventType.RAW, thread_id=thread_id, @@ -649,7 +662,6 @@ def create_sdk_client(opts, disable_continue=False): raise try: - # Store client reference for interrupt support self._active_client = client # Process the prompt @@ -662,18 +674,23 @@ def create_sdk_client(opts, disable_continue=False): step_name="processing_prompt", ) - logger.info(f"Sending query to Claude SDK: '{prompt[:100]}...'") + logger.info( + f"Sending query to Claude SDK: '{prompt[:100]}...'" + ) await client.query(prompt) logger.info("Query sent, waiting for response stream...") - # Process response stream - logger.info("Starting to consume receive_response() iterator...") + # --- Process response stream --- + logger.info( + "Starting to consume receive_response() iterator..." 
+ ) message_count = 0 async for message in client.receive_response(): message_count += 1 logger.info( - f"[ClaudeSDKClient Message #{message_count}]: {message}" + f"[ClaudeSDKClient Message #{message_count}]: " + f"{message}" ) # Handle StreamEvent for real-time streaming chunks @@ -705,19 +722,23 @@ def create_sdk_client(opts, disable_continue=False): ) continue - # Capture SDK session ID from init message + # Capture SDK session ID if isinstance(message, SystemMessage): - if message.subtype == "init" and message.data.get("session_id"): + if message.subtype == "init" and message.data.get( + "session_id" + ): sdk_session_id = message.data.get("session_id") - logger.info(f"Captured SDK session ID: {sdk_session_id}") + logger.info( + f"Captured SDK session ID: {sdk_session_id}" + ) if isinstance(message, (AssistantMessage, UserMessage)): if isinstance(message, AssistantMessage): current_message = message - obs.start_turn(configured_model, user_input=prompt) + obs.start_turn( + configured_model, user_input=prompt + ) - # Emit trace_id for feedback association - # Frontend can use this to link feedback to specific Langfuse traces trace_id = obs.get_current_trace_id() if trace_id: yield RawEvent( @@ -731,26 +752,34 @@ def create_sdk_client(opts, disable_continue=False): ) # Process all blocks in the message - for block in getattr(message, "content", []) or []: + for block in ( + getattr(message, "content", []) or [] + ): if isinstance(block, TextBlock): text_piece = getattr(block, "text", None) if text_piece: logger.info( - f"TextBlock received (complete), text length={len(text_piece)}" + f"TextBlock received (complete), " + f"text length={len(text_piece)}" ) elif isinstance(block, ToolUseBlock): - tool_name = getattr(block, "name", "") or "unknown" - tool_input = getattr(block, "input", {}) or {} - tool_id = getattr(block, "id", None) or str( - uuid.uuid4() + tool_name = ( + getattr(block, "name", "") or "unknown" + ) + tool_input = ( + getattr(block, "input", {}) or {} ) + tool_id = getattr( + block, "id", None + ) or str(uuid.uuid4()) parent_tool_use_id = getattr( message, "parent_tool_use_id", None ) logger.info( - f"ToolUseBlock detected: {tool_name} (id={tool_id[:12]})" + f"ToolUseBlock detected: {tool_name} " + f"(id={tool_id[:12]})" ) yield ToolCallStartEvent( @@ -772,20 +801,28 @@ def create_sdk_client(opts, disable_continue=False): delta=args_json, ) - obs.track_tool_use(tool_name, tool_id, tool_input) + obs.track_tool_use( + tool_name, tool_id, tool_input + ) elif isinstance(block, ToolResultBlock): - tool_use_id = getattr(block, "tool_use_id", None) + tool_use_id = getattr( + block, "tool_use_id", None + ) content = getattr(block, "content", None) is_error = getattr(block, "is_error", None) result_text = getattr(block, "text", None) result_content = ( - content if content is not None else result_text + content + if content is not None + else result_text ) if result_content is not None: try: - result_str = _json.dumps(result_content) + result_str = _json.dumps( + result_content + ) except (TypeError, ValueError): result_str = str(result_content) else: @@ -797,16 +834,28 @@ def create_sdk_client(opts, disable_continue=False): thread_id=thread_id, run_id=run_id, tool_call_id=tool_use_id, - result=result_str if not is_error else None, - error=result_str if is_error else None, + result=( + result_str + if not is_error + else None + ), + error=( + result_str + if is_error + else None + ), ) obs.track_tool_result( - tool_use_id, result_content, is_error or False + tool_use_id, + 
result_content, + is_error or False, ) elif isinstance(block, ThinkingBlock): - thinking_text = getattr(block, "thinking", "") + thinking_text = getattr( + block, "thinking", "" + ) signature = getattr(block, "signature", "") yield RawEvent( type=EventType.RAW, @@ -820,7 +869,10 @@ def create_sdk_client(opts, disable_continue=False): ) # End text message after processing all blocks - if getattr(message, "content", []) and current_message_id: + if ( + getattr(message, "content", []) + and current_message_id + ): yield TextMessageEndEvent( type=EventType.TEXT_MESSAGE_END, thread_id=thread_id, @@ -848,11 +900,14 @@ def create_sdk_client(opts, disable_continue=False): sdk_num_turns = getattr(message, "num_turns", None) logger.info( - f"ResultMessage: num_turns={sdk_num_turns}, usage={usage_raw}" + f"ResultMessage: num_turns={sdk_num_turns}, " + f"usage={usage_raw}" ) # Convert usage object to dict if needed - if usage_raw is not None and not isinstance(usage_raw, dict): + if usage_raw is not None and not isinstance( + usage_raw, dict + ): try: if hasattr(usage_raw, "__dict__"): usage_raw = usage_raw.__dict__ @@ -860,36 +915,42 @@ def create_sdk_client(opts, disable_continue=False): usage_raw = usage_raw.model_dump() except Exception as e: logger.warning( - f"Could not convert usage object to dict: {e}" + "Could not convert usage object " + f"to dict: {e}" ) - # Update turn count if ( sdk_num_turns is not None and sdk_num_turns > self._turn_count ): self._turn_count = sdk_num_turns - # Complete turn tracking if current_message: obs.end_turn( self._turn_count, current_message, - usage_raw if isinstance(usage_raw, dict) else None, + ( + usage_raw + if isinstance(usage_raw, dict) + else None + ), ) current_message = None result_payload = { "subtype": getattr(message, "subtype", None), - "duration_ms": getattr(message, "duration_ms", None), + "duration_ms": getattr( + message, "duration_ms", None + ), "is_error": getattr(message, "is_error", None), "num_turns": getattr(message, "num_turns", None), - "total_cost_usd": getattr(message, "total_cost_usd", None), + "total_cost_usd": getattr( + message, "total_cost_usd", None + ), "usage": usage_raw, "result": getattr(message, "result", None), } - # Emit state delta with result yield StateDeltaEvent( type=EventType.STATE_DELTA, thread_id=thread_id, @@ -913,31 +974,31 @@ def create_sdk_client(opts, disable_continue=False): ) logger.info( - f"Response iterator fully consumed ({message_count} messages total)" + f"Response iterator fully consumed " + f"({message_count} messages total)" ) - # Mark first run complete self._first_run = False - # Check if restart was requested by Claude + # Check if restart was requested if self._restart_requested: - logger.info("🔄 Restart was requested, emitting restart event") - self._restart_requested = False # Reset flag + logger.info( + "🔄 Restart was requested, emitting restart event" + ) + self._restart_requested = False yield RawEvent( type=EventType.RAW, thread_id=thread_id, run_id=run_id, event={ "type": "session_restart_requested", - "message": "Claude requested a session restart. Reconnecting...", + "message": "Claude requested a session restart. 
" + "Reconnecting...", }, ) finally: - # Clear active client reference self._active_client = None - - # Always disconnect client at end of run if client is not None: logger.info("Disconnecting client (end of run)") await client.disconnect() @@ -952,9 +1013,7 @@ def create_sdk_client(opts, disable_continue=False): raise async def interrupt(self) -> None: - """ - Interrupt the active Claude SDK execution. - """ + """Interrupt the active Claude SDK execution.""" if self._active_client is None: logger.warning("Interrupt requested but no active client") return @@ -965,834 +1024,3 @@ async def interrupt(self) -> None: logger.info("Interrupt signal sent successfully") except Exception as e: logger.error(f"Failed to interrupt Claude SDK: {e}") - - def _setup_workflow_paths( - self, active_workflow_url: str, repos_cfg: list - ) -> tuple[str, list, str]: - """Setup paths for workflow mode.""" - add_dirs = [] - derived_name = None - cwd_path = self.context.workspace_path - - try: - owner, repo, _ = self._parse_owner_repo(active_workflow_url) - derived_name = repo or "" - if not derived_name: - p = urlparse(active_workflow_url) - parts = [pt for pt in (p.path or "").split("/") if pt] - if parts: - derived_name = parts[-1] - derived_name = (derived_name or "").removesuffix(".git").strip() - - if derived_name: - workflow_path = str( - Path(self.context.workspace_path) / "workflows" / derived_name - ) - if Path(workflow_path).exists(): - cwd_path = workflow_path - logger.info(f"Using workflow as CWD: {derived_name}") - else: - logger.warning( - f"Workflow directory not found: {workflow_path}, using default" - ) - cwd_path = str( - Path(self.context.workspace_path) / "workflows" / "default" - ) - else: - cwd_path = str( - Path(self.context.workspace_path) / "workflows" / "default" - ) - except Exception as e: - logger.warning(f"Failed to derive workflow name: {e}, using default") - cwd_path = str(Path(self.context.workspace_path) / "workflows" / "default") - - # Add all repos as additional directories (repos are in /workspace/repos/{name}) - repos_base = Path(self.context.workspace_path) / "repos" - for r in repos_cfg: - name = (r.get("name") or "").strip() - if name: - repo_path = str(repos_base / name) - if repo_path not in add_dirs: - add_dirs.append(repo_path) - - # Add artifacts and file-uploads directories - artifacts_path = str(Path(self.context.workspace_path) / "artifacts") - if artifacts_path not in add_dirs: - add_dirs.append(artifacts_path) - - file_uploads_path = str(Path(self.context.workspace_path) / "file-uploads") - if file_uploads_path not in add_dirs: - add_dirs.append(file_uploads_path) - - return cwd_path, add_dirs, derived_name - - def _setup_multi_repo_paths(self, repos_cfg: list) -> tuple[str, list]: - """Setup paths for multi-repo mode. 
- - Repos are cloned to /workspace/repos/{name} by both: - - hydrate.sh (init container) - - clone_repo_at_runtime() (runtime addition) - """ - add_dirs = [] - repos_base = Path(self.context.workspace_path) / "repos" - - main_name = (os.getenv("MAIN_REPO_NAME") or "").strip() - if not main_name: - idx_raw = (os.getenv("MAIN_REPO_INDEX") or "").strip() - try: - idx_val = int(idx_raw) if idx_raw else 0 - except Exception: - idx_val = 0 - if idx_val < 0 or idx_val >= len(repos_cfg): - idx_val = 0 - main_name = (repos_cfg[idx_val].get("name") or "").strip() - - # Main repo path is /workspace/repos/{name} - cwd_path = ( - str(repos_base / main_name) if main_name else self.context.workspace_path - ) - - for r in repos_cfg: - name = (r.get("name") or "").strip() - if not name: - continue - # All repos are in /workspace/repos/{name} - p = str(repos_base / name) - if p != cwd_path: - add_dirs.append(p) - - # Add artifacts and file-uploads directories - artifacts_path = str(Path(self.context.workspace_path) / "artifacts") - if artifacts_path not in add_dirs: - add_dirs.append(artifacts_path) - - file_uploads_path = str(Path(self.context.workspace_path) / "file-uploads") - if file_uploads_path not in add_dirs: - add_dirs.append(file_uploads_path) - - return cwd_path, add_dirs - - @staticmethod - def _sanitize_user_context(user_id: str, user_name: str) -> tuple[str, str]: - """Validate and sanitize user context fields to prevent injection attacks.""" - if user_id: - user_id = str(user_id).strip() - if len(user_id) > 255: - user_id = user_id[:255] - sanitized_id = re.sub(r"[^a-zA-Z0-9@._-]", "", user_id) - user_id = sanitized_id - - if user_name: - user_name = str(user_name).strip() - if len(user_name) > 255: - user_name = user_name[:255] - sanitized_name = re.sub(r"[\x00-\x1f\x7f-\x9f]", "", user_name) - user_name = sanitized_name - - return user_id, user_name - - def _map_to_vertex_model(self, model: str) -> str: - """Map Anthropic API model names to Vertex AI model names.""" - model_map = { - "claude-opus-4-6": "claude-opus-4-6", - "claude-opus-4-5": "claude-opus-4-5@20251101", - "claude-opus-4-1": "claude-opus-4-1@20250805", - "claude-sonnet-4-5": "claude-sonnet-4-5@20250929", - "claude-haiku-4-5": "claude-haiku-4-5@20251001", - } - return model_map.get(model, model) - - async def _setup_vertex_credentials(self) -> dict: - """Set up Google Cloud Vertex AI credentials from service account.""" - service_account_path = self.context.get_env( - "GOOGLE_APPLICATION_CREDENTIALS", "" - ).strip() - project_id = self.context.get_env("ANTHROPIC_VERTEX_PROJECT_ID", "").strip() - region = self.context.get_env("CLOUD_ML_REGION", "").strip() - - if not service_account_path: - raise RuntimeError( - "GOOGLE_APPLICATION_CREDENTIALS must be set when CLAUDE_CODE_USE_VERTEX=1" - ) - if not project_id: - raise RuntimeError( - "ANTHROPIC_VERTEX_PROJECT_ID must be set when CLAUDE_CODE_USE_VERTEX=1" - ) - if not region: - raise RuntimeError( - "CLOUD_ML_REGION must be set when CLAUDE_CODE_USE_VERTEX=1" - ) - - if not Path(service_account_path).exists(): - raise RuntimeError( - f"Service account key file not found at {service_account_path}" - ) - - logger.info(f"Vertex AI configured: project={project_id}, region={region}") - return { - "credentials_path": service_account_path, - "project_id": project_id, - "region": region, - } - - async def _prepare_workspace(self) -> AsyncIterator[BaseEvent]: - """Validate workspace prepared by init container. 
- - The init-hydrate container now handles: - - Downloading state from S3 (.claude/, artifacts/, file-uploads/) - - Cloning repos to /workspace/repos/ - - Cloning workflows to /workspace/workflows/ - - Runner just validates and logs what's ready. - """ - workspace = Path(self.context.workspace_path) - logger.info(f"Validating workspace at {workspace}") - - # Check what was hydrated - hydrated_paths = [] - for path_name in [".claude", "artifacts", "file-uploads"]: - path_dir = workspace / path_name - if path_dir.exists(): - file_count = len([f for f in path_dir.rglob("*") if f.is_file()]) - if file_count > 0: - hydrated_paths.append(f"{path_name} ({file_count} files)") - - if hydrated_paths: - logger.info(f"Hydrated from S3: {', '.join(hydrated_paths)}") - else: - logger.info("No state hydrated (fresh session)") - - # No further preparation needed - init container did the work - - async def _validate_prerequisites(self): - """Validate prerequisite files exist for phase-based slash commands.""" - prompt = self.context.get_env("INITIAL_PROMPT", "") - if not prompt: - return - - prompt_lower = prompt.strip().lower() - - prerequisites = { - "/speckit.plan": ( - "spec.md", - "Specification file (spec.md) not found. Please run /speckit.specify first.", - ), - "/speckit.tasks": ( - "plan.md", - "Planning file (plan.md) not found. Please run /speckit.plan first.", - ), - "/speckit.implement": ( - "tasks.md", - "Tasks file (tasks.md) not found. Please run /speckit.tasks first.", - ), - } - - for cmd, (required_file, error_msg) in prerequisites.items(): - if prompt_lower.startswith(cmd): - workspace = Path(self.context.workspace_path) - found = False - - if (workspace / required_file).exists(): - found = True - break - - for subdir in workspace.rglob("specs/*/"): - if (subdir / required_file).exists(): - found = True - break - - if not found: - raise PrerequisiteError(error_msg) - break - - async def _initialize_workflow_if_set(self) -> AsyncIterator[BaseEvent]: - """Validate workflow was cloned by init container.""" - active_workflow_url = (os.getenv("ACTIVE_WORKFLOW_GIT_URL") or "").strip() - if not active_workflow_url: - return - - try: - owner, repo, _ = self._parse_owner_repo(active_workflow_url) - derived_name = repo or "" - if not derived_name: - p = urlparse(active_workflow_url) - parts = [pt for pt in (p.path or "").split("/") if pt] - if parts: - derived_name = parts[-1] - derived_name = (derived_name or "").removesuffix(".git").strip() - - if not derived_name: - logger.warning("Could not derive workflow name from URL") - return - - # Check for cloned workflow (init container uses -clone-temp suffix) - workspace = Path(self.context.workspace_path) - workflow_temp_dir = workspace / "workflows" / f"{derived_name}-clone-temp" - workflow_dir = workspace / "workflows" / derived_name - - if workflow_temp_dir.exists(): - logger.info( - f"Workflow {derived_name} cloned by init container at {workflow_temp_dir.name}" - ) - elif workflow_dir.exists(): - logger.info(f"Workflow {derived_name} available at {workflow_dir.name}") - else: - logger.warning( - f"Workflow {derived_name} not found (init container may have failed to clone)" - ) - - except Exception as e: - logger.error(f"Failed to validate workflow: {e}") - - async def _run_cmd(self, cmd, cwd=None, capture_stdout=False, ignore_errors=False): - """Run a subprocess command asynchronously.""" - cmd_safe = [self._redact_secrets(str(arg)) for arg in cmd] - logger.info(f"Running command: {' '.join(cmd_safe)}") - - proc = await 
asyncio.create_subprocess_exec( - *cmd, - stdout=asyncio.subprocess.PIPE, - stderr=asyncio.subprocess.PIPE, - cwd=cwd or self.context.workspace_path, - ) - stdout_data, stderr_data = await proc.communicate() - stdout_text = stdout_data.decode("utf-8", errors="replace") - stderr_text = stderr_data.decode("utf-8", errors="replace") - - if stdout_text.strip(): - logger.info(f"Command stdout: {self._redact_secrets(stdout_text.strip())}") - if stderr_text.strip(): - logger.info(f"Command stderr: {self._redact_secrets(stderr_text.strip())}") - - if proc.returncode != 0 and not ignore_errors: - raise RuntimeError(stderr_text or f"Command failed: {' '.join(cmd_safe)}") - - if capture_stdout: - return stdout_text - return "" - - def _url_with_token(self, url: str, token: str) -> str: - """Add authentication token to URL.""" - if not token or not url.lower().startswith("http"): - return url - try: - parsed = urlparse(url) - netloc = parsed.netloc - if "@" in netloc: - netloc = netloc.split("@", 1)[1] - - hostname = parsed.hostname or "" - if "gitlab" in hostname.lower(): - auth = f"oauth2:{token}@" - else: - auth = f"x-access-token:{token}@" - - new_netloc = auth + netloc - return urlunparse( - ( - parsed.scheme, - new_netloc, - parsed.path, - parsed.params, - parsed.query, - parsed.fragment, - ) - ) - except Exception: - return url - - def _redact_secrets(self, text: str) -> str: - """Redact tokens and secrets from text for safe logging.""" - if not text: - return text - - text = re.sub(r"gh[pousr]_[a-zA-Z0-9]{36,255}", "gh*_***REDACTED***", text) - text = re.sub(r"sk-ant-[a-zA-Z0-9\-_]{30,200}", "sk-ant-***REDACTED***", text) - text = re.sub(r"pk-lf-[a-zA-Z0-9\-_]{10,100}", "pk-lf-***REDACTED***", text) - text = re.sub(r"sk-lf-[a-zA-Z0-9\-_]{10,100}", "sk-lf-***REDACTED***", text) - text = re.sub( - r"x-access-token:[^@\s]+@", "x-access-token:***REDACTED***@", text - ) - text = re.sub(r"oauth2:[^@\s]+@", "oauth2:***REDACTED***@", text) - text = re.sub(r"://[^:@\s]+:[^@\s]+@", "://***REDACTED***@", text) - text = re.sub( - r'(ANTHROPIC_API_KEY|LANGFUSE_SECRET_KEY|LANGFUSE_PUBLIC_KEY|BOT_TOKEN|GIT_TOKEN)\s*=\s*[^\s\'"]+', - r"\1=***REDACTED***", - text, - ) - return text - - async def _fetch_token_for_url(self, url: str) -> str: - """Fetch appropriate token based on repository URL.""" - try: - parsed = urlparse(url) - hostname = parsed.hostname or "" - - if "gitlab" in hostname.lower(): - token = await self._fetch_gitlab_token() - if token: - logger.info(f"Using fresh GitLab token for {hostname}") - return token - else: - logger.warning(f"No GitLab credentials configured for {url}") - return "" - - # Always fetch fresh GitHub token (PAT or App) - token = await self._fetch_github_token() - if token: - logger.info(f"Using fresh GitHub token for {hostname}") - return token - - except Exception as e: - logger.warning( - f"Failed to parse URL {url}: {e}, falling back to GitHub token" - ) - return os.getenv("GITHUB_TOKEN") or await self._fetch_github_token() - - async def _populate_runtime_credentials(self) -> None: - """Fetch all credentials from backend and populate environment variables. - - This is called before each SDK run to ensure MCP servers have fresh tokens. 
- """ - logger.info("Fetching fresh credentials from backend API...") - - # Fetch Google credentials - google_creds = await self._fetch_google_credentials() - if google_creds.get("accessToken"): - # Write credentials to file for workspace-mcp - creds_dir = Path("/workspace/.google_workspace_mcp/credentials") - creds_dir.mkdir(parents=True, exist_ok=True) - creds_file = creds_dir / "credentials.json" - - # Get OAuth client config from env - client_id = os.getenv("GOOGLE_OAUTH_CLIENT_ID", "") - client_secret = os.getenv("GOOGLE_OAUTH_CLIENT_SECRET", "") - - # Create credentials.json for workspace-mcp - creds_data = { - "token": google_creds.get("accessToken"), - "refresh_token": "", # Backend handles refresh - "token_uri": "https://oauth2.googleapis.com/token", - "client_id": client_id, - "client_secret": client_secret, - "scopes": google_creds.get("scopes", []), - "expiry": google_creds.get("expiresAt", ""), - } - - with open(creds_file, "w") as f: - _json.dump(creds_data, f, indent=2) - creds_file.chmod(0o644) - logger.info("✓ Updated Google credentials file for workspace-mcp") - - # Set USER_GOOGLE_EMAIL for MCP server (from backend API response) - user_email = google_creds.get("email", "") - if user_email and user_email != "user@example.com": - os.environ["USER_GOOGLE_EMAIL"] = user_email - logger.info( - f"✓ Set USER_GOOGLE_EMAIL to {user_email} for workspace-mcp" - ) - - # Fetch Jira credentials - jira_creds = await self._fetch_jira_credentials() - if jira_creds.get("apiToken"): - os.environ["JIRA_URL"] = jira_creds.get("url", "") - os.environ["JIRA_API_TOKEN"] = jira_creds.get("apiToken", "") - os.environ["JIRA_EMAIL"] = jira_creds.get("email", "") - logger.info("✓ Updated Jira credentials in environment") - - # Fetch GitLab token - gitlab_token = await self._fetch_gitlab_token() - if gitlab_token: - os.environ["GITLAB_TOKEN"] = gitlab_token - logger.info("✓ Updated GitLab token in environment") - - # Fetch GitHub token (PAT or App) - github_token = await self._fetch_github_token() - if github_token: - os.environ["GITHUB_TOKEN"] = github_token - logger.info("✓ Updated GitHub token in environment") - - logger.info("Runtime credentials populated successfully") - - async def _fetch_credential(self, credential_type: str) -> dict: - """Fetch credentials from backend API at runtime. 
- - Args: - credential_type: One of 'github', 'google', 'jira', 'gitlab' - - Returns: - Dictionary with credential data or empty dict if unavailable - """ - base = os.getenv("BACKEND_API_URL", "").rstrip("/") - project = os.getenv("PROJECT_NAME") or os.getenv( - "AGENTIC_SESSION_NAMESPACE", "" - ) - project = project.strip() - session_id = self.context.session_id - - if not base or not project or not session_id: - logger.warning( - f"Cannot fetch {credential_type} credentials: missing environment variables (base={base}, project={project}, session={session_id})" - ) - return {} - - url = f"{base}/projects/{project}/agentic-sessions/{session_id}/credentials/{credential_type}" - logger.info(f"Fetching fresh {credential_type} credentials from: {url}") - - req = _urllib_request.Request(url, method="GET") - bot = (os.getenv("BOT_TOKEN") or "").strip() - if bot: - req.add_header("Authorization", f"Bearer {bot}") - - loop = asyncio.get_event_loop() - - def _do_req(): - try: - with _urllib_request.urlopen(req, timeout=10) as resp: - return resp.read().decode("utf-8", errors="replace") - except Exception as e: - logger.warning(f"{credential_type} credential fetch failed: {e}") - return "" - - resp_text = await loop.run_in_executor(None, _do_req) - if not resp_text: - return {} - - try: - data = _json.loads(resp_text) - logger.info( - f"Successfully fetched {credential_type} credentials from backend" - ) - return data - except Exception as e: - logger.error(f"Failed to parse {credential_type} credential response: {e}") - return {} - - async def _fetch_github_token(self) -> str: - """Fetch GitHub token from backend API (always fresh - PAT or minted App token).""" - data = await self._fetch_credential("github") - token = data.get("token", "") - if token: - logger.info("Using fresh GitHub token from backend") - return token - - async def _fetch_google_credentials(self) -> dict: - """Fetch Google OAuth credentials from backend API.""" - data = await self._fetch_credential("google") - if data.get("accessToken"): - logger.info( - f"Using fresh Google credentials from backend (email: {data.get('email', 'unknown')})" - ) - return data - - async def _fetch_jira_credentials(self) -> dict: - """Fetch Jira credentials from backend API.""" - data = await self._fetch_credential("jira") - if data.get("apiToken"): - logger.info( - f"Using Jira credentials from backend (url: {data.get('url', 'unknown')})" - ) - return data - - async def _fetch_gitlab_token(self) -> str: - """Fetch GitLab token from backend API.""" - data = await self._fetch_credential("gitlab") - token = data.get("token", "") - if token: - logger.info( - f"Using fresh GitLab token from backend (instance: {data.get('instanceUrl', 'unknown')})" - ) - return token - - async def _fetch_github_token_legacy(self) -> str: - """Legacy method - kept for backward compatibility.""" - # Build mint URL from environment - base = os.getenv("BACKEND_API_URL", "").rstrip("/") - project = os.getenv("PROJECT_NAME") or os.getenv( - "AGENTIC_SESSION_NAMESPACE", "" - ) - project = project.strip() - session_id = self.context.session_id - - if not base or not project or not session_id: - logger.warning("Cannot fetch GitHub token: missing environment variables") - return "" - - url = f"{base}/projects/{project}/agentic-sessions/{session_id}/github/token" - logger.info(f"Fetching GitHub token from legacy endpoint: {url}") - - req = _urllib_request.Request( - url, data=b"{}", headers={"Content-Type": "application/json"}, method="POST" - ) - bot = (os.getenv("BOT_TOKEN") or 
"").strip() - if bot: - req.add_header("Authorization", f"Bearer {bot}") - - loop = asyncio.get_event_loop() - - def _do_req(): - try: - with _urllib_request.urlopen(req, timeout=10) as resp: - return resp.read().decode("utf-8", errors="replace") - except Exception as e: - logger.warning(f"GitHub token fetch failed: {e}") - return "" - - resp_text = await loop.run_in_executor(None, _do_req) - if not resp_text: - return "" - - try: - data = _json.loads(resp_text) - token = str(data.get("token") or "") - if token: - logger.info("Successfully fetched GitHub token from backend") - return token - except Exception as e: - logger.error(f"Failed to parse token response: {e}") - return "" - - def _parse_owner_repo(self, url: str) -> tuple[str, str, str]: - """Return (owner, name, host) from various URL formats.""" - s = (url or "").strip() - s = s.removesuffix(".git") - host = "github.com" - try: - if s.startswith("http://") or s.startswith("https://"): - p = urlparse(s) - host = p.netloc - parts = [pt for pt in p.path.split("/") if pt] - if len(parts) >= 2: - return parts[0], parts[1], host - if s.startswith("git@") or ":" in s: - s2 = s - if s2.startswith("git@"): - s2 = s2.replace(":", "/", 1) - s2 = s2.replace("git@", "ssh://git@", 1) - p = urlparse(s2) - host = p.hostname or host - parts = [pt for pt in (p.path or "").split("/") if pt] - if len(parts) >= 2: - return parts[-2], parts[-1], host - parts = [pt for pt in s.split("/") if pt] - if len(parts) == 2: - return parts[0], parts[1], host - except Exception: - return "", "", host - return "", "", host - - def _get_repos_config(self) -> list[dict]: - """Read repos mapping from REPOS_JSON env if present. - - Expected format: [{"url": "...", "branch": "main", "autoPush": true}, ...] - Returns: [{"name": "repo-name", "url": "...", "branch": "...", "autoPush": bool}, ...] 
- """ - try: - raw = os.getenv("REPOS_JSON", "").strip() - if not raw: - return [] - data = _json.loads(raw) - if isinstance(data, list): - out = [] - for it in data: - if not isinstance(it, dict): - continue - - # Extract simple format fields - url = str(it.get("url") or "").strip() - # Auto-generate branch from session name if not provided - branch_from_json = it.get("branch") - if branch_from_json and str(branch_from_json).strip(): - branch = str(branch_from_json).strip() - else: - # Fallback: use AGENTIC_SESSION_NAME to match backend logic - session_id = os.getenv("AGENTIC_SESSION_NAME", "").strip() - branch = f"ambient/{session_id}" if session_id else "main" - # Parse autoPush as boolean, defaulting to False for invalid types - auto_push_raw = it.get("autoPush", False) - auto_push = ( - auto_push_raw if isinstance(auto_push_raw, bool) else False - ) - - if not url: - continue - - # Derive repo name from URL if not provided - name = str(it.get("name") or "").strip() - if not name: - try: - owner, repo, _ = self._parse_owner_repo(url) - derived = repo or "" - if not derived: - p = urlparse(url) - parts = [pt for pt in (p.path or "").split("/") if pt] - if parts: - derived = parts[-1] - name = (derived or "").removesuffix(".git").strip() - except Exception: - name = "" - - if name and url: - out.append( - { - "name": name, - "url": url, - "branch": branch, - "autoPush": auto_push, - } - ) - return out - except Exception: - return [] - return [] - - def _expand_env_vars(self, value: Any) -> Any: - """Recursively expand ${VAR} and ${VAR:-default} patterns in config values.""" - if isinstance(value, str): - # Pattern: ${VAR} or ${VAR:-default} - pattern = r"\$\{([^}:]+)(?::-([^}]*))?\}" - - def replace_var(match): - var_name = match.group(1) - default_val = match.group(2) if match.group(2) is not None else "" - return os.environ.get(var_name, default_val) - - return re.sub(pattern, replace_var, value) - elif isinstance(value, dict): - return {k: self._expand_env_vars(v) for k, v in value.items()} - elif isinstance(value, list): - return [self._expand_env_vars(item) for item in value] - return value - - def _load_mcp_config(self, cwd_path: str) -> Optional[dict]: - """Load MCP server configuration from the ambient runner's .mcp.json file.""" - try: - # Allow override via MCP_CONFIG_FILE env var (useful for e2e with minimal MCPs) - mcp_config_file = self.context.get_env( - "MCP_CONFIG_FILE", "/app/claude-runner/.mcp.json" - ) - runner_mcp_file = Path(mcp_config_file) - - if runner_mcp_file.exists() and runner_mcp_file.is_file(): - logger.info(f"Loading MCP config from: {runner_mcp_file}") - with open(runner_mcp_file, "r") as f: - config = _json.load(f) - mcp_servers = config.get("mcpServers", {}) - # Expand environment variables in the config - expanded = self._expand_env_vars(mcp_servers) - logger.info( - f"Expanded MCP config env vars for {len(expanded)} servers" - ) - return expanded - else: - logger.info(f"No MCP config file found at: {runner_mcp_file}") - return None - - except _json.JSONDecodeError as e: - logger.error(f"Failed to parse MCP config: {e}") - return None - except Exception as e: - logger.error(f"Error loading MCP config: {e}") - return None - - def _load_ambient_config(self, cwd_path: str) -> dict: - """Load ambient.json configuration from workflow directory.""" - try: - config_path = Path(cwd_path) / ".ambient" / "ambient.json" - - if not config_path.exists(): - logger.info(f"No ambient.json found at {config_path}, using defaults") - return {} - - with open(config_path, 
"r") as f: - config = _json.load(f) - logger.info(f"Loaded ambient.json: name={config.get('name')}") - return config - - except _json.JSONDecodeError as e: - logger.error(f"Failed to parse ambient.json: {e}") - return {} - except Exception as e: - logger.error(f"Error loading ambient.json: {e}") - return {} - - def _build_workspace_context_prompt( - self, repos_cfg, workflow_name, artifacts_path, ambient_config - ): - """Generate concise system prompt describing workspace layout.""" - prompt = "# Workspace Structure\n\n" - - # Workflow directory (if active) - if workflow_name: - prompt += f"**Working Directory**: workflows/{workflow_name}/ (workflow logic - do not create files here)\n\n" - - # Artifacts - prompt += f"**Artifacts**: {artifacts_path} (create all output files here)\n\n" - - # Uploaded files - file_uploads_path = Path(self.context.workspace_path) / "file-uploads" - if file_uploads_path.exists() and file_uploads_path.is_dir(): - try: - files = sorted( - [f.name for f in file_uploads_path.iterdir() if f.is_file()] - ) - if files: - max_display = 10 - if len(files) <= max_display: - prompt += f"**Uploaded Files**: {', '.join(files)}\n\n" - else: - prompt += f"**Uploaded Files** ({len(files)} total): {', '.join(files[:max_display])}, and {len(files) - max_display} more\n\n" - except Exception: - pass - else: - prompt += "**Uploaded Files**: None\n\n" - - # Repositories - if repos_cfg: - session_id = os.getenv("AGENTIC_SESSION_NAME", "").strip() - feature_branch = f"ambient/{session_id}" if session_id else None - - repo_names = [ - repo.get("name", f"repo-{i}") for i, repo in enumerate(repos_cfg) - ] - if len(repo_names) <= 5: - prompt += f"**Repositories**: {', '.join([f'repos/{name}/' for name in repo_names])}\n" - else: - prompt += f"**Repositories** ({len(repo_names)} total): {', '.join([f'repos/{name}/' for name in repo_names[:5]])}, and {len(repo_names) - 5} more\n" - - if feature_branch: - prompt += f"**Working Branch**: `{feature_branch}` (all repos are on this feature branch)\n\n" - else: - prompt += "\n" - - # Add git push instructions for repos with autoPush enabled - auto_push_repos = [ - repo for repo in repos_cfg if repo.get("autoPush", False) - ] - if auto_push_repos: - push_branch = feature_branch or "ambient/" - - prompt += "## Git Push Instructions\n\n" - prompt += "The following repositories have auto-push enabled. When you make changes to these repositories, you MUST commit and push your changes:\n\n" - for repo in auto_push_repos: - repo_name = repo.get("name", "unknown") - prompt += f"- **repos/{repo_name}/**\n" - prompt += "\nAfter making changes to any auto-push repository:\n" - prompt += "1. Use `git add` to stage your changes\n" - prompt += '2. Use `git commit -m "description"` to commit with a descriptive message\n' - prompt += f"3. 
Use `git push origin {push_branch}` to push to the remote repository\n\n" - - # MCP Integration Setup Instructions - prompt += "## MCP Integrations\n" - prompt += "If you need Google Drive access: Ask user to go to Integrations page in Ambient and authenticate with Google Drive.\n" - prompt += "If you need Jira access: Ask user to go to Workspace Settings in Ambient and configure Jira credentials there.\n\n" - - # Workflow instructions (if any) - if ambient_config.get("systemPrompt"): - prompt += f"## Workflow Instructions\n{ambient_config['systemPrompt']}\n\n" - - return prompt - - # NOTE: Google credential copy functions removed - credentials now fetched at runtime via backend API - # This supersedes PR #562's volume mounting approach with just-in-time credential fetching - # See _populate_runtime_credentials() for new approach diff --git a/components/runners/claude-code-runner/auth.py b/components/runners/claude-code-runner/auth.py new file mode 100644 index 000000000..27d4cc77d --- /dev/null +++ b/components/runners/claude-code-runner/auth.py @@ -0,0 +1,351 @@ +""" +Authentication and credential management for the Claude Code runner. + +Handles Anthropic API keys, Vertex AI setup, and runtime credential +fetching from the backend API (GitHub, Google, Jira, GitLab). +""" + +import asyncio +import json as _json +import logging +import os +import re +from pathlib import Path +from urllib import request as _urllib_request +from urllib.parse import urlparse + +from context import RunnerContext + +logger = logging.getLogger(__name__) + + +# --------------------------------------------------------------------------- +# User context sanitization +# --------------------------------------------------------------------------- + +def sanitize_user_context(user_id: str, user_name: str) -> tuple[str, str]: + """Validate and sanitize user context fields to prevent injection attacks.""" + if user_id: + user_id = str(user_id).strip() + if len(user_id) > 255: + user_id = user_id[:255] + user_id = re.sub(r"[^a-zA-Z0-9@._-]", "", user_id) + + if user_name: + user_name = str(user_name).strip() + if len(user_name) > 255: + user_name = user_name[:255] + user_name = re.sub(r"[\x00-\x1f\x7f-\x9f]", "", user_name) + + return user_id, user_name + + +# --------------------------------------------------------------------------- +# Model helpers +# --------------------------------------------------------------------------- + +# Anthropic API → Vertex AI model name mapping +VERTEX_MODEL_MAP: dict[str, str] = { + "claude-opus-4-5": "claude-opus-4-5@20251101", + "claude-opus-4-1": "claude-opus-4-1@20250805", + "claude-sonnet-4-5": "claude-sonnet-4-5@20250929", + "claude-haiku-4-5": "claude-haiku-4-5@20251001", +} + + +def map_to_vertex_model(model: str) -> str: + """Map Anthropic API model names to Vertex AI model names.""" + return VERTEX_MODEL_MAP.get(model, model) + + +async def setup_vertex_credentials(context: RunnerContext) -> dict: + """Set up Google Cloud Vertex AI credentials from service account. + + Returns: + Dict with credentials_path, project_id, region. + + Raises: + RuntimeError: If required environment variables are missing. 
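A quick sanity sketch of the mapping behavior above (values taken from VERTEX_MODEL_MAP; the assert-style usage is illustrative, not part of the patch):

```python
from auth import map_to_vertex_model

# Known Anthropic API names are pinned to dated Vertex AI IDs:
assert map_to_vertex_model("claude-sonnet-4-5") == "claude-sonnet-4-5@20250929"
# Anything else -- including an already-pinned Vertex ID -- passes through unchanged:
assert map_to_vertex_model("claude-sonnet-4-5@20250929") == "claude-sonnet-4-5@20250929"
assert map_to_vertex_model("claude-unknown-model-99") == "claude-unknown-model-99"
```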
+ """ + service_account_path = context.get_env( + "GOOGLE_APPLICATION_CREDENTIALS", "" + ).strip() + project_id = context.get_env("ANTHROPIC_VERTEX_PROJECT_ID", "").strip() + region = context.get_env("CLOUD_ML_REGION", "").strip() + + if not service_account_path: + raise RuntimeError( + "GOOGLE_APPLICATION_CREDENTIALS must be set when CLAUDE_CODE_USE_VERTEX=1" + ) + if not project_id: + raise RuntimeError( + "ANTHROPIC_VERTEX_PROJECT_ID must be set when CLAUDE_CODE_USE_VERTEX=1" + ) + if not region: + raise RuntimeError( + "CLOUD_ML_REGION must be set when CLAUDE_CODE_USE_VERTEX=1" + ) + + if not Path(service_account_path).exists(): + raise RuntimeError( + f"Service account key file not found at {service_account_path}" + ) + + logger.info(f"Vertex AI configured: project={project_id}, region={region}") + return { + "credentials_path": service_account_path, + "project_id": project_id, + "region": region, + } + + +# --------------------------------------------------------------------------- +# Backend credential fetching +# --------------------------------------------------------------------------- + +async def _fetch_credential(context: RunnerContext, credential_type: str) -> dict: + """Fetch credentials from backend API at runtime. + + Args: + context: Runner context with session_id. + credential_type: One of 'github', 'google', 'jira', 'gitlab'. + + Returns: + Dictionary with credential data or empty dict if unavailable. + """ + base = os.getenv("BACKEND_API_URL", "").rstrip("/") + project = os.getenv("PROJECT_NAME") or os.getenv( + "AGENTIC_SESSION_NAMESPACE", "" + ) + project = project.strip() + session_id = context.session_id + + if not base or not project or not session_id: + logger.warning( + f"Cannot fetch {credential_type} credentials: missing environment " + f"variables (base={base}, project={project}, session={session_id})" + ) + return {} + + url = ( + f"{base}/projects/{project}/agentic-sessions/" + f"{session_id}/credentials/{credential_type}" + ) + logger.info(f"Fetching fresh {credential_type} credentials from: {url}") + + req = _urllib_request.Request(url, method="GET") + bot = (os.getenv("BOT_TOKEN") or "").strip() + if bot: + req.add_header("Authorization", f"Bearer {bot}") + + loop = asyncio.get_event_loop() + + def _do_req(): + try: + with _urllib_request.urlopen(req, timeout=10) as resp: + return resp.read().decode("utf-8", errors="replace") + except Exception as e: + logger.warning(f"{credential_type} credential fetch failed: {e}") + return "" + + resp_text = await loop.run_in_executor(None, _do_req) + if not resp_text: + return {} + + try: + data = _json.loads(resp_text) + logger.info( + f"Successfully fetched {credential_type} credentials from backend" + ) + return data + except Exception as e: + logger.error( + f"Failed to parse {credential_type} credential response: {e}" + ) + return {} + + +async def fetch_github_token(context: RunnerContext) -> str: + """Fetch GitHub token from backend API (always fresh — PAT or minted App token).""" + data = await _fetch_credential(context, "github") + token = data.get("token", "") + if token: + logger.info("Using fresh GitHub token from backend") + return token + + +async def fetch_google_credentials(context: RunnerContext) -> dict: + """Fetch Google OAuth credentials from backend API.""" + data = await _fetch_credential(context, "google") + if data.get("accessToken"): + logger.info( + f"Using fresh Google credentials from backend " + f"(email: {data.get('email', 'unknown')})" + ) + return data + + +async def 
fetch_jira_credentials(context: RunnerContext) -> dict: + """Fetch Jira credentials from backend API.""" + data = await _fetch_credential(context, "jira") + if data.get("apiToken"): + logger.info( + f"Using Jira credentials from backend " + f"(url: {data.get('url', 'unknown')})" + ) + return data + + +async def fetch_gitlab_token(context: RunnerContext) -> str: + """Fetch GitLab token from backend API.""" + data = await _fetch_credential(context, "gitlab") + token = data.get("token", "") + if token: + logger.info( + f"Using fresh GitLab token from backend " + f"(instance: {data.get('instanceUrl', 'unknown')})" + ) + return token + + +async def fetch_token_for_url(context: RunnerContext, url: str) -> str: + """Fetch appropriate token based on repository URL host.""" + try: + parsed = urlparse(url) + hostname = parsed.hostname or "" + + if "gitlab" in hostname.lower(): + token = await fetch_gitlab_token(context) + if token: + logger.info(f"Using fresh GitLab token for {hostname}") + return token + else: + logger.warning(f"No GitLab credentials configured for {url}") + return "" + + token = await fetch_github_token(context) + if token: + logger.info(f"Using fresh GitHub token for {hostname}") + return token + + except Exception as e: + logger.warning( + f"Failed to parse URL {url}: {e}, falling back to GitHub token" + ) + return os.getenv("GITHUB_TOKEN") or await fetch_github_token(context) + + +async def populate_runtime_credentials(context: RunnerContext) -> None: + """Fetch all credentials from backend and populate environment variables. + + Called before each SDK run to ensure MCP servers have fresh tokens. + """ + logger.info("Fetching fresh credentials from backend API...") + + # Google credentials + google_creds = await fetch_google_credentials(context) + if google_creds.get("accessToken"): + creds_dir = Path("/workspace/.google_workspace_mcp/credentials") + creds_dir.mkdir(parents=True, exist_ok=True) + creds_file = creds_dir / "credentials.json" + + client_id = os.getenv("GOOGLE_OAUTH_CLIENT_ID", "") + client_secret = os.getenv("GOOGLE_OAUTH_CLIENT_SECRET", "") + + creds_data = { + "token": google_creds.get("accessToken"), + "refresh_token": "", + "token_uri": "https://oauth2.googleapis.com/token", + "client_id": client_id, + "client_secret": client_secret, + "scopes": google_creds.get("scopes", []), + "expiry": google_creds.get("expiresAt", ""), + } + + with open(creds_file, "w") as f: + _json.dump(creds_data, f, indent=2) + creds_file.chmod(0o644) + logger.info("✓ Updated Google credentials file for workspace-mcp") + + user_email = google_creds.get("email", "") + if user_email and user_email != "user@example.com": + os.environ["USER_GOOGLE_EMAIL"] = user_email + logger.info( + f"✓ Set USER_GOOGLE_EMAIL to {user_email} for workspace-mcp" + ) + + # Jira credentials + jira_creds = await fetch_jira_credentials(context) + if jira_creds.get("apiToken"): + os.environ["JIRA_URL"] = jira_creds.get("url", "") + os.environ["JIRA_API_TOKEN"] = jira_creds.get("apiToken", "") + os.environ["JIRA_EMAIL"] = jira_creds.get("email", "") + logger.info("✓ Updated Jira credentials in environment") + + # GitLab token + gitlab_token = await fetch_gitlab_token(context) + if gitlab_token: + os.environ["GITLAB_TOKEN"] = gitlab_token + logger.info("✓ Updated GitLab token in environment") + + # GitHub token + github_token = await fetch_github_token(context) + if github_token: + os.environ["GITHUB_TOKEN"] = github_token + logger.info("✓ Updated GitHub token in environment") + + logger.info("Runtime credentials 
populated successfully") + + +async def fetch_github_token_legacy(context: RunnerContext) -> str: + """Legacy method — kept for backward compatibility.""" + base = os.getenv("BACKEND_API_URL", "").rstrip("/") + project = os.getenv("PROJECT_NAME") or os.getenv( + "AGENTIC_SESSION_NAMESPACE", "" + ) + project = project.strip() + session_id = context.session_id + + if not base or not project or not session_id: + logger.warning("Cannot fetch GitHub token: missing environment variables") + return "" + + url = ( + f"{base}/projects/{project}/agentic-sessions/" + f"{session_id}/github/token" + ) + logger.info(f"Fetching GitHub token from legacy endpoint: {url}") + + req = _urllib_request.Request( + url, + data=b"{}", + headers={"Content-Type": "application/json"}, + method="POST", + ) + bot = (os.getenv("BOT_TOKEN") or "").strip() + if bot: + req.add_header("Authorization", f"Bearer {bot}") + + loop = asyncio.get_event_loop() + + def _do_req(): + try: + with _urllib_request.urlopen(req, timeout=10) as resp: + return resp.read().decode("utf-8", errors="replace") + except Exception as e: + logger.warning(f"GitHub token fetch failed: {e}") + return "" + + resp_text = await loop.run_in_executor(None, _do_req) + if not resp_text: + return "" + + try: + data = _json.loads(resp_text) + token = str(data.get("token") or "") + if token: + logger.info("Successfully fetched GitHub token from backend") + return token + except Exception as e: + logger.error(f"Failed to parse token response: {e}") + return "" diff --git a/components/runners/claude-code-runner/config.py b/components/runners/claude-code-runner/config.py new file mode 100644 index 000000000..18bd328fb --- /dev/null +++ b/components/runners/claude-code-runner/config.py @@ -0,0 +1,150 @@ +""" +Configuration loading for the Claude Code runner. + +Reads ambient.json, MCP server config, and repository configuration +from environment variables and the filesystem. +""" + +import json as _json +import logging +import os +from pathlib import Path +from typing import Optional + +from context import RunnerContext +from utils import expand_env_vars, parse_owner_repo + +logger = logging.getLogger(__name__) + + +def load_ambient_config(cwd_path: str) -> dict: + """Load ambient.json configuration from workflow directory. + + Returns: + Parsed config dict, or empty dict if not found / invalid. + """ + try: + config_path = Path(cwd_path) / ".ambient" / "ambient.json" + + if not config_path.exists(): + logger.info( + f"No ambient.json found at {config_path}, using defaults" + ) + return {} + + with open(config_path, "r") as f: + config = _json.load(f) + logger.info(f"Loaded ambient.json: name={config.get('name')}") + return config + + except _json.JSONDecodeError as e: + logger.error(f"Failed to parse ambient.json: {e}") + return {} + except Exception as e: + logger.error(f"Error loading ambient.json: {e}") + return {} + + +def load_mcp_config(context: RunnerContext, cwd_path: str) -> Optional[dict]: + """Load MCP server configuration from the ambient runner's .mcp.json file. + + Returns: + Dict of MCP server configs with env vars expanded, or None. 
+ """ + try: + mcp_config_file = context.get_env( + "MCP_CONFIG_FILE", "/app/claude-runner/.mcp.json" + ) + runner_mcp_file = Path(mcp_config_file) + + if runner_mcp_file.exists() and runner_mcp_file.is_file(): + logger.info(f"Loading MCP config from: {runner_mcp_file}") + with open(runner_mcp_file, "r") as f: + config = _json.load(f) + mcp_servers = config.get("mcpServers", {}) + expanded = expand_env_vars(mcp_servers) + logger.info( + f"Expanded MCP config env vars for {len(expanded)} servers" + ) + return expanded + else: + logger.info(f"No MCP config file found at: {runner_mcp_file}") + return None + + except _json.JSONDecodeError as e: + logger.error(f"Failed to parse MCP config: {e}") + return None + except Exception as e: + logger.error(f"Error loading MCP config: {e}") + return None + + +def get_repos_config() -> list[dict]: + """Read repos mapping from REPOS_JSON env if present. + + Expected format:: + + [{"url": "...", "branch": "main", "autoPush": true}, ...] + + Returns: + List of dicts: ``[{"name": ..., "url": ..., "branch": ..., "autoPush": bool}, ...]`` + """ + try: + raw = os.getenv("REPOS_JSON", "").strip() + if not raw: + return [] + data = _json.loads(raw) + if isinstance(data, list): + out: list[dict] = [] + for it in data: + if not isinstance(it, dict): + continue + + url = str(it.get("url") or "").strip() + branch_from_json = it.get("branch") + if branch_from_json and str(branch_from_json).strip(): + branch = str(branch_from_json).strip() + else: + session_id = os.getenv("AGENTIC_SESSION_NAME", "").strip() + branch = ( + f"ambient/{session_id}" if session_id else "main" + ) + auto_push_raw = it.get("autoPush", False) + auto_push = ( + auto_push_raw if isinstance(auto_push_raw, bool) else False + ) + + if not url: + continue + + name = str(it.get("name") or "").strip() + if not name: + try: + _owner, repo, _ = parse_owner_repo(url) + derived = repo or "" + if not derived: + from urllib.parse import urlparse + + p = urlparse(url) + parts = [ + pt for pt in (p.path or "").split("/") if pt + ] + if parts: + derived = parts[-1] + name = (derived or "").removesuffix(".git").strip() + except Exception: + name = "" + + if name and url: + out.append( + { + "name": name, + "url": url, + "branch": branch, + "autoPush": auto_push, + } + ) + return out + except Exception: + return [] + return [] diff --git a/components/runners/claude-code-runner/main.py b/components/runners/claude-code-runner/main.py index ea5a607b3..f38af794e 100644 --- a/components/runners/claude-code-runner/main.py +++ b/components/runners/claude-code-runner/main.py @@ -696,8 +696,9 @@ async def get_mcp_status(): if os.path.exists(workflow_path): cwd_path = workflow_path - # Use adapter's method to load MCP config (same as it does during runs) - mcp_config = adapter._load_mcp_config(cwd_path) + # Load MCP config using the config module (same as adapter does during runs) + import config as runner_config + mcp_config = runner_config.load_mcp_config(adapter.context, cwd_path) logger.info(f"MCP config: {mcp_config}") if mcp_config: diff --git a/components/runners/claude-code-runner/prompts.py b/components/runners/claude-code-runner/prompts.py new file mode 100644 index 000000000..4008057dd --- /dev/null +++ b/components/runners/claude-code-runner/prompts.py @@ -0,0 +1,200 @@ +""" +System prompt construction and prompt constants for the Claude Code runner. 
diff --git a/components/runners/claude-code-runner/main.py b/components/runners/claude-code-runner/main.py
index ea5a607b3..f38af794e 100644
--- a/components/runners/claude-code-runner/main.py
+++ b/components/runners/claude-code-runner/main.py
@@ -696,8 +696,9 @@ async def get_mcp_status():
         if os.path.exists(workflow_path):
             cwd_path = workflow_path
 
-        # Use adapter's method to load MCP config (same as it does during runs)
-        mcp_config = adapter._load_mcp_config(cwd_path)
+        # Load MCP config using the config module (same as adapter does during runs)
+        import config as runner_config
+        mcp_config = runner_config.load_mcp_config(adapter.context, cwd_path)
 
         logger.info(f"MCP config: {mcp_config}")
         if mcp_config:
diff --git a/components/runners/claude-code-runner/prompts.py b/components/runners/claude-code-runner/prompts.py
new file mode 100644
index 000000000..4008057dd
--- /dev/null
+++ b/components/runners/claude-code-runner/prompts.py
@@ -0,0 +1,200 @@
+"""
+System prompt construction and prompt constants for the Claude Code runner.
+
+All hardcoded prompt strings are defined as constants here, and the main
+build function assembles them into the workspace context prompt that gets
+appended to the Claude Code system prompt preset.
+"""
+
+import logging
+import os
+from pathlib import Path
+
+logger = logging.getLogger(__name__)
+
+
+# ---------------------------------------------------------------------------
+# Prompt constants
+# ---------------------------------------------------------------------------
+
+WORKSPACE_STRUCTURE_HEADER = "# Workspace Structure\n\n"
+
+MCP_INTEGRATIONS_PROMPT = (
+    "## MCP Integrations\n"
+    "If you need Google Drive access: Ask user to go to Integrations page "
+    "in Ambient and authenticate with Google Drive.\n"
+    "If you need Jira access: Ask user to go to Workspace Settings in Ambient "
+    "and configure Jira credentials there.\n\n"
+)
+
+GIT_PUSH_INSTRUCTIONS_HEADER = "## Git Push Instructions\n\n"
+
+GIT_PUSH_INSTRUCTIONS_BODY = (
+    "The following repositories have auto-push enabled. When you make changes "
+    "to these repositories, you MUST commit and push your changes:\n\n"
+)
+
+GIT_PUSH_STEPS = (
+    "\nAfter making changes to any auto-push repository:\n"
+    "1. Use `git add` to stage your changes\n"
+    '2. Use `git commit -m "description"` to commit with a descriptive message\n'
+    "3. Use `git push origin {branch}` to push to the remote repository\n\n"
+)
+
+RUBRIC_EVALUATION_HEADER = "## Rubric Evaluation\n\n"
+
+RUBRIC_EVALUATION_INTRO = (
+    "This workflow includes a scoring rubric for evaluating outputs. "
+    "The rubric is located at `.ambient/rubric.md`.\n\n"
+)
+
+RUBRIC_EVALUATION_PROCESS = (
+    "**Process**:\n"
+    "1. Read `.ambient/rubric.md` using the Read tool\n"
+    "2. Evaluate the output against each criterion\n"
+    "3. Call `evaluate_rubric` (via the rubric MCP server) "
+    "with your scores and reasoning\n\n"
+    "**Important**: Always read the rubric first before scoring. "
+    "Provide honest, calibrated scores with clear reasoning.\n\n"
+)
+
+RESTART_TOOL_DESCRIPTION = (
+    "Restart the Claude session to recover from issues, clear state, "
+    "or get a fresh connection. Use this if you detect you're in a "
+    "broken state or need to reset."
+)
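The `{branch}` placeholder in GIT_PUSH_STEPS is the only templated field; the builder below fills it with str.format. A small sketch:

```python
from prompts import GIT_PUSH_STEPS

# Rendered with a hypothetical session branch:
print(GIT_PUSH_STEPS.format(branch="ambient/demo-123"))
# ...
# 3. Use `git push origin ambient/demo-123` to push to the remote repository
```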
+ """ + prompt = WORKSPACE_STRUCTURE_HEADER + + # Workflow directory + if workflow_name: + prompt += ( + f"**Working Directory**: workflows/{workflow_name}/ " + "(workflow logic - do not create files here)\n\n" + ) + + # Artifacts + prompt += f"**Artifacts**: {artifacts_path} (create all output files here)\n\n" + + # Uploaded files + file_uploads_path = Path(workspace_path) / "file-uploads" + if file_uploads_path.exists() and file_uploads_path.is_dir(): + try: + files = sorted( + [f.name for f in file_uploads_path.iterdir() if f.is_file()] + ) + if files: + max_display = 10 + if len(files) <= max_display: + prompt += f"**Uploaded Files**: {', '.join(files)}\n\n" + else: + prompt += ( + f"**Uploaded Files** ({len(files)} total): " + f"{', '.join(files[:max_display])}, " + f"and {len(files) - max_display} more\n\n" + ) + except Exception: + pass + else: + prompt += "**Uploaded Files**: None\n\n" + + # Repositories + if repos_cfg: + session_id = os.getenv("AGENTIC_SESSION_NAME", "").strip() + feature_branch = f"ambient/{session_id}" if session_id else None + + repo_names = [ + repo.get("name", f"repo-{i}") for i, repo in enumerate(repos_cfg) + ] + if len(repo_names) <= 5: + prompt += ( + f"**Repositories**: " + f"{', '.join([f'repos/{name}/' for name in repo_names])}\n" + ) + else: + prompt += ( + f"**Repositories** ({len(repo_names)} total): " + f"{', '.join([f'repos/{name}/' for name in repo_names[:5]])}, " + f"and {len(repo_names) - 5} more\n" + ) + + if feature_branch: + prompt += ( + f"**Working Branch**: `{feature_branch}` " + "(all repos are on this feature branch)\n\n" + ) + else: + prompt += "\n" + + # Git push instructions for auto-push repos + auto_push_repos = [ + repo for repo in repos_cfg if repo.get("autoPush", False) + ] + if auto_push_repos: + push_branch = feature_branch or "ambient/" + prompt += GIT_PUSH_INSTRUCTIONS_HEADER + prompt += GIT_PUSH_INSTRUCTIONS_BODY + for repo in auto_push_repos: + repo_name = repo.get("name", "unknown") + prompt += f"- **repos/{repo_name}/**\n" + prompt += GIT_PUSH_STEPS.format(branch=push_branch) + + # MCP integration setup instructions + prompt += MCP_INTEGRATIONS_PROMPT + + # Workflow instructions + if ambient_config.get("systemPrompt"): + prompt += ( + f"## Workflow Instructions\n" + f"{ambient_config['systemPrompt']}\n\n" + ) + + # Rubric evaluation instructions + prompt += _build_rubric_prompt_section(ambient_config) + + return prompt + + +def _build_rubric_prompt_section(ambient_config: dict) -> str: + """Build the rubric evaluation section for the system prompt. + + Returns empty string if no rubric config is present. 
+ """ + rubric_config = ambient_config.get("rubric", {}) + if not rubric_config: + return "" + + section = RUBRIC_EVALUATION_HEADER + section += RUBRIC_EVALUATION_INTRO + + activation_prompt = rubric_config.get("activationPrompt", "") + if activation_prompt: + section += f"**When to evaluate**: {activation_prompt}\n\n" + + section += RUBRIC_EVALUATION_PROCESS + + return section diff --git a/components/runners/claude-code-runner/pyproject.toml b/components/runners/claude-code-runner/pyproject.toml index a36cafa92..093186cf3 100644 --- a/components/runners/claude-code-runner/pyproject.toml +++ b/components/runners/claude-code-runner/pyproject.toml @@ -43,7 +43,8 @@ dev-dependencies = [ ] [tool.setuptools] -py-modules = ["main", "adapter", "context", "observability", "security_utils"] +py-modules = ["main", "adapter", "auth", "config", "context", "observability", "prompts", "security_utils", "utils", "workspace"] +packages = ["tools"] [build-system] requires = ["setuptools>=61.0"] diff --git a/components/runners/claude-code-runner/tests/test_auto_push.py b/components/runners/claude-code-runner/tests/test_auto_push.py index 1fd600ad6..4351eadff 100644 --- a/components/runners/claude-code-runner/tests/test_auto_push.py +++ b/components/runners/claude-code-runner/tests/test_auto_push.py @@ -1,27 +1,28 @@ -"""Unit tests for autoPush functionality in adapter.py.""" +"""Unit tests for autoPush functionality.""" import json import os import sys +from pathlib import Path from unittest.mock import MagicMock, Mock, patch import pytest -# Mock ag_ui module before importing adapter +# Add parent directory to path +runner_dir = Path(__file__).parent.parent +if str(runner_dir) not in sys.path: + sys.path.insert(0, str(runner_dir)) + +# Mock ag_ui module before importing modules sys.modules["ag_ui"] = Mock() sys.modules["ag_ui.core"] = Mock() -sys.modules["context"] = Mock() - -class TestGetReposConfig: - """Tests for _get_repos_config method.""" +from config import get_repos_config # type: ignore[import] +from prompts import build_workspace_context_prompt # type: ignore[import] - def setup_method(self): - """Set up test fixtures.""" - # Import here after mocking dependencies - from adapter import ClaudeCodeAdapter - self.adapter = ClaudeCodeAdapter() +class TestGetReposConfig: + """Tests for config.get_repos_config function.""" def test_parse_simple_repo_with_autopush_true(self): """Test parsing repo with autoPush=true.""" @@ -36,7 +37,7 @@ def test_parse_simple_repo_with_autopush_true(self): ) with patch.dict(os.environ, {"REPOS_JSON": repos_json}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert len(result) == 1 assert result[0]["url"] == "https://github.com/owner/repo.git" @@ -57,7 +58,7 @@ def test_parse_simple_repo_with_autopush_false(self): ) with patch.dict(os.environ, {"REPOS_JSON": repos_json}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert len(result) == 1 assert result[0]["autoPush"] is False @@ -69,7 +70,7 @@ def test_parse_repo_without_autopush(self): ) with patch.dict(os.environ, {"REPOS_JSON": repos_json}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert len(result) == 1 assert result[0]["autoPush"] is False @@ -97,7 +98,7 @@ def test_parse_multiple_repos_mixed_autopush(self): ) with patch.dict(os.environ, {"REPOS_JSON": repos_json}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert len(result) == 3 assert result[0]["autoPush"] is True @@ -118,7 +119,7 @@ def 
test_parse_repo_with_explicit_name(self): ) with patch.dict(os.environ, {"REPOS_JSON": repos_json}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert len(result) == 1 assert result[0]["name"] == "my-custom-repo" @@ -127,21 +128,21 @@ def test_parse_repo_with_explicit_name(self): def test_parse_empty_repos_json(self): """Test parsing empty REPOS_JSON.""" with patch.dict(os.environ, {"REPOS_JSON": ""}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert result == [] def test_parse_missing_repos_json(self): """Test parsing when REPOS_JSON not set.""" with patch.dict(os.environ, {}, clear=True): - result = self.adapter._get_repos_config() + result = get_repos_config() assert result == [] def test_parse_invalid_json(self): """Test parsing invalid JSON returns empty list.""" with patch.dict(os.environ, {"REPOS_JSON": "invalid-json{"}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert result == [] @@ -150,7 +151,7 @@ def test_parse_non_list_json(self): repos_json = json.dumps({"url": "https://github.com/owner/repo.git"}) with patch.dict(os.environ, {"REPOS_JSON": repos_json}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert result == [] @@ -159,7 +160,7 @@ def test_parse_repo_without_url(self): repos_json = json.dumps([{"branch": "main", "autoPush": True}]) with patch.dict(os.environ, {"REPOS_JSON": repos_json}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert result == [] @@ -175,7 +176,7 @@ def test_derive_repo_name_from_url(self): repos_json = json.dumps([{"url": url, "autoPush": True}]) with patch.dict(os.environ, {"REPOS_JSON": repos_json}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert len(result) == 1 assert result[0]["name"] == expected_name @@ -192,7 +193,7 @@ def test_autopush_with_invalid_string_type(self): ) with patch.dict(os.environ, {"REPOS_JSON": repos_json}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert len(result) == 1 # Invalid type should default to False @@ -210,7 +211,7 @@ def test_autopush_with_invalid_number_type(self): ) with patch.dict(os.environ, {"REPOS_JSON": repos_json}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert len(result) == 1 # Invalid type should default to False @@ -228,7 +229,7 @@ def test_autopush_with_null_value(self): ) with patch.dict(os.environ, {"REPOS_JSON": repos_json}): - result = self.adapter._get_repos_config() + result = get_repos_config() assert len(result) == 1 # null should default to False @@ -236,19 +237,7 @@ def test_autopush_with_null_value(self): class TestBuildWorkspaceContextPrompt: - """Tests for _build_workspace_context_prompt method.""" - - def setup_method(self): - """Set up test fixtures.""" - # Import here after mocking dependencies - from adapter import ClaudeCodeAdapter - - self.adapter = ClaudeCodeAdapter() - - # Create a mock context - mock_context = MagicMock() - mock_context.workspace_path = "/workspace" - self.adapter.context = mock_context + """Tests for prompts.build_workspace_context_prompt function.""" def test_prompt_includes_git_instructions_with_autopush(self): """Test that git push instructions are included when autoPush=true.""" @@ -261,11 +250,12 @@ def test_prompt_includes_git_instructions_with_autopush(self): } ] - prompt = self.adapter._build_workspace_context_prompt( + prompt = build_workspace_context_prompt( repos_cfg=repos_cfg, 
             workflow_name=None,
             artifacts_path="artifacts",
             ambient_config={},
+            workspace_path="/workspace",
         )
 
         # Verify git instructions are present
@@ -287,11 +277,12 @@ def test_prompt_excludes_git_instructions_without_autopush(self):
             }
         ]
 
-        prompt = self.adapter._build_workspace_context_prompt(
+        prompt = build_workspace_context_prompt(
             repos_cfg=repos_cfg,
             workflow_name=None,
             artifacts_path="artifacts",
             ambient_config={},
+            workspace_path="/workspace",
         )
 
         # Verify git instructions are NOT present
@@ -323,11 +314,12 @@ def test_prompt_includes_multiple_autopush_repos(self):
             },
         ]
 
-        prompt = self.adapter._build_workspace_context_prompt(
+        prompt = build_workspace_context_prompt(
             repos_cfg=repos_cfg,
             workflow_name=None,
             artifacts_path="artifacts",
             ambient_config={},
+            workspace_path="/workspace",
         )
 
         # Verify both autoPush repos are listed
@@ -364,11 +356,12 @@ def test_prompt_with_workflow(self):
             }
         ]
 
-        prompt = self.adapter._build_workspace_context_prompt(
+        prompt = build_workspace_context_prompt(
             repos_cfg=repos_cfg,
             workflow_name="test-workflow",
             artifacts_path="artifacts",
             ambient_config={},
+            workspace_path="/workspace",
         )
 
         # Should include both workflow info and git instructions
diff --git a/components/runners/claude-code-runner/tests/test_model_mapping.py b/components/runners/claude-code-runner/tests/test_model_mapping.py
index 3e8decfe9..f4ac24610 100644
--- a/components/runners/claude-code-runner/tests/test_model_mapping.py
+++ b/components/runners/claude-code-runner/tests/test_model_mapping.py
@@ -1,5 +1,5 @@
 """
-Test cases for ClaudeCodeAdapter._map_to_vertex_model()
+Test cases for auth.map_to_vertex_model()
 
 This module tests the model name mapping from Anthropic API model names
 to Vertex AI model identifiers.
@@ -10,12 +10,12 @@
 
 import pytest
 
-# Add parent directory to path for importing adapter module
-adapter_dir = Path(__file__).parent.parent
-if str(adapter_dir) not in sys.path:
-    sys.path.insert(0, str(adapter_dir))
+# Add parent directory to path for importing auth module
+runner_dir = Path(__file__).parent.parent
+if str(runner_dir) not in sys.path:
+    sys.path.insert(0, str(runner_dir))
 
-from adapter import ClaudeCodeAdapter  # type: ignore[import]
+from auth import map_to_vertex_model  # type: ignore[import]
 
 
 class TestMapToVertexModel:
@@ -23,77 +23,68 @@ class TestMapToVertexModel:
 
     def test_map_opus_4_5(self):
         """Test mapping for Claude Opus 4.5"""
-        adapter = ClaudeCodeAdapter()
-        result = adapter._map_to_vertex_model("claude-opus-4-5")
+        result = map_to_vertex_model("claude-opus-4-5")
         assert result == "claude-opus-4-5@20251101"
 
     def test_map_opus_4_1(self):
         """Test mapping for Claude Opus 4.1"""
-        adapter = ClaudeCodeAdapter()
-        result = adapter._map_to_vertex_model("claude-opus-4-1")
+        result = map_to_vertex_model("claude-opus-4-1")
         assert result == "claude-opus-4-1@20250805"
 
     def test_map_sonnet_4_5(self):
         """Test mapping for Claude Sonnet 4.5"""
-        adapter = ClaudeCodeAdapter()
-        result = adapter._map_to_vertex_model("claude-sonnet-4-5")
+        result = map_to_vertex_model("claude-sonnet-4-5")
        assert result == "claude-sonnet-4-5@20250929"
 
     def test_map_haiku_4_5(self):
         """Test mapping for Claude Haiku 4.5"""
-        adapter = ClaudeCodeAdapter()
-        result = adapter._map_to_vertex_model("claude-haiku-4-5")
+        result = map_to_vertex_model("claude-haiku-4-5")
         assert result == "claude-haiku-4-5@20251001"
 
     def test_unknown_model_returns_unchanged(self):
         """Test that unknown model names are returned unchanged"""
-        adapter = ClaudeCodeAdapter()
         unknown_model = "claude-unknown-model-99"
-        result = adapter._map_to_vertex_model(unknown_model)
+        result = map_to_vertex_model(unknown_model)
         assert result == unknown_model
 
     def test_empty_string_returns_unchanged(self):
         """Test that empty string is returned unchanged"""
-        adapter = ClaudeCodeAdapter()
-        result = adapter._map_to_vertex_model("")
+        result = map_to_vertex_model("")
         assert result == ""
 
     def test_case_sensitive_mapping(self):
         """Test that model mapping is case-sensitive"""
-        adapter = ClaudeCodeAdapter()
+
         # Uppercase should not match
-        result = adapter._map_to_vertex_model("CLAUDE-OPUS-4-1")
+        result = map_to_vertex_model("CLAUDE-OPUS-4-1")
         assert result == "CLAUDE-OPUS-4-1"  # Should return unchanged
 
     def test_whitespace_in_model_name(self):
         """Test handling of whitespace in model names"""
-        adapter = ClaudeCodeAdapter()
+
         # Model name with whitespace should not match
-        result = adapter._map_to_vertex_model(" claude-opus-4-1 ")
+        result = map_to_vertex_model(" claude-opus-4-1 ")
         assert result == " claude-opus-4-1 "  # Should return unchanged
 
     def test_partial_model_name_no_match(self):
         """Test that partial model names don't match"""
-        adapter = ClaudeCodeAdapter()
-        result = adapter._map_to_vertex_model("claude-opus")
+        result = map_to_vertex_model("claude-opus")
         assert result == "claude-opus"  # Should return unchanged
 
     def test_vertex_model_id_passthrough(self):
         """Test that Vertex AI model IDs are returned unchanged"""
-        adapter = ClaudeCodeAdapter()
         vertex_id = "claude-opus-4-1@20250805"
-        result = adapter._map_to_vertex_model(vertex_id)
+        result = map_to_vertex_model(vertex_id)
         # If already a Vertex ID, should return unchanged
         assert result == vertex_id
 
     def test_all_frontend_models_have_mapping(self):
         """Test that all models from frontend dropdown have valid mappings"""
-        adapter = ClaudeCodeAdapter()
+
         # These are the exact model values from the frontend dropdown
         frontend_models = [
             "claude-sonnet-4-5",
-            "claude-opus-4-6",
             "claude-opus-4-5",
             "claude-opus-4-1",
             "claude-haiku-4-5",
@@ -101,33 +92,31 @@ def test_all_frontend_models_have_mapping(self):
 
         expected_mappings = {
             "claude-sonnet-4-5": "claude-sonnet-4-5@20250929",
-            "claude-opus-4-6": "claude-opus-4-6",
             "claude-opus-4-5": "claude-opus-4-5@20251101",
             "claude-opus-4-1": "claude-opus-4-1@20250805",
             "claude-haiku-4-5": "claude-haiku-4-5@20251001",
         }
 
         for model in frontend_models:
-            result = adapter._map_to_vertex_model(model)
+            result = map_to_vertex_model(model)
             assert (
                 result == expected_mappings[model]
             ), f"Model {model} should map to {expected_mappings[model]}, got {result}"
 
     def test_mapping_includes_version_date(self):
-        """Test that mapped models include version dates (except Opus 4.6)"""
-        adapter = ClaudeCodeAdapter()
+        """Test that all mapped models include version dates"""
+
-        # Opus 4.6 is the exception - uses simplified naming without @date
-        models_with_dates = [
+        models = [
             "claude-opus-4-5",
             "claude-opus-4-1",
             "claude-sonnet-4-5",
             "claude-haiku-4-5",
         ]
 
-        for model in models_with_dates:
-            result = adapter._map_to_vertex_model(model)
-            # All Vertex AI models (except Opus 4.6) should have @YYYYMMDD format
+        for model in models:
+            result = map_to_vertex_model(model)
+            # All Vertex AI models should have @YYYYMMDD format
             assert "@" in result, f"Mapped model {result} should include @ version date"
             assert (
                 len(result.split("@")) == 2
@@ -140,34 +129,27 @@ def test_mapping_includes_version_date(self):
                 version_date.isdigit()
             ), f"Version date {version_date} should be all digits"
 
-    def test_opus_4_6_no_date_suffix(self):
-        """Test that Opus 4.6 uses simplified naming (no @date suffix)"""
-        adapter = ClaudeCodeAdapter()
-        result = adapter._map_to_vertex_model("claude-opus-4-6")
-        assert result == "claude-opus-4-6"
-        assert "@" not in result, "Opus 4.6 should NOT have @date suffix"
-
     def test_none_input_handling(self):
         """Test that None input raises TypeError (invalid type per signature)"""
-        adapter = ClaudeCodeAdapter()
+
         # Function signature specifies str -> str, so None should raise
         with pytest.raises((TypeError, AttributeError)):
-            adapter._map_to_vertex_model(None)  # type: ignore[arg-type]
+            map_to_vertex_model(None)  # type: ignore[arg-type]
 
     def test_numeric_input_handling(self):
         """Test that numeric input raises TypeError (invalid type per signature)"""
-        adapter = ClaudeCodeAdapter()
+
         # Function signature specifies str -> str, so int should raise
        with pytest.raises((TypeError, AttributeError)):
-            adapter._map_to_vertex_model(123)  # type: ignore[arg-type]
+            map_to_vertex_model(123)  # type: ignore[arg-type]
 
     def test_mapping_consistency(self):
         """Test that mapping is consistent across multiple calls"""
-        adapter = ClaudeCodeAdapter()
+
         model = "claude-sonnet-4-5"
 
         # Call multiple times
-        results = [adapter._map_to_vertex_model(model) for _ in range(5)]
+        results = [map_to_vertex_model(model) for _ in range(5)]
 
         # All results should be identical
         assert all(r == results[0] for r in results)
@@ -179,11 +161,10 @@ class TestModelMappingIntegration:
 
     def test_mapping_matches_available_vertex_models(self):
         """Test that mapped model IDs match the expected Vertex AI format"""
-        adapter = ClaudeCodeAdapter()
 
-        # Expected Vertex AI model ID format: model-name@YYYYMMDD (except Opus 4.6)
+
+        # Expected Vertex AI model ID format: model-name@YYYYMMDD
         models_to_test = [
-            ("claude-opus-4-6", "claude-opus-4-6"),
             ("claude-opus-4-5", "claude-opus-4-5@20251101"),
             ("claude-opus-4-1", "claude-opus-4-1@20250805"),
             ("claude-sonnet-4-5", "claude-sonnet-4-5@20250929"),
@@ -191,78 +172,59 @@ def test_mapping_matches_available_vertex_models(self):
         ]
 
         for input_model, expected_vertex_id in models_to_test:
-            result = adapter._map_to_vertex_model(input_model)
+            result = map_to_vertex_model(input_model)
             assert (
                 result == expected_vertex_id
             ), f"Expected {input_model} to map to {expected_vertex_id}, got {result}"
 
     def test_ui_to_vertex_round_trip(self):
         """Test that UI model selection properly maps to Vertex AI"""
-        adapter = ClaudeCodeAdapter()
+
         # Simulate user selecting from UI dropdown
         ui_selections = [
             "claude-sonnet-4-5",  # User selects Sonnet 4.5
-            "claude-opus-4-6",  # User selects Opus 4.6 (newest)
             "claude-opus-4-5",  # User selects Opus 4.5
             "claude-opus-4-1",  # User selects Opus 4.1
             "claude-haiku-4-5",  # User selects Haiku 4.5
         ]
 
         for selection in ui_selections:
-            vertex_model = adapter._map_to_vertex_model(selection)
+            vertex_model = map_to_vertex_model(selection)
 
             # Verify it maps to a valid Vertex AI model ID
             assert vertex_model.startswith("claude-")
-
-            # Opus 4.6 is the exception - no @date suffix
-            if selection == "claude-opus-4-6":
-                assert "@" not in vertex_model
-            else:
-                assert "@" in vertex_model
+            assert "@" in vertex_model
 
             # Verify the base model name is preserved
-            if "@" in vertex_model:
-                base_name = vertex_model.split("@")[0]
-                assert selection in vertex_model or base_name in selection
-            else:
-                assert selection == vertex_model
+            base_name = vertex_model.split("@")[0]
+            assert selection in vertex_model or base_name in selection
 
     def test_end_to_end_vertex_mapping_flow(self):
         """Test complete flow: UI selection → model mapping → Vertex AI call"""
-        adapter = ClaudeCodeAdapter()
+
         # Simulate complete flow for each model
         test_scenarios = [
-            {
-                "ui_selection": "claude-opus-4-6",
-                "expected_vertex_id": "claude-opus-4-6",
-                "description": "Newest Opus model (simplified naming)",
-                "has_date_suffix": False,
-            },
             {
                 "ui_selection": "claude-opus-4-5",
                 "expected_vertex_id": "claude-opus-4-5@20251101",
                 "description": "Latest Opus model",
-                "has_date_suffix": True,
             },
             {
                 "ui_selection": "claude-opus-4-1",
                 "expected_vertex_id": "claude-opus-4-1@20250805",
                 "description": "Previous Opus model",
-                "has_date_suffix": True,
             },
             {
                 "ui_selection": "claude-sonnet-4-5",
                 "expected_vertex_id": "claude-sonnet-4-5@20250929",
                 "description": "Balanced model",
-                "has_date_suffix": True,
             },
             {
                 "ui_selection": "claude-haiku-4-5",
                 "expected_vertex_id": "claude-haiku-4-5@20251001",
                 "description": "Fastest model",
-                "has_date_suffix": True,
             },
         ]
 
@@ -271,7 +233,7 @@ def test_end_to_end_vertex_mapping_flow(self):
             ui_model = scenario["ui_selection"]
 
             # Step 2: Backend maps to Vertex AI model ID
-            vertex_model_id = adapter._map_to_vertex_model(ui_model)
+            vertex_model_id = map_to_vertex_model(ui_model)
 
             # Step 3: Verify correct mapping
             assert (
@@ -279,27 +241,21 @@ def test_end_to_end_vertex_mapping_flow(self):
             ), f"{scenario['description']}: Expected {scenario['expected_vertex_id']}, got {vertex_model_id}"
 
             # Step 4: Verify Vertex AI model ID format is valid
-            if scenario["has_date_suffix"]:
-                assert "@" in vertex_model_id
-                parts = vertex_model_id.split("@")
-                assert len(parts) == 2
-                model_name, version_date = parts
-                assert model_name.startswith("claude-")
-                assert len(version_date) == 8  # YYYYMMDD format
-                assert version_date.isdigit()
-            else:
-                # Opus 4.6 uses simplified naming - no @date suffix
-                assert "@" not in vertex_model_id
-                assert vertex_model_id.startswith("claude-")
+            assert "@" in vertex_model_id
+            parts = vertex_model_id.split("@")
+            assert len(parts) == 2
+            model_name, version_date = parts
+            assert model_name.startswith("claude-")
+            assert len(version_date) == 8  # YYYYMMDD format
+            assert version_date.isdigit()
 
     def test_model_ordering_consistency(self):
         """Test that model ordering is consistent between frontend and backend"""
-        adapter = ClaudeCodeAdapter()
 
-        # Expected ordering: Sonnet → Opus 4.6 → Opus 4.5 → Opus 4.1 → Haiku (matches frontend dropdown)
+
+        # Expected ordering: Sonnet → Opus 4.5 → Opus 4.1 → Haiku (matches frontend dropdown)
         expected_order = [
             "claude-sonnet-4-5",
-            "claude-opus-4-6",
             "claude-opus-4-5",
             "claude-opus-4-1",
             "claude-haiku-4-5",
@@ -307,20 +263,11 @@ def test_model_ordering_consistency(self):
 
         # Verify all models map successfully in order
         for model in expected_order:
-            vertex_id = adapter._map_to_vertex_model(model)
-            # Opus 4.6 is the exception - no @date suffix
-            if model == "claude-opus-4-6":
-                assert (
-                    "@" not in vertex_id
-                ), f"Model {model} should use simplified naming"
-            else:
-                assert (
-                    "@" in vertex_id
-                ), f"Model {model} should map to valid Vertex AI ID"
+            vertex_id = map_to_vertex_model(model)
+            assert "@" in vertex_id, f"Model {model} should map to valid Vertex AI ID"
 
         # Verify ordering matches frontend dropdown
         assert expected_order[0] == "claude-sonnet-4-5"  # Balanced (default)
-        assert expected_order[1] == "claude-opus-4-6"  # Newest Opus
-        assert expected_order[2] == "claude-opus-4-5"  # Latest Opus
-        assert expected_order[3] == "claude-opus-4-1"  # Previous Opus
-        assert expected_order[4] == "claude-haiku-4-5"  # Fastest
+        assert expected_order[1] == "claude-opus-4-5"  # Latest Opus
+        assert expected_order[2] == "claude-opus-4-1"  # Previous Opus
+        assert expected_order[3] == "claude-haiku-4-5"  # Fastest
"claude-opus-4-1" # Previous Opus + assert expected_order[3] == "claude-haiku-4-5" # Fastest diff --git a/components/runners/claude-code-runner/tests/test_wrapper_vertex.py b/components/runners/claude-code-runner/tests/test_wrapper_vertex.py index bd14180e3..e5829f36f 100644 --- a/components/runners/claude-code-runner/tests/test_wrapper_vertex.py +++ b/components/runners/claude-code-runner/tests/test_wrapper_vertex.py @@ -1,17 +1,24 @@ """ -Test cases for wrapper._setup_vertex_credentials() +Test cases for auth.setup_vertex_credentials() This module tests all error cases and validation logic for Vertex AI credential setup. """ import asyncio import os +import sys import tempfile from pathlib import Path from unittest.mock import AsyncMock, MagicMock, patch import pytest -from claude_code_runner.wrapper import ClaudeCodeWrapper + +# Add parent directory to path +runner_dir = Path(__file__).parent.parent +if str(runner_dir) not in sys.path: + sys.path.insert(0, str(runner_dir)) + +from auth import setup_vertex_credentials # type: ignore[import] class TestSetupVertexCredentials: @@ -48,10 +55,8 @@ async def test_success_all_valid_credentials( "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) - # Execute - result = await wrapper._setup_vertex_credentials() + result = await setup_vertex_credentials(mock_context) # Verify assert result is not None @@ -71,11 +76,11 @@ async def test_error_missing_google_application_credentials(self, mock_context): "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute and verify with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "GOOGLE_APPLICATION_CREDENTIALS" in str(exc_info.value) assert "not set" in str(exc_info.value) @@ -90,11 +95,11 @@ async def test_error_empty_google_application_credentials(self, mock_context): "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute and verify with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "GOOGLE_APPLICATION_CREDENTIALS" in str(exc_info.value) @@ -109,11 +114,11 @@ async def test_error_missing_anthropic_vertex_project_id( "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute and verify with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "ANTHROPIC_VERTEX_PROJECT_ID" in str(exc_info.value) assert "not set" in str(exc_info.value) @@ -130,11 +135,11 @@ async def test_error_empty_anthropic_vertex_project_id( "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute and verify with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "ANTHROPIC_VERTEX_PROJECT_ID" in str(exc_info.value) @@ -149,11 +154,11 @@ async def test_error_missing_cloud_ml_region( "ANTHROPIC_VERTEX_PROJECT_ID": "test-project-123", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute and verify with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "CLOUD_ML_REGION" in str(exc_info.value) assert "not set" in str(exc_info.value) @@ -170,11 +175,11 @@ async def 
test_error_empty_cloud_ml_region( "CLOUD_ML_REGION": "", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute and verify with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "CLOUD_ML_REGION" in str(exc_info.value) @@ -189,11 +194,11 @@ async def test_error_credentials_file_does_not_exist(self, mock_context): "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute and verify with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "Service account file" in str(exc_info.value) assert "does not exist" in str(exc_info.value) @@ -205,11 +210,11 @@ async def test_error_all_env_vars_missing(self, mock_context): # Setup - all vars missing mock_context.get_env.side_effect = lambda key: None - wrapper = ClaudeCodeWrapper(mock_context) + # Execute and verify - should fail on first check with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "GOOGLE_APPLICATION_CREDENTIALS" in str(exc_info.value) @@ -222,11 +227,11 @@ async def test_validation_order_checks_credentials_path_first(self, mock_context "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Should fail on GOOGLE_APPLICATION_CREDENTIALS first with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "GOOGLE_APPLICATION_CREDENTIALS" in str(exc_info.value) @@ -241,11 +246,11 @@ async def test_validation_order_checks_project_id_second( "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Should fail on ANTHROPIC_VERTEX_PROJECT_ID second with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "ANTHROPIC_VERTEX_PROJECT_ID" in str(exc_info.value) @@ -260,11 +265,11 @@ async def test_validation_order_checks_region_third( "ANTHROPIC_VERTEX_PROJECT_ID": "test-project-123", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Should fail on CLOUD_ML_REGION third with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "CLOUD_ML_REGION" in str(exc_info.value) @@ -279,11 +284,11 @@ async def test_validation_checks_file_existence_last(self, mock_context): "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Should fail on file existence check last with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "Service account file" in str(exc_info.value) assert "does not exist" in str(exc_info.value) @@ -300,10 +305,10 @@ async def test_logging_output_includes_config_details( "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) # Verify logging was called with details assert mock_context.send_log.called @@ -330,11 +335,11 @@ async def test_whitespace_in_env_vars_is_not_trimmed( "CLOUD_ML_REGION": " us-central1 ", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute - depending on implementation, this might succeed or fail # If 
the code doesn't strip whitespace, the values should work - result = await wrapper._setup_vertex_credentials() + result = await setup_vertex_credentials(mock_context) # Verify that whitespace is preserved (not stripped) assert result["project_id"] == " test-project-123 " @@ -350,11 +355,11 @@ async def test_none_value_from_get_env(self, mock_context, temp_credentials_file key ) # Returns None for other keys - wrapper = ClaudeCodeWrapper(mock_context) + # Should fail when checking for None values with pytest.raises(RuntimeError) as exc_info: - await wrapper._setup_vertex_credentials() + await setup_vertex_credentials(mock_context) assert "not set" in str(exc_info.value) @@ -371,12 +376,12 @@ async def test_directory_instead_of_file(self, mock_context, tmp_path): "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute and verify # Path.exists() returns True for directories, so this might not fail # depending on implementation - result = await wrapper._setup_vertex_credentials() + result = await setup_vertex_credentials(mock_context) # If implementation only checks exists(), this will pass # If it checks is_file(), this should fail @@ -399,10 +404,10 @@ async def test_relative_path_credentials_file(self, mock_context): "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute - should work if file exists in current directory - result = await wrapper._setup_vertex_credentials() + result = await setup_vertex_credentials(mock_context) assert result is not None assert result["credentials_path"] == relative_path @@ -424,10 +429,8 @@ async def test_special_characters_in_project_id( "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) - # Execute - result = await wrapper._setup_vertex_credentials() + result = await setup_vertex_credentials(mock_context) # Should accept special characters assert result["project_id"] == special_project_id @@ -452,10 +455,10 @@ async def test_international_region_codes( "CLOUD_ML_REGION": region, }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) + # Execute - result = await wrapper._setup_vertex_credentials() + result = await setup_vertex_credentials(mock_context) # Should accept all valid region codes assert result["region"] == region @@ -470,10 +473,8 @@ async def test_return_value_structure(self, mock_context, temp_credentials_file) "CLOUD_ML_REGION": "us-central1", }.get(key) - wrapper = ClaudeCodeWrapper(mock_context) - # Execute - result = await wrapper._setup_vertex_credentials() + result = await setup_vertex_credentials(mock_context) # Verify structure assert isinstance(result, dict) @@ -506,10 +507,8 @@ async def test_integration_with_real_file_creation(self): ) context.send_log = AsyncMock() - wrapper = ClaudeCodeWrapper(context) - # Execute - result = await wrapper._setup_vertex_credentials() + result = await setup_vertex_credentials(context) # Verify assert Path(temp_path).exists() @@ -544,9 +543,8 @@ async def test_concurrent_calls_to_setup_vertex_credentials(self, tmp_path): contexts.append(context) # Execute concurrently - wrappers = [ClaudeCodeWrapper(ctx) for ctx in contexts] results = await asyncio.gather( - *[wrapper._setup_vertex_credentials() for wrapper in wrappers] + *[setup_vertex_credentials(ctx) for ctx in contexts] ) # Verify all succeeded diff --git a/components/runners/claude-code-runner/tools/__init__.py b/components/runners/claude-code-runner/tools/__init__.py new file mode 100644 index 000000000..0c732c8f2 --- 
/dev/null +++ b/components/runners/claude-code-runner/tools/__init__.py @@ -0,0 +1,15 @@ +""" +MCP tool definitions for the Claude Code runner. + +Tools are created dynamically per-run and registered as in-process +MCP servers alongside the Claude Agent SDK. +""" + +from tools.rubric import create_rubric_mcp_tool, load_rubric_content +from tools.session import create_restart_session_tool + +__all__ = [ + "create_restart_session_tool", + "load_rubric_content", + "create_rubric_mcp_tool", +] diff --git a/components/runners/claude-code-runner/tools/rubric.py b/components/runners/claude-code-runner/tools/rubric.py new file mode 100644 index 000000000..1a4d08df7 --- /dev/null +++ b/components/runners/claude-code-runner/tools/rubric.py @@ -0,0 +1,218 @@ +""" +Rubric evaluation MCP tool — logs a single score to Langfuse. + +Scans the workflow's .ambient/ folder for a rubric.md file, then creates +an evaluate_rubric tool that accepts a score, comment, and metadata. +The tool makes one ``langfuse.create_score()`` call with the trace ID +from the current observability context. +""" + +import json as _json +import logging +import os +from pathlib import Path +from typing import Any + +logger = logging.getLogger(__name__) + + +def load_rubric_content(cwd_path: str) -> tuple: + """Load rubric content from the workflow's .ambient/ folder. + + Looks for ``.ambient/rubric.md`` — a single markdown file containing + the evaluation criteria. + + Returns: + Tuple of ``(rubric_content, rubric_config)`` where rubric_content + is the markdown string and rubric_config is the ``rubric`` key + from ambient.json. Returns ``(None, {})`` if no rubric found. + """ + ambient_dir = Path(cwd_path) / ".ambient" + rubric_content = None + + single_rubric = ambient_dir / "rubric.md" + if single_rubric.exists() and single_rubric.is_file(): + try: + rubric_content = single_rubric.read_text(encoding="utf-8") + logger.info(f"Loaded rubric from {single_rubric}") + except Exception as e: + logger.error(f"Failed to read rubric.md: {e}") + + rubric_config: dict = {} + try: + config_path = ambient_dir / "ambient.json" + if config_path.exists(): + with open(config_path, "r") as f: + config = _json.load(f) + rubric_config = config.get("rubric", {}) + except Exception as e: + logger.error(f"Failed to load rubric config from ambient.json: {e}") + + return rubric_content, rubric_config + + +def create_rubric_mcp_tool( + rubric_content: str, + rubric_config: dict, + obs: Any, + session_id: str, + sdk_tool_decorator, +): + """Create a dynamic MCP tool for rubric-based evaluation. + + The tool accepts a score, comment, and optional metadata, then makes + a single ``langfuse.create_score()`` call. The ``rubric.schema`` from + ambient.json is passed through as the ``metadata`` field's JSON Schema + in the tool's input_schema. + + Args: + rubric_content: Markdown rubric instructions (for reference only). + rubric_config: Config dict with ``activationPrompt`` and ``schema``. + obs: ObservabilityManager instance for trace ID. + session_id: Current session ID. + sdk_tool_decorator: The ``tool`` decorator from ``claude_agent_sdk``. + + Returns: + Decorated async tool function. 
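+
+    Example ambient.json rubric block (illustrative — the "clarity"
+    property is hypothetical; ``schema`` is passed through verbatim as
+    the ``metadata`` field's JSON Schema):
+
+        {
+          "rubric": {
+            "activationPrompt": "Evaluate the output against rubric.md.",
+            "schema": {
+              "type": "object",
+              "properties": {"clarity": {"type": "number"}}
+            }
+          }
+        }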
+ """ + # JSON Schema format per Claude Agent SDK docs: + # https://platform.claude.com/docs/en/agent-sdk/python#tool + user_schema = rubric_config.get("schema", {}) + + properties: dict = { + "score": {"type": "number", "description": "Overall evaluation score."}, + "comment": {"type": "string", "description": "Evaluation reasoning and commentary."}, + } + if user_schema: + properties["metadata"] = user_schema + + required = ["score", "comment"] + if user_schema: + required.append("metadata") + + input_schema: dict = { + "type": "object", + "properties": properties, + "required": required, + } + + tool_description = ( + "Log a rubric evaluation score to Langfuse. " + "Read .ambient/rubric.md FIRST, evaluate the output " + "against the criteria, then call this tool with your " + "score, comment, and metadata." + ) + + # Capture references for closure + _obs = obs + _session_id = session_id + + @sdk_tool_decorator( + "evaluate_rubric", + tool_description, + input_schema, + ) + async def evaluate_rubric_tool(args: dict) -> dict: + """Log a single rubric evaluation score to Langfuse.""" + score = args.get("score") + comment = args.get("comment", "") + metadata = args.get("metadata") + + # Log to Langfuse + success, error = _log_to_langfuse( + score=score, + comment=comment, + metadata=metadata, + obs=_obs, + session_id=_session_id, + ) + + if success: + return { + "content": [ + {"type": "text", "text": f"Score {score} logged to Langfuse."} + ] + } + else: + return { + "content": [ + {"type": "text", "text": f"Failed to log score: {error}"} + ], + "isError": True, + } + + return evaluate_rubric_tool + + +def _log_to_langfuse( + score: float | None, + comment: str, + metadata: Any, + obs: Any, + session_id: str, +) -> tuple[bool, str | None]: + """Make a single langfuse.create_score() call. + + Uses the existing Langfuse client from the ObservabilityManager + if available, otherwise creates a new one. + + Returns: + (True, None) on success, (False, error_message) on failure. + """ + try: + # Try to reuse the session's Langfuse client + langfuse_client = getattr(obs, "langfuse_client", None) if obs else None + + if not langfuse_client: + # Fall back to creating our own + langfuse_enabled = os.getenv( + "LANGFUSE_ENABLED", "" + ).strip().lower() in ("1", "true", "yes") + if not langfuse_enabled: + return False, "Langfuse not enabled." + + from langfuse import Langfuse + + public_key = os.getenv("LANGFUSE_PUBLIC_KEY", "").strip() + secret_key = os.getenv("LANGFUSE_SECRET_KEY", "").strip() + host = os.getenv("LANGFUSE_HOST", "").strip() + + if not (public_key and secret_key and host): + return False, "Langfuse credentials missing." + + langfuse_client = Langfuse( + public_key=public_key, + secret_key=secret_key, + host=host, + ) + + trace_id = obs.get_current_trace_id() if obs else None + + if score is None: + return False, "Score value is required (got None)." + + kwargs: dict = { + "name": "rubric-evaluation", + "value": score, + "data_type": "NUMERIC", + "comment": comment[:500] if comment else None, + "metadata": metadata, + } + if trace_id: + kwargs["trace_id"] = trace_id + + langfuse_client.create_score(**kwargs) + langfuse_client.flush() + + logger.info( + f"Rubric score logged to Langfuse: " + f"value={score}, trace_id={trace_id}" + ) + return True, None + + except ImportError: + return False, "Langfuse package not installed." 
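+    # Any other failure (network, auth, unexpected SDK behaviour) is
+    # returned as a (False, reason) tuple rather than raised, so the
+    # agent sees the reason in the tool result.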
+ except Exception as e: + msg = str(e) + logger.error(f"Failed to log rubric score to Langfuse: {msg}") + return False, msg diff --git a/components/runners/claude-code-runner/tools/session.py b/components/runners/claude-code-runner/tools/session.py new file mode 100644 index 000000000..0c61c94ec --- /dev/null +++ b/components/runners/claude-code-runner/tools/session.py @@ -0,0 +1,46 @@ +""" +Session control MCP tool — allows Claude to request a session restart. +""" + +import logging + +from prompts import RESTART_TOOL_DESCRIPTION + +logger = logging.getLogger(__name__) + + +def create_restart_session_tool(adapter_ref, sdk_tool_decorator): + """Create the restart_session MCP tool. + + Args: + adapter_ref: Reference to the ClaudeCodeAdapter instance + (used to set _restart_requested flag). + sdk_tool_decorator: The ``tool`` decorator from ``claude_agent_sdk``. + + Returns: + Decorated async tool function. + """ + + @sdk_tool_decorator( + "restart_session", + RESTART_TOOL_DESCRIPTION, + {}, + ) + async def restart_session_tool(args: dict) -> dict: + """Tool that allows Claude to request a session restart.""" + adapter_ref._restart_requested = True + logger.info("🔄 Session restart requested by Claude via MCP tool") + return { + "content": [ + { + "type": "text", + "text": ( + "Session restart has been requested. The current run " + "will complete and a fresh session will be established. " + "Your conversation context will be preserved on disk." + ), + } + ] + } + + return restart_session_tool diff --git a/components/runners/claude-code-runner/utils.py b/components/runners/claude-code-runner/utils.py new file mode 100644 index 000000000..55b4c63d2 --- /dev/null +++ b/components/runners/claude-code-runner/utils.py @@ -0,0 +1,174 @@ +""" +General utility functions for the Claude Code runner. + +Pure functions with no business-logic dependencies — URL parsing, +secret redaction, subprocess helpers, environment variable expansion. +""" + +import asyncio +import logging +import os +import re +from datetime import datetime, timezone +from typing import Any +from urllib.parse import urlparse, urlunparse + +logger = logging.getLogger(__name__) + + +def timestamp() -> str: + """Return current UTC timestamp in ISO format.""" + return datetime.now(timezone.utc).isoformat() + + +def redact_secrets(text: str) -> str: + """Redact tokens and secrets from text for safe logging.""" + if not text: + return text + + text = re.sub(r"gh[pousr]_[a-zA-Z0-9]{36,255}", "gh*_***REDACTED***", text) + text = re.sub(r"sk-ant-[a-zA-Z0-9\-_]{30,200}", "sk-ant-***REDACTED***", text) + text = re.sub(r"pk-lf-[a-zA-Z0-9\-_]{10,100}", "pk-lf-***REDACTED***", text) + text = re.sub(r"sk-lf-[a-zA-Z0-9\-_]{10,100}", "sk-lf-***REDACTED***", text) + text = re.sub( + r"x-access-token:[^@\s]+@", "x-access-token:***REDACTED***@", text + ) + text = re.sub(r"oauth2:[^@\s]+@", "oauth2:***REDACTED***@", text) + text = re.sub(r"://[^:@\s]+:[^@\s]+@", "://***REDACTED***@", text) + text = re.sub( + r'(ANTHROPIC_API_KEY|LANGFUSE_SECRET_KEY|LANGFUSE_PUBLIC_KEY|BOT_TOKEN|GIT_TOKEN)\s*=\s*[^\s\'"]+', + r"\1=***REDACTED***", + text, + ) + return text + + +def url_with_token(url: str, token: str) -> str: + """Add authentication token to a git URL. + + Uses x-access-token for GitHub, oauth2 for GitLab. 
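+
+    Example (illustrative token value):
+
+        url_with_token("https://github.com/org/repo.git", "tok123")
+        # -> "https://x-access-token:tok123@github.com/org/repo.git"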
+ """ + if not token or not url.lower().startswith("http"): + return url + try: + parsed = urlparse(url) + netloc = parsed.netloc + if "@" in netloc: + netloc = netloc.split("@", 1)[1] + + hostname = parsed.hostname or "" + if "gitlab" in hostname.lower(): + auth = f"oauth2:{token}@" + else: + auth = f"x-access-token:{token}@" + + new_netloc = auth + netloc + return urlunparse( + ( + parsed.scheme, + new_netloc, + parsed.path, + parsed.params, + parsed.query, + parsed.fragment, + ) + ) + except Exception: + return url + + +def parse_owner_repo(url: str) -> tuple[str, str, str]: + """Return (owner, name, host) from various git URL formats. + + Supports HTTPS, SSH, and shorthand owner/repo formats. + """ + s = (url or "").strip() + s = s.removesuffix(".git") + host = "github.com" + try: + if s.startswith("http://") or s.startswith("https://"): + p = urlparse(s) + host = p.netloc + parts = [pt for pt in p.path.split("/") if pt] + if len(parts) >= 2: + return parts[0], parts[1], host + if s.startswith("git@") or ":" in s: + s2 = s + if s2.startswith("git@"): + s2 = s2.replace(":", "/", 1) + s2 = s2.replace("git@", "ssh://git@", 1) + p = urlparse(s2) + host = p.hostname or host + parts = [pt for pt in (p.path or "").split("/") if pt] + if len(parts) >= 2: + return parts[-2], parts[-1], host + parts = [pt for pt in s.split("/") if pt] + if len(parts) == 2: + return parts[0], parts[1], host + except Exception: + return "", "", host + return "", "", host + + +def expand_env_vars(value: Any) -> Any: + """Recursively expand ${VAR} and ${VAR:-default} patterns in config values.""" + if isinstance(value, str): + pattern = r"\$\{([^}:]+)(?::-([^}]*))?\}" + + def replace_var(match): + var_name = match.group(1) + default_val = match.group(2) if match.group(2) is not None else "" + return os.environ.get(var_name, default_val) + + return re.sub(pattern, replace_var, value) + elif isinstance(value, dict): + return {k: expand_env_vars(v) for k, v in value.items()} + elif isinstance(value, list): + return [expand_env_vars(item) for item in value] + return value + + +async def run_cmd( + cmd: list, + cwd: str | None = None, + capture_stdout: bool = False, + ignore_errors: bool = False, +) -> str: + """Run a subprocess command asynchronously. + + Args: + cmd: Command and arguments list. + cwd: Working directory (defaults to current directory). + capture_stdout: If True, return stdout text. + ignore_errors: If True, don't raise on non-zero exit. + + Returns: + stdout text if capture_stdout is True, else empty string. + + Raises: + RuntimeError: If command fails and ignore_errors is False. 
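+
+    Example (illustrative):
+
+        out = await run_cmd(["git", "status"], cwd="/workspace",
+                            capture_stdout=True)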
+ """ + cmd_safe = [redact_secrets(str(arg)) for arg in cmd] + logger.info(f"Running command: {' '.join(cmd_safe)}") + + proc = await asyncio.create_subprocess_exec( + *cmd, + stdout=asyncio.subprocess.PIPE, + stderr=asyncio.subprocess.PIPE, + cwd=cwd, + ) + stdout_data, stderr_data = await proc.communicate() + stdout_text = stdout_data.decode("utf-8", errors="replace") + stderr_text = stderr_data.decode("utf-8", errors="replace") + + if stdout_text.strip(): + logger.info(f"Command stdout: {redact_secrets(stdout_text.strip())}") + if stderr_text.strip(): + logger.info(f"Command stderr: {redact_secrets(stderr_text.strip())}") + + if proc.returncode != 0 and not ignore_errors: + raise RuntimeError(stderr_text or f"Command failed: {' '.join(cmd_safe)}") + + if capture_stdout: + return stdout_text + return "" diff --git a/components/runners/claude-code-runner/workspace.py b/components/runners/claude-code-runner/workspace.py new file mode 100644 index 000000000..0b01e84aa --- /dev/null +++ b/components/runners/claude-code-runner/workspace.py @@ -0,0 +1,251 @@ +""" +Workspace and path management for the Claude Code runner. + +Handles workflow/repo directory setup, workspace validation, +and prerequisite checking for phase-based commands. +""" + +import logging +import os +from pathlib import Path +from typing import AsyncIterator +from urllib.parse import urlparse + +from context import RunnerContext +from utils import parse_owner_repo + +logger = logging.getLogger(__name__) + + +class PrerequisiteError(RuntimeError): + """Raised when slash-command prerequisites are missing.""" + + pass + + +def setup_workflow_paths( + context: RunnerContext, active_workflow_url: str, repos_cfg: list +) -> tuple[str, list, str]: + """Setup CWD and additional directories for workflow mode. 
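+
+    For a URL such as https://host/owner/demo-workflow.git (illustrative),
+    the derived name is "demo-workflow" and the CWD becomes
+    <workspace>/workflows/demo-workflow if that directory exists,
+    falling back to workflows/default otherwise.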
+ + Returns: + (cwd_path, additional_dirs, derived_workflow_name) + """ + add_dirs: list[str] = [] + derived_name = None + cwd_path = context.workspace_path + + try: + _owner, repo, _ = parse_owner_repo(active_workflow_url) + derived_name = repo or "" + if not derived_name: + p = urlparse(active_workflow_url) + parts = [pt for pt in (p.path or "").split("/") if pt] + if parts: + derived_name = parts[-1] + derived_name = (derived_name or "").removesuffix(".git").strip() + + if derived_name: + workflow_path = str( + Path(context.workspace_path) / "workflows" / derived_name + ) + if Path(workflow_path).exists(): + cwd_path = workflow_path + logger.info(f"Using workflow as CWD: {derived_name}") + else: + logger.warning( + f"Workflow directory not found: {workflow_path}, using default" + ) + cwd_path = str( + Path(context.workspace_path) / "workflows" / "default" + ) + else: + cwd_path = str( + Path(context.workspace_path) / "workflows" / "default" + ) + except Exception as e: + logger.warning(f"Failed to derive workflow name: {e}, using default") + cwd_path = str( + Path(context.workspace_path) / "workflows" / "default" + ) + + # Add all repos as additional directories + repos_base = Path(context.workspace_path) / "repos" + for r in repos_cfg: + name = (r.get("name") or "").strip() + if name: + repo_path = str(repos_base / name) + if repo_path not in add_dirs: + add_dirs.append(repo_path) + + # Add artifacts and file-uploads directories + artifacts_path = str(Path(context.workspace_path) / "artifacts") + if artifacts_path not in add_dirs: + add_dirs.append(artifacts_path) + + file_uploads_path = str(Path(context.workspace_path) / "file-uploads") + if file_uploads_path not in add_dirs: + add_dirs.append(file_uploads_path) + + return cwd_path, add_dirs, derived_name + + +def setup_multi_repo_paths( + context: RunnerContext, repos_cfg: list +) -> tuple[str, list]: + """Setup CWD and additional directories for multi-repo mode. + + Repos are cloned to /workspace/repos/{name} by both + hydrate.sh (init container) and clone_repo_at_runtime(). + + Returns: + (cwd_path, additional_dirs) + """ + add_dirs: list[str] = [] + repos_base = Path(context.workspace_path) / "repos" + + main_name = (os.getenv("MAIN_REPO_NAME") or "").strip() + if not main_name: + idx_raw = (os.getenv("MAIN_REPO_INDEX") or "").strip() + try: + idx_val = int(idx_raw) if idx_raw else 0 + except Exception: + idx_val = 0 + if idx_val < 0 or idx_val >= len(repos_cfg): + idx_val = 0 + main_name = (repos_cfg[idx_val].get("name") or "").strip() + + cwd_path = ( + str(repos_base / main_name) if main_name else context.workspace_path + ) + + for r in repos_cfg: + name = (r.get("name") or "").strip() + if not name: + continue + p = str(repos_base / name) + if p != cwd_path: + add_dirs.append(p) + + # Add artifacts and file-uploads directories + artifacts_path = str(Path(context.workspace_path) / "artifacts") + if artifacts_path not in add_dirs: + add_dirs.append(artifacts_path) + + file_uploads_path = str(Path(context.workspace_path) / "file-uploads") + if file_uploads_path not in add_dirs: + add_dirs.append(file_uploads_path) + + return cwd_path, add_dirs + + +async def prepare_workspace(context: RunnerContext) -> None: + """Validate workspace prepared by init container. + + The init-hydrate container handles downloading state from S3, + cloning repos, and cloning workflows. This just validates and logs. 
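+
+    Validation only counts hydrated files under .claude, artifacts, and
+    file-uploads and logs the result; nothing is downloaded or mutated.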
+ """ + workspace = Path(context.workspace_path) + logger.info(f"Validating workspace at {workspace}") + + hydrated_paths = [] + for path_name in [".claude", "artifacts", "file-uploads"]: + path_dir = workspace / path_name + if path_dir.exists(): + file_count = len([f for f in path_dir.rglob("*") if f.is_file()]) + if file_count > 0: + hydrated_paths.append(f"{path_name} ({file_count} files)") + + if hydrated_paths: + logger.info(f"Hydrated from S3: {', '.join(hydrated_paths)}") + else: + logger.info("No state hydrated (fresh session)") + + +async def validate_prerequisites(context: RunnerContext) -> None: + """Validate prerequisite files exist for phase-based slash commands. + + Raises: + PrerequisiteError: If a required file is missing. + """ + prompt = context.get_env("INITIAL_PROMPT", "") + if not prompt: + return + + prompt_lower = prompt.strip().lower() + + prerequisites = { + "/speckit.plan": ( + "spec.md", + "Specification file (spec.md) not found. Please run /speckit.specify first.", + ), + "/speckit.tasks": ( + "plan.md", + "Planning file (plan.md) not found. Please run /speckit.plan first.", + ), + "/speckit.implement": ( + "tasks.md", + "Tasks file (tasks.md) not found. Please run /speckit.tasks first.", + ), + } + + for cmd, (required_file, error_msg) in prerequisites.items(): + if prompt_lower.startswith(cmd): + workspace = Path(context.workspace_path) + found = False + + if (workspace / required_file).exists(): + found = True + break + + for subdir in workspace.rglob("specs/*/"): + if (subdir / required_file).exists(): + found = True + break + + if not found: + raise PrerequisiteError(error_msg) + break + + +async def initialize_workflow_if_set(context: RunnerContext) -> None: + """Validate workflow was cloned by init container.""" + active_workflow_url = (os.getenv("ACTIVE_WORKFLOW_GIT_URL") or "").strip() + if not active_workflow_url: + return + + try: + _owner, repo, _ = parse_owner_repo(active_workflow_url) + derived_name = repo or "" + if not derived_name: + p = urlparse(active_workflow_url) + parts = [pt for pt in (p.path or "").split("/") if pt] + if parts: + derived_name = parts[-1] + derived_name = (derived_name or "").removesuffix(".git").strip() + + if not derived_name: + logger.warning("Could not derive workflow name from URL") + return + + workspace = Path(context.workspace_path) + workflow_temp_dir = workspace / "workflows" / f"{derived_name}-clone-temp" + workflow_dir = workspace / "workflows" / derived_name + + if workflow_temp_dir.exists(): + logger.info( + f"Workflow {derived_name} cloned by init container " + f"at {workflow_temp_dir.name}" + ) + elif workflow_dir.exists(): + logger.info( + f"Workflow {derived_name} available at {workflow_dir.name}" + ) + else: + logger.warning( + f"Workflow {derived_name} not found " + "(init container may have failed to clone)" + ) + + except Exception as e: + logger.error(f"Failed to validate workflow: {e}") From f2451e42702b5e349ea92a8c04ad3ff66ce9f7c4 Mon Sep 17 00:00:00 2001 From: Gage Krumbach Date: Fri, 6 Feb 2026 12:36:01 -0600 Subject: [PATCH 2/4] feat: enhance integration status messaging and user guidance - Improved the session Integrations accordion with clearer naming and structure, separating workspace and global integrations. - Added a new GitHub card in the Global section, displaying project integration status. - Updated the create session modal to include integration status and links, preventing users from creating sessions without data connections. 
- Enhanced visual elements with status icons and descriptive tooltips for unconfigured integrations. - Provided explicit guidance for users on configuring integrations when data connections are not established. This update aims to streamline user experience and improve clarity in integration management. --- components/frontend/tsconfig.json | 30 ++++++++++++++++++++++++++++++ 1 file changed, 30 insertions(+) create mode 100644 components/frontend/tsconfig.json diff --git a/components/frontend/tsconfig.json b/components/frontend/tsconfig.json new file mode 100644 index 000000000..c1bd93ee4 --- /dev/null +++ b/components/frontend/tsconfig.json @@ -0,0 +1,30 @@ +{ + "compilerOptions": { + "target": "ES2017", + "lib": ["dom", "dom.iterable", "esnext"], + "allowJs": true, + "skipLibCheck": true, + "strict": true, + "noImplicitAny": true, + "strictNullChecks": true, + "noEmit": true, + "esModuleInterop": true, + "module": "esnext", + "moduleResolution": "bundler", + "resolveJsonModule": true, + "isolatedModules": true, + "jsx": "preserve", + "incremental": true, + "plugins": [ + { + "name": "next" + } + ], + "baseUrl": ".", + "paths": { + "@/*": ["./src/*"] + } + }, + "include": ["next-env.d.ts", "**/*.ts", "**/*.tsx", ".next/types/**/*.ts"], + "exclude": ["node_modules"] +} From 79c8e787c4867b34bee6b9f11b8f6a4e71534367 Mon Sep 17 00:00:00 2001 From: Gage Krumbach Date: Fri, 6 Feb 2026 14:06:23 -0600 Subject: [PATCH 3/4] feat: update integration status handling and enhance frontend components - Added FEEDBACK_URL environment variable to deployment configurations for frontend. - Refactored integration status handling in the frontend, replacing `useProjectIntegrationStatus` with `useIntegrationsStatus` for improved clarity and consistency. - Updated the Create Session dialog to reflect accurate integration statuses for GitHub, GitLab, and Google Workspace, enhancing user guidance. - Renamed and reorganized components related to MCP integrations for better structure and readability. - Enhanced the MCP server status retrieval process in the backend to provide more detailed information about server tools and annotations. This update aims to improve the user experience by providing clearer integration statuses and enhancing the overall structure of the frontend components. 
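
For reference, the reshaped /mcp/status payload now looks roughly like
this (illustrative server and tool names; the field set mirrors the
handler in main.py below):

    {
      "servers": [
        {
          "name": "mcp-atlassian",
          "displayName": "Atlassian MCP",
          "status": "connected",
          "version": "1.2.3",
          "tools": [
            {"name": "jira_search", "annotations": {"readOnly": true}}
          ]
        }
      ],
      "totalCount": 1
    }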
--- .github/workflows/components-build-deploy.yml | 6 +- .github/workflows/prod-release-deploy.yaml | 3 +- .../accordions/mcp-integrations-accordion.tsx | 551 ++++++++---------- .../[name]/sessions/[sessionName]/page.tsx | 12 +- .../src/components/create-session-dialog.tsx | 119 ++-- .../frontend/src/services/api/integrations.ts | 1 + .../frontend/src/services/api/sessions.ts | 21 +- components/runners/claude-code-runner/main.py | 104 ++-- 8 files changed, 404 insertions(+), 413 deletions(-) diff --git a/.github/workflows/components-build-deploy.yml b/.github/workflows/components-build-deploy.yml index 04baca254..3681bc3b1 100644 --- a/.github/workflows/components-build-deploy.yml +++ b/.github/workflows/components-build-deploy.yml @@ -265,7 +265,8 @@ jobs: run: | oc set env deployment/frontend -n ambient-code -c frontend \ GITHUB_APP_SLUG="ambient-code-stage" \ - VTEAM_VERSION="${{ github.sha }}" + VTEAM_VERSION="${{ github.sha }}" \ + FEEDBACK_URL="https://forms.gle/7XiWrvo6No922DUz6" - name: Update backend environment variables if: needs.detect-changes.outputs.backend == 'true' @@ -328,7 +329,8 @@ jobs: run: | oc set env deployment/frontend -n ambient-code -c frontend \ GITHUB_APP_SLUG="ambient-code-stage" \ - VTEAM_VERSION="${{ github.sha }}" + VTEAM_VERSION="${{ github.sha }}" \ + FEEDBACK_URL="https://forms.gle/7XiWrvo6No922DUz6" - name: Update backend environment variables run: | diff --git a/.github/workflows/prod-release-deploy.yaml b/.github/workflows/prod-release-deploy.yaml index e2e3235d6..694a755f4 100644 --- a/.github/workflows/prod-release-deploy.yaml +++ b/.github/workflows/prod-release-deploy.yaml @@ -265,7 +265,8 @@ jobs: run: | oc set env deployment/frontend -n ambient-code -c frontend \ GITHUB_APP_SLUG="ambient-code" \ - VTEAM_VERSION="${{ needs.release.outputs.new_tag }}" + VTEAM_VERSION="${{ needs.release.outputs.new_tag }}" \ + FEEDBACK_URL="https://forms.gle/7XiWrvo6No922DUz6" - name: Update backend environment variables run: | diff --git a/components/frontend/src/app/projects/[name]/sessions/[sessionName]/components/accordions/mcp-integrations-accordion.tsx b/components/frontend/src/app/projects/[name]/sessions/[sessionName]/components/accordions/mcp-integrations-accordion.tsx index d6da85ae8..cf4a1da17 100644 --- a/components/frontend/src/app/projects/[name]/sessions/[sessionName]/components/accordions/mcp-integrations-accordion.tsx +++ b/components/frontend/src/app/projects/[name]/sessions/[sessionName]/components/accordions/mcp-integrations-accordion.tsx @@ -1,9 +1,8 @@ 'use client' import { useState, useEffect } from 'react' -import type { ReactNode } from 'react' import Link from 'next/link' -import { Plug, CheckCircle2, XCircle, AlertCircle, AlertTriangle } from 'lucide-react' +import { Plug, Link2, CheckCircle2, XCircle, AlertCircle, AlertTriangle, Info, Check, X } from 'lucide-react' import { AccordionItem, AccordionTrigger, @@ -16,35 +15,32 @@ import { TooltipProvider, TooltipTrigger, } from '@/components/ui/tooltip' +import { + Popover, + PopoverContent, + PopoverTrigger, +} from '@/components/ui/popover' import { Skeleton } from '@/components/ui/skeleton' import { useMcpStatus } from '@/services/queries/use-mcp' -import { useProjectIntegrationStatus } from '@/services/queries/use-projects' import { useIntegrationsStatus } from '@/services/queries/use-integrations' -import type { McpServer } from '@/services/api/sessions' +import type { McpServer, McpTool } from '@/services/api/sessions' -type McpIntegrationsAccordionProps = { +// ─── MCP Servers 
Accordion ─────────────────────────────────────────────────── + +type McpServersAccordionProps = { projectName: string sessionName: string } -export function McpIntegrationsAccordion({ +export function McpServersAccordion({ projectName, sessionName, -}: McpIntegrationsAccordionProps) { +}: McpServersAccordionProps) { const [placeholderTimedOut, setPlaceholderTimedOut] = useState(false) - // Fetch real MCP status from runner const { data: mcpStatus, isPending: mcpPending } = useMcpStatus(projectName, sessionName) const mcpServers = mcpStatus?.servers || [] - const { data: integrationStatus, isPending: integrationStatusPending } = - useProjectIntegrationStatus(projectName) - const githubConfigured = integrationStatus?.github ?? false - - const { data: integrationsStatus } = useIntegrationsStatus() - const gitlabConfigured = integrationsStatus?.gitlab?.connected ?? false - - // Show skeleton cards until we have MCP servers or 2 min elapsed (backend returns empty when runner not ready) const showPlaceholders = mcpPending || (mcpServers.length === 0 && !placeholderTimedOut) @@ -54,49 +50,50 @@ export function McpIntegrationsAccordion({ return } if (!mcpStatus) return - const t = setTimeout(() => setPlaceholderTimedOut(true), 15 * 1000) // 15 seconds + const t = setTimeout(() => setPlaceholderTimedOut(true), 15 * 1000) return () => clearTimeout(t) }, [mcpStatus, mcpServers.length]) - // Collect all MCP servers - const allServers = [...mcpServers] - - // Ensure core integrations always appear (even if not in API response) - if (!showPlaceholders) { - // Webfetch - always available - const hasWebfetch = allServers.some((s) => s.name === 'webfetch') - if (!hasWebfetch) { - allServers.push({ - name: 'webfetch', - displayName: 'Webfetch', - status: 'disconnected', - authenticated: undefined, - authMessage: 'Fetches web content for the session.', - } as McpServer) - } - - // Google Workspace - show as not configured if missing - const hasGoogleWorkspace = allServers.some((s) => s.name === 'google-workspace') - if (!hasGoogleWorkspace) { - allServers.push({ - name: 'google-workspace', - displayName: 'Google Workspace', - status: 'disconnected', - authenticated: false, - authMessage: undefined, - } as McpServer) + const getStatusIcon = (server: McpServer) => { + switch (server.status) { + case 'configured': + case 'connected': + return + case 'error': + return + case 'disconnected': + default: + return } + } - // Jira - workspace-level integration - const hasJira = allServers.some((s) => s.name === 'mcp-atlassian') - if (!hasJira) { - allServers.push({ - name: 'mcp-atlassian', - displayName: 'Jira', - status: 'disconnected', - authenticated: false, - authMessage: undefined, - } as McpServer) + const getStatusBadge = (server: McpServer) => { + switch (server.status) { + case 'configured': + return ( + + Configured + + ) + case 'connected': + return ( + + Connected + + ) + case 'error': + return ( + + Error + + ) + case 'disconnected': + default: + return ( + + Disconnected + + ) } } @@ -115,65 +112,186 @@ export function McpIntegrationsAccordion({ ) - const renderGitHubCard = () => - integrationStatusPending ? ( - renderCardSkeleton() - ) : ( -
( + -
-
-
- {githubConfigured ? ( - - ) : ( - - - - - - - - -

not configured

-
-
-
+ {value ? : } + {key} + + ) + + const renderToolRow = (tool: McpTool) => { + const annotations = Object.entries(tool.annotations).filter( + ([, v]) => typeof v === 'boolean' + ) + return ( +
+ {tool.name} + {annotations.length > 0 && ( +
+ {annotations.map(([k, v]) => renderAnnotationBadge(k, v as boolean))} +
+ )} +
+ ) + } + + const renderServerCard = (server: McpServer) => { + const tools = server.tools ?? [] + const toolCount = tools.length + + return ( +
+
+
+
+ {getStatusIcon(server)} +
+

{server.displayName}

+ {server.version && ( + v{server.version} + )} + {toolCount > 0 && ( + + + + + +
+

+ {server.displayName} — {toolCount} {toolCount === 1 ? 'tool' : 'tools'} +

+
+
+ {tools.map((tool) => renderToolRow(tool))} +
+
+
)}
-

GitHub

-

- {githubConfigured ? ( - 'MCP access to GitHub repositories.' - ) : ( +

+ {getStatusBadge(server)} +
+
+ ) + } + + return ( + + +
+ + MCP Servers + {!showPlaceholders && mcpServers.length > 0 && ( + + {mcpServers.length} + + )} +
+
+ +
+ {showPlaceholders ? ( <> - Session started without GitHub MCP. Configure{' '} - - Integrations - {' '} - and start a new session. + {renderCardSkeleton()} + {renderCardSkeleton()} + ) : mcpServers.length > 0 ? ( + mcpServers.map((server) => renderServerCard(server)) + ) : ( +

+ No MCP servers available for this session. +

)} -

+
+
+
+ ) +} + +// ─── Integrations Accordion ────────────────────────────────────────────────── + +export function IntegrationsAccordion() { + const { data: integrationsStatus, isPending } = useIntegrationsStatus() + + const githubConfigured = integrationsStatus?.github?.active != null + const gitlabConfigured = integrationsStatus?.gitlab?.connected ?? false + const jiraConfigured = integrationsStatus?.jira?.connected ?? false + const googleConfigured = integrationsStatus?.google?.connected ?? false + + const integrations = [ + { + key: 'github', + name: 'GitHub', + configured: githubConfigured, + configuredMessage: 'Authenticated. Git push and repository access enabled.', + }, + { + key: 'gitlab', + name: 'GitLab', + configured: gitlabConfigured, + configuredMessage: 'Authenticated. Git push and repository access enabled.', + }, + { + key: 'google', + name: 'Google Workspace', + configured: googleConfigured, + configuredMessage: 'Authenticated. Drive, Calendar, and Gmail access enabled.', + }, + { + key: 'jira', + name: 'Jira', + configured: jiraConfigured, + configuredMessage: 'Authenticated. Issue and project access enabled.', + }, + ].sort((a, b) => a.name.localeCompare(b.name)) + + const configuredCount = integrations.filter((i) => i.configured).length + + const renderCardSkeleton = () => ( +
+
+
+ + +
+
- ) + ) - const renderGitLabCard = () => - integrationStatusPending ? ( - renderCardSkeleton() - ) : ( + const renderIntegrationCard = (integration: (typeof integrations)[number]) => (
- {gitlabConfigured ? ( + {integration.configured ? ( ) : ( @@ -184,244 +302,77 @@ export function McpIntegrationsAccordion({ -

not configured

+

Not configured

)}
-

GitLab

+

{integration.name}

- {gitlabConfigured ? ( - 'MCP access to GitLab repositories.' + {integration.configured ? ( + integration.configuredMessage ) : ( <> - Session started without GitLab MCP. Configure{' '} + Not connected.{' '} - Integrations + Set up {' '} - and start a new session. + to enable {integration.name} access. )}

- ) - - const renderServerCard = (server: McpServer) => ( -
-
-
-
- {server.authenticated === false ? ( - - - - {getStatusIcon(server)} - - -

not configured

-
-
-
- ) : ( - getStatusIcon(server) - )} -
-

{getDisplayName(server)}

-{server.name === 'mcp-atlassian' && server.authenticated === true && ( - - read only - - )} -
- {getDescription(server) && ( -

- {getDescription(server)} -

- )} -
-
- {getRightContent(server)} -
-
) - const getDisplayName = (server: McpServer) => - server.name === 'mcp-atlassian' ? 'Jira' : server.displayName - - const getDescription = (server: McpServer): ReactNode => { - if (server.name === 'webfetch') return 'Fetches web content for the session.' - if (server.name === 'mcp-atlassian') { - if (server.authenticated === false) { - return ( - <> - Session started without Jira MCP. Configure{' '} - - Integrations - {' '} - and start a new session. - - ) - } - return 'MCP access to Jira issues and projects.' - } - if (server.name === 'google-workspace') { - if (server.authenticated === false) { - return ( - <> - Session started without Google Workspace MCP. Configure{' '} - - Integrations - {' '} - and start a new session. - - ) - } - return 'MCP access to Google Drive files.' - } - return server.authMessage ?? null - } - - const getStatusIcon = (server: McpServer) => { - // If we have auth info, use that for the icon - if (server.authenticated !== undefined) { - if (server.authenticated === true) { - return - } else if (server.authenticated === null) { - // Null = needs refresh/uncertain state - return - } else { - // False = not authenticated/not configured - return - } - } - - // Fall back to status-based icons - switch (server.status) { - case 'configured': - case 'connected': - return - case 'error': - return - case 'disconnected': - default: - return - } - } - - const getRightContent = (server: McpServer) => { - // Webfetch: no badge - if (server.name === 'webfetch') return null - - // Jira not authenticated: no link (description explains to configure and start new session) - - // Google Workspace not authenticated: no link (description explains to configure and start new session) - - // Jira connected: no badge - if (server.name === 'mcp-atlassian' && server.authenticated === true) return null - - // Authenticated: show badge (with optional tooltip) - if (server.authenticated === true) { - const badge = ( - - - Authenticated - - ) - if (server.authMessage) { - return ( - - - {badge} - -

{server.authMessage}

-
-
-
- ) - } - return badge - } - - // Other servers with auth status but not authenticated: no badge (only Jira/Google get links above) - if (server.authenticated === false) return null - - // Fall back to status-based badges (for servers without auth info; webfetch already returns null) - switch (server.status) { - case 'configured': - return ( - - Configured - - ) - case 'connected': - return ( - - Connected - - ) - case 'error': - return ( - - Error - - ) - case 'disconnected': - default: - return ( - - Disconnected - - ) - } - } - - // Combine all integrations (GitHub + GitLab + all MCP servers) - type IntegrationItem = - | { type: 'github'; displayName: string } - | { type: 'gitlab'; displayName: string } - | { type: 'server'; displayName: string; server: McpServer } - const allIntegrations: IntegrationItem[] = [ - { type: 'github' as const, displayName: 'GitHub' }, - { type: 'gitlab' as const, displayName: 'GitLab' }, - ...allServers.map((server) => ({ type: 'server' as const, displayName: getDisplayName(server), server })), - ].sort((a, b) => a.displayName.localeCompare(b.displayName)) - return ( - <> - +
- + Integrations + {!isPending && ( + + {configuredCount}/{integrations.length} + + )}
- {showPlaceholders ? ( + {isPending ? ( <> {renderCardSkeleton()} {renderCardSkeleton()} + {renderCardSkeleton()} ) : ( - allIntegrations.map((item) => { - if (item.type === 'github') { - return
{renderGitHubCard()}
- } else if (item.type === 'gitlab') { - return
{renderGitLabCard()}
- } else { - return renderServerCard(item.server) - } - }) + integrations.map((integration) => renderIntegrationCard(integration)) )}
+ ) +} + +// ─── Legacy export (renders both) ──────────────────────────────────────────── + +type McpIntegrationsAccordionProps = { + projectName: string + sessionName: string +} + +/** @deprecated Use McpServersAccordion + IntegrationsAccordion separately */ +export function McpIntegrationsAccordion({ + projectName, + sessionName, +}: McpIntegrationsAccordionProps) { + return ( + <> + + ) } diff --git a/components/frontend/src/app/projects/[name]/sessions/[sessionName]/page.tsx b/components/frontend/src/app/projects/[name]/sessions/[sessionName]/page.tsx index 169ec1697..cb99f514c 100644 --- a/components/frontend/src/app/projects/[name]/sessions/[sessionName]/page.tsx +++ b/components/frontend/src/app/projects/[name]/sessions/[sessionName]/page.tsx @@ -60,7 +60,7 @@ import { ManageRemoteDialog } from "./components/modals/manage-remote-dialog"; import { WorkflowsAccordion } from "./components/accordions/workflows-accordion"; import { RepositoriesAccordion } from "./components/accordions/repositories-accordion"; import { ArtifactsAccordion } from "./components/accordions/artifacts-accordion"; -import { McpIntegrationsAccordion } from "./components/accordions/mcp-integrations-accordion"; +import { McpServersAccordion, IntegrationsAccordion } from "./components/accordions/mcp-integrations-accordion"; import { WelcomeExperience } from "./components/welcome-experience"; // Extracted hooks and utilities import { useGitOperations } from "./hooks/use-git-operations"; @@ -92,7 +92,7 @@ import { useOOTBWorkflows, useWorkflowMetadata, } from "@/services/queries/use-workflows"; -import { useProjectIntegrationStatus } from "@/services/queries/use-projects"; +import { useIntegrationsStatus } from "@/services/queries/use-integrations"; import { useMutation } from "@tanstack/react-query"; import { FeedbackProvider } from "@/contexts/FeedbackContext"; @@ -187,8 +187,8 @@ export default function ProjectSessionDetailPage({ const continueMutation = useContinueSession(); // Check integration status - const { data: integrationStatus } = useProjectIntegrationStatus(projectName); - const githubConfigured = integrationStatus?.github ?? false; + const { data: integrationsStatus } = useIntegrationsStatus(); + const githubConfigured = integrationsStatus?.github?.active != null; // Get current user for feedback context const { data: currentUser } = useCurrentUser(); @@ -1636,11 +1636,13 @@ export default function ProjectSessionDetailPage({ onNavigateBack={artifactsOps.navigateBack} /> - + + {/* File Explorer */} [s.key, s.value])) - : {}; - const atlassianConfigured = - !!(byKey.JIRA_URL?.trim() && byKey.JIRA_PROJECT?.trim() && byKey.JIRA_EMAIL?.trim() && byKey.JIRA_API_TOKEN?.trim()); + const atlassianConfigured = integrationsStatus?.jira?.connected ?? false; + const googleConfigured = integrationsStatus?.google?.connected ?? false; const form = useForm({ resolver: zodResolver(formSchema), @@ -201,24 +193,21 @@ export function CreateSessionDialog({ )} /> - {/* Integration status (same visual style as integrations accordion), alphabetical: Jira, GitHub, Google Workspace */} + {/* Integration auth status */}
Integrations - {/* Jira card */} - {atlassianConfigured ? ( + {/* GitHub card */} + {githubConfigured ? (
-

Jira

- - read only - +

GitHub

- MCP access to Jira issues and projects. + Authenticated. Git push and repository access enabled.

@@ -228,32 +217,29 @@ export function CreateSessionDialog({
-

Jira

+

GitHub

- Configure{" "} - - Integrations + Not connected.{" "} + + Set up {" "} - to access Jira MCP in this session. + to enable repository access.

)} - {/* GitHub card */} - {githubConfigured ? ( + {/* GitLab card */} + {gitlabConfigured ? (
-

GitHub

+

GitLab

- MCP access to GitHub repositories. + Authenticated. Git push and repository access enabled.

@@ -263,29 +249,29 @@ export function CreateSessionDialog({
-

GitHub

+

GitLab

- Configure{" "} + Not connected.{" "} - Integrations + Set up {" "} - to access GitHub MCP in this session. + to enable repository access.

)} - {/* GitLab card */} - {gitlabConfigured ? ( + {/* Google Workspace card */} + {googleConfigured ? (
-

GitLab

+

Google Workspace

- MCP access to GitLab repositories. + Authenticated. Drive, Calendar, and Gmail access enabled.

@@ -295,33 +281,52 @@ export function CreateSessionDialog({
-

GitLab

+

Google Workspace

- Configure{" "} + Not connected.{" "} - Integrations + Set up {" "} - to access GitLab MCP in this session. + to enable Drive, Calendar, and Gmail access.

)} - {/* Google Workspace card */} -
-
- + {/* Jira card */} + {atlassianConfigured ? ( +
+
+
+
+ +
+

Jira

+
+

+ Authenticated. Issue and project access enabled. +

+
-
-

Google Workspace

-

- Configure{" "} - - Integrations - {" "} - to access Google Workspace MCP in this session. -

+ ) : ( +
+
+ +
+
+

Jira

+

+ Not connected.{" "} + + Set up + {" "} + to enable issue and project access. +

+
-
+ )}
diff --git a/components/frontend/src/services/api/integrations.ts b/components/frontend/src/services/api/integrations.ts index 978b07cbc..58bd24317 100644 --- a/components/frontend/src/services/api/integrations.ts +++ b/components/frontend/src/services/api/integrations.ts @@ -10,6 +10,7 @@ export type IntegrationsStatus = { pat: { configured: boolean updatedAt?: string + valid?: boolean } active?: 'app' | 'pat' } diff --git a/components/frontend/src/services/api/sessions.ts b/components/frontend/src/services/api/sessions.ts index 2da194054..bd55d9d28 100644 --- a/components/frontend/src/services/api/sessions.ts +++ b/components/frontend/src/services/api/sessions.ts @@ -17,14 +17,25 @@ import type { PaginationParams, } from '@/types/api'; +export type McpToolAnnotations = { + readOnly?: boolean; + destructive?: boolean; + idempotent?: boolean; + openWorld?: boolean; + [key: string]: boolean | undefined; +}; + +export type McpTool = { + name: string; + annotations: McpToolAnnotations; +}; + export type McpServer = { name: string; displayName: string; - status: 'configured' | 'connected' | 'disconnected' | 'error'; - authenticated?: boolean | null; // true = valid, false = invalid, null = needs refresh/uncertain, undefined = not checked - authMessage?: string; - source?: string; - command?: string; + status: string; + version?: string; + tools?: McpTool[]; }; export type McpStatusResponse = { diff --git a/components/runners/claude-code-runner/main.py b/components/runners/claude-code-runner/main.py index f38af794e..d609e1550 100644 --- a/components/runners/claude-code-runner/main.py +++ b/components/runners/claude-code-runner/main.py @@ -665,28 +665,24 @@ def _check_mcp_authentication(server_name: str) -> tuple[bool | None, str | None @app.get("/mcp/status") async def get_mcp_status(): """ - Returns MCP servers configured for this session with authentication status. - Goes straight to the source - uses adapter's _load_mcp_config() method. - - For known integrations (Google, Jira), also checks if credentials are present. + Returns MCP server connection status by using the SDK's get_mcp_status() method. + Spins up a minimal ClaudeSDKClient, queries MCP status, then tears it down. 
""" try: global adapter - if not adapter: + if not adapter or not adapter.context: return { "servers": [], "totalCount": 0, "message": "Adapter not initialized yet", } - mcp_servers_list = [] - - # Get the working directory (same logic as adapter uses) - workspace_path = ( - adapter.context.workspace_path if adapter.context else "/workspace" - ) + from claude_agent_sdk import ClaudeAgentOptions, ClaudeSDKClient + import config as runner_config + # Resolve working directory (same logic as adapter) + workspace_path = adapter.context.workspace_path or "/workspace" active_workflow_url = os.getenv("ACTIVE_WORKFLOW_GIT_URL", "").strip() cwd_path = workspace_path @@ -696,41 +692,63 @@ async def get_mcp_status(): if os.path.exists(workflow_path): cwd_path = workflow_path - # Load MCP config using the config module (same as adapter does during runs) - import config as runner_config - mcp_config = runner_config.load_mcp_config(adapter.context, cwd_path) - logger.info(f"MCP config: {mcp_config}") - - if mcp_config: - for server_name, server_config in mcp_config.items(): - # Check authentication status for known servers (Google, Jira) - is_authenticated, auth_message = _check_mcp_authentication(server_name) - - # Platform servers are built-in (webfetch), workflow servers come from config - is_platform = server_name == "webfetch" - - server_info = { - "name": server_name, - "displayName": server_name.replace("-", " ") - .replace("_", " ") - .title(), - "status": "configured", - "command": server_config.get("command", ""), - "source": "platform" if is_platform else "workflow", - } + # Load MCP server config (same config the adapter uses for runs) + mcp_servers = runner_config.load_mcp_config(adapter.context, cwd_path) or {} - # Only include auth fields for servers we know how to check - if is_authenticated is not None: - server_info["authenticated"] = is_authenticated - server_info["authMessage"] = auth_message + # Build minimal options — just enough to initialise MCP servers + options = ClaudeAgentOptions( + cwd=cwd_path, + permission_mode="acceptEdits", + mcp_servers=mcp_servers, + ) - mcp_servers_list.append(server_info) + client = ClaudeSDKClient(options=options) + try: + logger.info("MCP Status: Connecting ephemeral SDK client...") + await client.connect() + + # Use the SDK's public get_mcp_status() method (added in v0.1.23) + sdk_status = await client.get_mcp_status() + logger.info("MCP Status: SDK returned:\n%s", json.dumps(sdk_status, indent=2, default=str)) + + # SDK returns: { mcpServers: [{ name, status, serverInfo: { name, version }, scope, tools }] } + raw_servers = [] + if isinstance(sdk_status, dict): + raw_servers = sdk_status.get("mcpServers", []) + elif isinstance(sdk_status, list): + raw_servers = sdk_status + + servers_list = [] + for srv in raw_servers: + if not isinstance(srv, dict): + continue + server_info = srv.get("serverInfo") or {} + raw_tools = srv.get("tools") or [] + tools = [ + { + "name": t.get("name", ""), + "annotations": { + k: v for k, v in (t.get("annotations") or {}).items() + }, + } + for t in raw_tools + if isinstance(t, dict) + ] + servers_list.append({ + "name": srv.get("name", ""), + "displayName": server_info.get("name", srv.get("name", "")), + "status": srv.get("status", "unknown"), + "version": server_info.get("version", ""), + "tools": tools, + }) - return { - "servers": mcp_servers_list, - "totalCount": len(mcp_servers_list), - "note": "Status shows 'configured' - check 'authenticated' field for credential status", - } + return { + "servers": 
servers_list, + "totalCount": len(servers_list), + } + finally: + logger.info("MCP Status: Disconnecting ephemeral SDK client...") + await client.disconnect() except Exception as e: logger.error(f"Failed to get MCP status: {e}", exc_info=True) From 9bdfeba0db0adf8c84516ce8604fc82b861c3f67 Mon Sep 17 00:00:00 2001 From: Gage Krumbach Date: Fri, 6 Feb 2026 14:19:39 -0600 Subject: [PATCH 4/4] feat: enhance MCP server status handling with session phase integration - Added `sessionPhase` prop to `McpServersAccordion` to conditionally fetch MCP status based on the session's running state. - Updated status display logic to improve user experience by showing placeholders only when the session is not running or when MCP status is pending. - Enhanced visual elements in the MCP servers accordion for better clarity and usability. This update aims to provide more accurate status information and improve the overall functionality of the MCP server integration. --- .../accordions/mcp-integrations-accordion.tsx | 22 ++++++++++++------- .../[name]/sessions/[sessionName]/page.tsx | 1 + 2 files changed, 15 insertions(+), 8 deletions(-) diff --git a/components/frontend/src/app/projects/[name]/sessions/[sessionName]/components/accordions/mcp-integrations-accordion.tsx b/components/frontend/src/app/projects/[name]/sessions/[sessionName]/components/accordions/mcp-integrations-accordion.tsx index cf4a1da17..604cf2b5a 100644 --- a/components/frontend/src/app/projects/[name]/sessions/[sessionName]/components/accordions/mcp-integrations-accordion.tsx +++ b/components/frontend/src/app/projects/[name]/sessions/[sessionName]/components/accordions/mcp-integrations-accordion.tsx @@ -30,29 +30,33 @@ import type { McpServer, McpTool } from '@/services/api/sessions' type McpServersAccordionProps = { projectName: string sessionName: string + sessionPhase?: string } export function McpServersAccordion({ projectName, sessionName, + sessionPhase, }: McpServersAccordionProps) { const [placeholderTimedOut, setPlaceholderTimedOut] = useState(false) - const { data: mcpStatus, isPending: mcpPending } = useMcpStatus(projectName, sessionName) + // Only fetch MCP status once the session is actually running (runner pod ready) + const isRunning = sessionPhase === 'Running' + const { data: mcpStatus, isPending: mcpPending } = useMcpStatus(projectName, sessionName, isRunning) const mcpServers = mcpStatus?.servers || [] const showPlaceholders = - mcpPending || (mcpServers.length === 0 && !placeholderTimedOut) + !isRunning || mcpPending || (mcpServers.length === 0 && !placeholderTimedOut) useEffect(() => { if (mcpServers.length > 0) { setPlaceholderTimedOut(false) return } - if (!mcpStatus) return + if (!isRunning || !mcpStatus) return const t = setTimeout(() => setPlaceholderTimedOut(true), 15 * 1000) return () => clearTimeout(t) - }, [mcpStatus, mcpServers.length]) + }, [mcpStatus, mcpServers.length, isRunning]) const getStatusIcon = (server: McpServer) => { switch (server.status) { @@ -132,8 +136,8 @@ export function McpServersAccordion({ ([, v]) => typeof v === 'boolean' ) return ( -
- {tool.name} +
+ {tool.name} {annotations.length > 0 && (
{annotations.map(([k, v]) => renderAnnotationBadge(k, v as boolean))} @@ -158,6 +162,8 @@ export function McpServersAccordion({ {getStatusIcon(server)}

{server.displayName}

+
+
{server.version && ( v{server.version} )} @@ -176,12 +182,12 @@ export function McpServersAccordion({ align="start" className="w-80 p-0" > -
+

{server.displayName} — {toolCount} {toolCount === 1 ? 'tool' : 'tools'}

-
+
{tools.map((tool) => renderToolRow(tool))}
diff --git a/components/frontend/src/app/projects/[name]/sessions/[sessionName]/page.tsx b/components/frontend/src/app/projects/[name]/sessions/[sessionName]/page.tsx index cb99f514c..b3fc6dcf5 100644 --- a/components/frontend/src/app/projects/[name]/sessions/[sessionName]/page.tsx +++ b/components/frontend/src/app/projects/[name]/sessions/[sessionName]/page.tsx @@ -1639,6 +1639,7 @@ export default function ProjectSessionDetailPage({