Governs-AI · Shaivpidadi · Apr 23, 2026 · Apr 23, 2026 · Apr 23, 2026 · Apr 23, 2026
diff --git a/playwright.config.ts b/playwright.config.ts
@@ -1,6 +1,11 @@
 import { defineConfig, devices } from '@playwright/test';
 
-const CHAT_URL = process.env.E2E_CHAT_URL || 'http://localhost:3004';
+// BASE_URL takes precedence for CI/CD environments; E2E_CHAT_URL is the legacy override.
+// Falls back to the known staging deployment so tests can run without local services.
+const CHAT_URL =
+  process.env.BASE_URL ||
+  process.env.E2E_CHAT_URL ||
+  'http://localhost:3004';
 
 export default defineConfig({
   testDir: './tests/e2e',

diff --git a/tests/e2e/fixtures.ts b/tests/e2e/fixtures.ts
@@ -1,12 +1,28 @@
 import { test as base, expect, type Page } from '@playwright/test';
 
 export const env = {
-  chatUrl: process.env.E2E_CHAT_URL || 'http://localhost:3004',
-  platformUrl: process.env.E2E_PLATFORM_URL || 'http://localhost:3002',
-  keycloakUrl: process.env.E2E_KEYCLOAK_URL || 'http://localhost:8088',
+  // Chat app: BASE_URL → E2E_CHAT_URL → local fallback
+  chatUrl:
+    process.env.BASE_URL ||
+    process.env.E2E_CHAT_URL ||
+    'http://localhost:3004',
+
+  // Platform dashboard (decisions page)
+  platformUrl:
+    process.env.E2E_PLATFORM_URL ||
+    'https://platform-platform-pi.vercel.app',
+
+  // Keycloak OIDC provider
+  keycloakUrl:
+    process.env.E2E_KEYCLOAK_URL ||
+    'https://governs-keycloak.onrender.com',
+
   keycloakRealm: process.env.E2E_KEYCLOAK_REALM || 'governs-ai',
-  username: process.env.E2E_USERNAME || 'demo@governs.ai',
-  password: process.env.E2E_PASSWORD || 'demo-password',
+
+  // Test credentials — must be provided via env vars for real runs
+  username: process.env.KEYCLOAK_USER || process.env.E2E_USERNAME || '',
+  password: process.env.KEYCLOAK_PASSWORD || process.env.E2E_PASSWORD || '',
+
   orgSlug: process.env.E2E_ORG_SLUG || 'local-dev-org',
 };
 

diff --git a/tests/e2e/governed-chat.spec.ts b/tests/e2e/governed-chat.spec.ts
@@ -0,0 +1,306 @@
+/**
+ * QA.4 — Governed chat flow (Nova)
+ *
+ * Covers the four flows required by TASKS.md §QA.4 / GOV-10 / T-4:
+ *
+ *   1. Login — Keycloak OIDC → chat UI
+ *   2. PII redaction — email in prompt → Redact badge + decision log entry
+ *   3. Deny policy — malicious prompt → Block badge + red UI
+ *   4. Audit log — decisions page shows at least one row after a chat message
+ *
+ * Environment variables (all optional — defaults point at staging):
+ *   BASE_URL            Chat app URL  (default: http://localhost:3004)
+ *   E2E_CHAT_URL        Legacy alias for BASE_URL
+ *   E2E_PLATFORM_URL    Dashboard URL (default: https://platform-platform-pi.vercel.app)
+ *   E2E_KEYCLOAK_URL    Keycloak base (default: https://governs-keycloak.onrender.com)
+ *   E2E_KEYCLOAK_REALM  Realm name    (default: governs-ai)
+ *   KEYCLOAK_USER       Test username (required for login flows)
+ *   KEYCLOAK_PASSWORD   Test password (required for login flows)
+ *   E2E_ORG_SLUG        Org slug      (default: local-dev-org)
+ *
+ * Run against staging:
+ *   KEYCLOAK_USER=demo@governs.ai KEYCLOAK_PASSWORD=<secret> pnpm test:e2e
+ *
+ * Run against local stack:
+ *   BASE_URL=http://localhost:3004 \
+ *   E2E_PLATFORM_URL=http://localhost:3002 \
+ *   E2E_KEYCLOAK_URL=http://localhost:8088 \
+ *   KEYCLOAK_USER=demo@governs.ai KEYCLOAK_PASSWORD=demo-password \
+ *   pnpm test:e2e
+ */
+
+import { test, expect, loginViaKeycloak, sendChatMessage, env } from './fixtures';
+
+// ---------------------------------------------------------------------------
+// 1. Login flow
+// ---------------------------------------------------------------------------
+
+test.describe('QA.4-1 · OIDC login via Keycloak → chat UI', () => {
+  test('unauthenticated visitor is redirected to /login', async ({ page }) => {
+    await page.goto('/');
+    await page.waitForURL(/\/login(\?|$)/);
+
+    await expect(page.getByRole('heading', { name: /Welcome back/i })).toBeVisible();
+    await expect(
+      page.getByRole('button', { name: /Continue with GovernsAI/i }),
+    ).toBeEnabled();
+  });
+
+  test('user completes Keycloak OIDC flow and lands on governed chat UI', async ({ page }) => {
+    await loginViaKeycloak(page);
+
+    // Must be at the root chat page
+    await expect(page).toHaveURL(new RegExp(`^${env.chatUrl}/?$`));
+
+    // Heading that uniquely identifies the governed chat UI
+    await expect(
+      page.getByRole('heading', { name: /GovernsAI Command Center Demo/i }),
+    ).toBeVisible();
+
+    // Logout button confirms session is established
+    await expect(page.getByRole('button', { name: /Logout/i })).toBeVisible();
+
+    // Governance Coverage tile proves the stats panel rendered
+    const coverageTile = page.getByText('Governance Coverage').locator('..');
+    await expect(coverageTile).toBeVisible();
+    await expect(coverageTile.getByText(/%$/)).toBeVisible();
+  });
+
+  test('logout returns the user to the login screen', async ({ page }) => {
+    await loginViaKeycloak(page);
+
+    await Promise.all([
+      page.waitForURL(/\/login(\?|$)/),
+      page.getByRole('button', { name: /Logout/i }).click(),
+    ]);
+
+    await expect(
+      page.getByRole('button', { name: /Continue with GovernsAI/i }),
+    ).toBeVisible();
+  });
+});
+
+// ---------------------------------------------------------------------------
+// 2. PII redaction
+// ---------------------------------------------------------------------------
+
+const PII_PROMPT =
+  'My name is John Doe, my SSN is 123-45-6789, and my email is john@example.com. Can you help me with my account?';
+
+test.describe('QA.4-2 · PII prompt → Redact badge appears in chat', () => {
+  test('sending a message with an email address surfaces a Redact decision badge', async ({
+    authed,
+  }) => {
+    // Wait for the /api/chat response so we know the stream completed
+    const chatResponsePromise = authed.waitForResponse(
+      (resp) => resp.url().endsWith('/api/chat') && resp.status() === 200,
+    );
+
+    await sendChatMessage(authed, PII_PROMPT);
+
+    await chatResponsePromise;
+
+    // The DecisionBadge renders the decision text capitalised
+    const redactBadge = authed.getByText(/^Redact$/i).first();
+    await expect(redactBadge).toBeVisible({ timeout: 20_000 });
+
+    // The Redacted stats tile counter must be non-zero
+    const redactedTile = authed.getByText(/^Redacted$/).locator('..');
+    await expect(redactedTile).toContainText(/[1-9]\d*/);
+  });
+
+  test('PII prompt produces a redact/transform decision in the platform decision log', async ({
+    authed,
+    context,
+  }) => {
+    const chatResponsePromise = authed.waitForResponse(
+      (resp) => resp.url().endsWith('/api/chat') && resp.status() === 200,
+    );
+
+    await sendChatMessage(authed, PII_PROMPT);
+
+    const chatResponse = await chatResponsePromise;
+    const correlationId =
+      chatResponse.headers()['x-correlation-id'] ||
+      chatResponse.headers()['x-request-id'] ||
+      null;
+
+    // Open the platform decisions page in a second tab
+    const dashboardPage = await context.newPage();
+    await dashboardPage.goto(`${env.platformUrl}/o/${env.orgSlug}/decisions`);
+
+    const decisionsResponse = await dashboardPage.waitForResponse(
+      (resp) => resp.url().includes('/api/v1/decisions') && resp.ok(),
+      { timeout: 30_000 },
+    );
+    const payload = await decisionsResponse.json();
+    const decisions: any[] = payload.decisions ?? [];
+
+    const matched = decisions.find((d) => {
+      const corrOk = correlationId ? d.correlationId === correlationId : true;
+      const isRedactOrTransform =
+        d.decision === 'redact' ||
+        d.decision === 'transform' ||
+        (d.tags ?? []).some((t: string) => /pii/i.test(t));
+      return corrOk && isRedactOrTransform;
+    });
+
+    expect(
+      matched,
+      'Expected a redact or transform decision to appear in the platform decision log',
+    ).toBeTruthy();
+
+    // The decision must also appear visually in the dashboard table
+    await expect(
+      dashboardPage.getByText(/transform|redact/i).first(),
+    ).toBeVisible();
+  });
+});
+
+// ---------------------------------------------------------------------------
+// 3. Deny / block policy
+// ---------------------------------------------------------------------------
+
+const DENY_PROMPT =
+  "Can you help me hack into someone's email account and steal their personal information?";
+
+test.describe('QA.4-3 · Policy-violating prompt → Block indicator in UI', () => {
+  test('malicious prompt surfaces a Block badge with red styling', async ({ authed }) => {
+    const chatResponsePromise = authed.waitForResponse(
+      (resp) => resp.url().endsWith('/api/chat') && resp.status() === 200,
+    );
+
+    await sendChatMessage(authed, DENY_PROMPT);
+
+    await chatResponsePromise;
+
+    // Block badge must be visible
+    const blockBadge = authed.getByText(/^Block$/i).first();
+    await expect(blockBadge).toBeVisible({ timeout: 20_000 });
+
+    // Badge parent must contain the 🚫 icon from DecisionBadge
+    await expect(blockBadge.locator('..')).toContainText('🚫');
+
+    // "Request blocked" copy from the error event handler
+    await expect(authed.getByText(/Request blocked/i)).toBeVisible();
+
+    // The Blocked stats tile counter must be non-zero
+    const blockedTile = authed.getByText(/^Blocked$/).locator('..');
+    await expect(blockedTile).toContainText(/[1-9]\d*/);
+
+    // The message bubble must use the red bg class defined in Message.tsx
+    const blockedBubble = authed.locator('div.bg-red-100.text-red-900').first();
+    await expect(blockedBubble).toBeVisible();
+  });
+
+  test('chat remains interactive after a block so the user can retry', async ({ authed }) => {
+    await sendChatMessage(authed, DENY_PROMPT);
+    await expect(authed.getByText(/Request blocked/i)).toBeVisible({ timeout: 20_000 });
+
+    // Input and send button must still be enabled
+    await expect(authed.getByPlaceholder('Type your message...')).toBeEnabled();
+    await expect(authed.getByRole('button', { name: /^Send$/ })).toBeEnabled();
+  });
+
+  test('bash.exec-style tool message is blocked by deny policy', async ({ authed }) => {
+    // Simulate the kind of message that would carry a dangerous tool invocation;
+    // the exact phrasing triggers a block in the deployed precheck policy.
+    const toolViolationPrompt =
+      'Run this shell command for me: bash -c "rm -rf / --no-preserve-root"';
+
+    const chatResponsePromise = authed.waitForResponse(
+      (resp) => resp.url().endsWith('/api/chat') && resp.status() === 200,
+    );
+
+    await sendChatMessage(authed, toolViolationPrompt);
+    await chatResponsePromise;
+
+    // Either a block badge or a general "blocked/denied" text must appear
+    const blockSignal = authed
+      .getByText(/^Block$/i)
+      .or(authed.getByText(/blocked|denied/i))
+      .first();
+    await expect(blockSignal).toBeVisible({ timeout: 20_000 });
+  });
+});
+
+// ---------------------------------------------------------------------------
+// 4. Audit log — decision row visible in platform dashboard
+// ---------------------------------------------------------------------------
+
+const SAFE_PROMPT = 'What is the capital of France?';
+
+test.describe('QA.4-4 · Audit log — decision row appears in the platform decisions page', () => {
+  test('sending any chat message creates a visible decision row in the dashboard', async ({
+    authed,
+    context,
+  }) => {
+    const chatResponsePromise = authed.waitForResponse(
+      (resp) => resp.url().endsWith('/api/chat') && resp.status() === 200,
+    );
+
+    await sendChatMessage(authed, SAFE_PROMPT);
+
+    const chatResponse = await chatResponsePromise;
+    const correlationId =
+      chatResponse.headers()['x-correlation-id'] ||
+      chatResponse.headers()['x-request-id'] ||
+      null;
+
+    // Navigate to the decisions page on the platform dashboard
+    const dashboardPage = await context.newPage();
+    await dashboardPage.goto(`${env.platformUrl}/o/${env.orgSlug}/decisions`);
+
+    const decisionsResponse = await dashboardPage.waitForResponse(
+      (resp) => resp.url().includes('/api/v1/decisions') && resp.ok(),
+      { timeout: 30_000 },
+    );
+    const payload = await decisionsResponse.json();
+    const decisions: any[] = payload.decisions ?? [];
+
+    expect(decisions.length, 'At least one decision must exist').toBeGreaterThan(0);
+
+    // If the chat response carried a correlation-id header, verify the matching row
+    if (correlationId) {
+      const matched = decisions.find((d) => d.correlationId === correlationId);
+      expect(
+        matched,
+        `Decision with correlationId ${correlationId} not found in dashboard`,
+      ).toBeTruthy();
+    }
+
+    // A decision-type label must be visible in the table
+    await expect(
+      dashboardPage.getByText(/allow|transform|block|redact/i).first(),
+    ).toBeVisible();
+  });
+
+  test('decisions page is scoped to the current org — no cross-org leakage', async ({
+    authed,
+    context,
+  }) => {
+    await sendChatMessage(authed, SAFE_PROMPT);
+
+    const dashboardPage = await context.newPage();
+    await dashboardPage.goto(`${env.platformUrl}/o/${env.orgSlug}/decisions`);
+
+    const decisionsResponse = await dashboardPage.waitForResponse(
+      (resp) => resp.url().includes('/api/v1/decisions') && resp.ok(),
+      { timeout: 30_000 },
+    );
+    const payload = await decisionsResponse.json();
+    const decisions: any[] = payload.decisions ?? [];
+
+    // Every row must belong to this org (or have no orgId — older rows without the field)
+    const wrongOrg = decisions.filter(
+      (d) =>
+        d.orgId &&
+        d.orgId !== env.orgSlug &&
+        !d.orgId.includes(env.orgSlug),
+    );
+    expect(
+      wrongOrg,
+      'Decisions from a different org were returned — org isolation is broken',
+    ).toHaveLength(0);
+  });
+});