diff --git a/.gitignore b/.gitignore
index 66bfb0f..17a9f02 100644
--- a/.gitignore
+++ b/.gitignore
@@ -186,6 +186,7 @@ eng_plans/
 
 # RL training artifacts
 rl/models/*.zip
+!rl/models/cuttle_rl_final.zip
 rl/logs/
 
 .DS_Store
diff --git a/Makefile b/Makefile
index 7b87083..0533d60 100644
--- a/Makefile
+++ b/Makefile
@@ -14,6 +14,14 @@ run:
 
 run-with-rl:
 	source $(VENV_NAME)/bin/activate && PYTHONPATH=$(CURRENT_DIR) python main_with_rl_ai.py
+
+# Dockerized dev environment (backend + Vite); phony so files named dev/dev-down cannot mask them
+.PHONY: dev dev-down
+dev:
+	docker compose -f docker-compose.dev.yaml up --build -d
+
+dev-down:
+	docker compose -f docker-compose.dev.yaml down
 # Generate documentation using pdoc
 docs:
 	source $(VENV_NAME)/bin/activate && PYTHONPATH=$(CURRENT_DIR) python docs.py
@@ -57,4 +65,4 @@ test-rl:
 	@echo "Quick RL training test with action masking (10K timesteps, ~2-3 minutes)..."
 	source $(VENV_NAME)/bin/activate && PYTHONPATH=$(CURRENT_DIR) python -c \
 		"from rl import config; config.TRAINING_CONFIG['total_timesteps'] = 10000; \
-		exec(open('rl/train.py').read())"
\ No newline at end of file
+		exec(open('rl/train.py').read())"
diff --git a/README.md b/README.md
index c4a6d1b..a247234 100644
--- a/README.md
+++ b/README.md
@@ -2,6 +2,7 @@
 
 
 # Set Up
+## Local dev (no Docker)
 ## Create a virtual environment
 
 ```bash
@@ -9,6 +10,11 @@ python3 -m venv cuttle-bot-3.12
 source ./cuttle-bot-3.12/bin/activate
 ```
 
+Or use the Makefile helper (requires `python3.12` on PATH):
+
+```bash
+make setup
+```
 
 ## Install requirements
 
@@ -16,8 +22,42 @@ source ./cuttle-bot-3.12/bin/activate
 pip install -r requirements.txt
 ```
 
+## Run the dev servers
+
+Backend API (FastAPI + reload):
+
+```bash
+uvicorn server.app:app --reload --host 0.0.0.0 --port 8000
+```
+
+Frontend (Vite):
+
+```bash
+cd web && npm install && npm run dev
+```
+
+Open http://localhost:5173
+
+## Docker dev (hot reload)
+
+```bash
+make dev
+```
+
+Open http://localhost:5173 (API at http://localhost:8000).
+
 ## Set up AI player
 
+The game currently supports two types of AI players: an RL-based AI and an LLM-based AI.
+
+### RL-based AI
+
+The repo ships with a pre-trained model (`rl/models/cuttle_rl_final.zip`) that the game server loads.
+
+You can also retrain the model locally (see the training sections later in this document).
+
+### LLM-based AI
+
 The AI player uses ollama to generate actions. You'll need to install ollama and set up a model.
 
 Follow the installation guide here: https://github.com/ollama/ollama
@@ -101,3 +141,4 @@ Adjust training parameters in `rl/config.py`:
 - Models saved to: `rl/models/`
 - Training logs: `rl/logs/` (view with TensorBoard)
 - Checkpoints every 10K timesteps
+- Checkpoints are gitignored; only the final model, `rl/models/cuttle_rl_final.zip`, is tracked in git
diff --git a/codex-workflows/codex_mcp.py b/codex-workflows/codex_mcp.py
deleted file mode 100644
index 3e65a53..0000000
--- a/codex-workflows/codex_mcp.py
+++ /dev/null
@@ -1,51 +0,0 @@
-import asyncio
-import os
-import shlex
-
-from dotenv import load_dotenv
-
-from agents import Agent, Runner, set_default_openai_api
-from agents.mcp import MCPServerStdio
-
-load_dotenv(override=True)
-set_default_openai_api(os.getenv("OPENAI_API_KEY"))
-
-
-async def main() -> None:
-    command = os.getenv("CODEX_MCP_COMMAND", "npx")
-    args = shlex.split(
-        os.getenv("CODEX_MCP_ARGS", "-y @openai/codex mcp-server")
-    )
-    async with MCPServerStdio(
-        name="Codex CLI",
-        params={
-            "command": command,
-            "args": args,
-        },
-        client_session_timeout_seconds=360000,
-    ) as codex_mcp_server:
-        developer_agent = Agent(
-            name="Game Developer",
-            instructions=(
-                "You are an expert in building simple games using basic html + css + javascript with no dependencies. "
-                "Save your work in a file called index.html in the current directory. "
-                "Always call codex with \"approval-policy\": \"never\" and \"sandbox\": \"workspace-write\"."
-            ),
-            mcp_servers=[codex_mcp_server],
-        )
-
-        designer_agent = Agent(
-            name="Game Designer",
-            instructions=(
-                "You are an indie game connoisseur. Come up with an idea for a single page html + css + javascript game that a developer could build in about 50 lines of code. "
-                "Format your request as a 3 sentence design brief for a game developer and call the Game Developer coder with your idea."
-            ),
-            model="gpt-5",
-            handoffs=[developer_agent],
-        )
-
-        await Runner.run(designer_agent, "Implement a fun new game!")
-
-
-if __name__ == "__main__":
-    asyncio.run(main())
diff --git a/codex-workflows/index.html b/codex-workflows/index.html
deleted file mode 100644
index 92d0cd2..0000000
--- a/codex-workflows/index.html
+++ /dev/null
@@ -1,391 +0,0 @@
-<!doctype html>
-<html lang="en">
-<head>
-<meta charset="utf-8" />
-<meta name="viewport" content="width=device-width, initial-scale=1" />
-<title>Arc Snap</title>
-<style>
-  :root {
-    color-scheme: light;
-    --bg-1: #f2e9da;
-    --bg-2: #e0d0b7;
-    --ink: #201a16;
-    --muted: #6e645a;
-    --track: #3b342e;
-    --accent: #f26a4f;
-    --accent-soft: #f4c95c;
-    --panel: rgba(255, 255, 255, 0.7);
-  }
-
-  * { box-sizing: border-box; }
-
-  body {
-    margin: 0;
-    min-height: 100vh;
-    display: flex;
-    align-items: center;
-    justify-content: center;
-    background:
-      radial-gradient(700px 450px at 15% 10%, rgba(255, 255, 255, 0.8), rgba(255, 255, 255, 0)),
-      radial-gradient(620px 380px at 85% 15%, rgba(255, 226, 196, 0.7), rgba(255, 226, 196, 0)),
-      linear-gradient(150deg, var(--bg-1), var(--bg-2));
-    color: var(--ink);
-    font-family: "Space Grotesk", "Avenir Next", "Trebuchet MS", sans-serif;
-  }
-
-  .shell {
-    width: min(92vw, 540px);
-    display: grid;
-    gap: 12px;
-    justify-items: center;
-    text-align: center;
-  }
-
-  h1 {
-    margin: 0;
-    font-size: clamp(1.8rem, 4vw, 2.6rem);
-    letter-spacing: 0.04em;
-  }
-
-  .hud {
-    width: 100%;
-    display: flex;
-    justify-content: space-between;
-    font-size: 0.75rem;
-    letter-spacing: 0.2em;
-    text-transform: uppercase;
-    background: var(--panel);
-    padding: 10px 16px;
-    border-radius: 999px;
-    color: var(--muted);
-  }
-
-  #game {
-    width: min(80vw, 460px);
-    height: min(80vw, 460px);
-    border-radius: 24px;
-    background: rgba(255, 255, 255, 0.5);
-    box-shadow: 0 22px 60px rgba(0, 0, 0, 0.18);
-    outline: none;
-  }
-
-  #game:focus-visible {
-    box-shadow: 0 0 0 4px rgba(242, 106, 79, 0.35), 0 22px 60px rgba(0, 0, 0, 0.18);
-  }
-
-  .message {
-    min-height: 1.5rem;
-    color: var(--muted);
-    white-space: pre-line;
-  }
-
-  .restart {
-    border: none;
-    padding: 10px 22px;
-    border-radius: 999px;
-    background: var(--accent);
-    color: #fff;
-    font-weight: 600;
-    letter-spacing: 0.1em;
-    text-transform: uppercase;
-    cursor: pointer;
-    transition: transform 0.15s ease, box-shadow 0.2s ease;
-  }
-
-  .restart:hover {
-    transform: translateY(-2px);
-    box-shadow: 0 10px 20px rgba(242, 106, 79, 0.35);
-  }
-
-  @media (max-width: 520px) {
-    .hud { font-size: 0.65rem; }
-  }
-</style>
-</head>
-<body>
-  <main class="shell">
-    <h1>Arc Snap</h1>
-    <div class="hud">
-      <div>Score <span id="score">0</span></div>
-      <div>Best <span id="best">0</span></div>
-      <div>Lives <span id="lives">1</span></div>
-    </div>
-    <canvas id="game" tabindex="0" aria-label="Arc Snap timing game"></canvas>
-    <div id="message" class="message">Click or tap to start</div>
-    <button id="restart" class="restart" hidden>Restart</button>
-  </main>
-
-<script>
-  const canvas = document.getElementById("game");
-  const ctx = canvas.getContext("2d");
-  const scoreEl = document.getElementById("score");
-  const bestEl = document.getElementById("best");
-  const livesEl = document.getElementById("lives");
-  const messageEl = document.getElementById("message");
-  const restartBtn = document.getElementById("restart");
-
-  const TAU = Math.PI * 2;
-  const bestKey = "arc-snap-best";
-
-  let viewSize = 420;
-  let pixelRatio = window.devicePixelRatio || 1;
-
-  const state = {
-    running: false,
-    gameOver: false,
-    score: 0,
-    best: Number.parseInt(localStorage.getItem(bestKey) || "0", 10),
-    speed: 2.2,
-    angle: 0,
-    sliceStart: 0,
-    sliceSize: 1.1,
-    minSlice: 0.35,
-    flash: 0,
-    flashMax: 0,
-    flashColor: "242, 201, 92",
-    pause: 0,
-    lives: 1,
-    messageTimer: 0
-  };
-
-  const clamp = (value, min, max) => Math.min(max, Math.max(min, value));
-
-  const normalizeAngle = (angle) => {
-    let a = angle % TAU;
-    if (a < 0) a += TAU;
-    return a;
-  };
-
-  const isAngleInSlice = (angle, start, size) => {
-    if (size >= TAU) return true;
-    const a = normalizeAngle(angle);
-    const s = normalizeAngle(start);
-    const e = normalizeAngle(start + size);
-    if (s <= e) return a >= s && a <= e;
-    return a >= s || a <= e;
-  };
-
-  const updateHud = () => {
-    scoreEl.textContent = state.score;
-    bestEl.textContent = state.best;
-    livesEl.textContent = state.lives > 0 ? "x".repeat(state.lives) : "0";
-  };
-
-  const setMessage = (text, duration) => {
-    messageEl.textContent = text;
-    state.messageTimer = duration || 0;
-  };
-
-  const flash = (color, duration) => {
-    state.flashColor = color;
-    state.flash = duration;
-    state.flashMax = duration;
-  };
-
-  const randomSlice = () => {
-    state.sliceStart = Math.random() * TAU;
-  };
-
-  const resetRun = () => {
-    state.score = 0;
-    state.speed = 2.2;
-    state.angle = 0;
-    state.sliceSize = 1.1;
-    state.pause = 0;
-    state.lives = 1;
-    state.gameOver = false;
-    state.running = false;
-    randomSlice();
-    updateHud();
-    setMessage("Click or tap to start", 0);
-    restartBtn.hidden = true;
-  };
-
-  const startRun = () => {
-    state.running = true;
-    state.gameOver = false;
-    setMessage("", 0);
-    restartBtn.hidden = true;
-  };
-
-  const endRun = () => {
-    state.running = false;
-    state.gameOver = true;
-    setMessage(`Game Over\nScore ${state.score}\nClick or tap to restart`, 0);
-    restartBtn.hidden = false;
-  };
-
-  const handleHit = () => {
-    state.score += 1;
-    if (state.score > state.best) {
-      state.best = state.score;
-      localStorage.setItem(bestKey, String(state.best));
-    }
-    state.speed *= 1.06;
-    state.sliceSize = Math.max(state.minSlice, state.sliceSize * 0.92);
-    state.pause = 0.12;
-    randomSlice();
-    flash("244, 201, 92", 0.22);
-    setMessage("Snap!", 0.4);
-    updateHud();
-  };
-
-  const handleMiss = () => {
-    state.pause = 0.16;
-    if (state.lives > 0) {
-      state.lives -= 1;
-      flash("242, 106, 79", 0.25);
-      setMessage("Close! One life used.", 0.6);
-      randomSlice();
-      updateHud();
-      return;
-    }
-    endRun();
-  };
-
-  const attemptSnap = () => {
-    if (!state.running || state.gameOver) return;
-    const hit = isAngleInSlice(state.angle, state.sliceStart, state.sliceSize);
-    if (hit) handleHit();
-    else handleMiss();
-  };
-
-  const handleAction = () => {
-    if (state.gameOver) {
-      resetRun();
-      startRun();
-      return;
-    }
-    if (!state.running) {
-      startRun();
-      return;
-    }
-    attemptSnap();
-  };
-
-  const resizeCanvas = () => {
-    pixelRatio = window.devicePixelRatio || 1;
-    viewSize = clamp(Math.min(window.innerWidth, window.innerHeight) * 0.72, 260, 520);
-    canvas.style.width = `${viewSize}px`;
-    canvas.style.height = `${viewSize}px`;
-    canvas.width = Math.round(viewSize * pixelRatio);
-    canvas.height = Math.round(viewSize * pixelRatio);
-    ctx.setTransform(pixelRatio, 0, 0, pixelRatio, 0, 0);
-  };
-
-  const draw = () => {
-    const w = viewSize;
-    const h = viewSize;
-    ctx.clearRect(0, 0, w, h);
-
-    const centerX = w / 2;
-    const centerY = h / 2;
-    const radius = w * 0.32;
-    const ringWidth = radius * 0.22;
-
-    const glow = ctx.createRadialGradient(centerX, centerY, radius * 0.1, centerX, centerY, radius * 1.4);
-    glow.addColorStop(0, "rgba(255, 255, 255, 0.9)");
-    glow.addColorStop(1, "rgba(255, 255, 255, 0)");
-    ctx.fillStyle = glow;
-    ctx.beginPath();
-    ctx.arc(centerX, centerY, radius + ringWidth, 0, TAU);
-    ctx.fill();
-
-    ctx.save();
-    ctx.translate(centerX, centerY);
-
-    ctx.lineWidth = ringWidth;
-    ctx.strokeStyle = "#3b342e";
-    ctx.beginPath();
-    ctx.arc(0, 0, radius, 0, TAU);
-    ctx.stroke();
-
-    ctx.lineCap = "round";
-    ctx.strokeStyle = "#f26a4f";
-    ctx.lineWidth = ringWidth * 0.9;
-    ctx.beginPath();
-    ctx.arc(0, 0, radius, state.sliceStart - Math.PI / 2, state.sliceStart + state.sliceSize - Math.PI / 2);
-    ctx.stroke();
-
-    ctx.rotate(state.angle - Math.PI / 2);
-    ctx.strokeStyle = "#201a16";
-    ctx.lineWidth = 3;
-    ctx.beginPath();
-    ctx.moveTo(-radius * 0.08, 0);
-    ctx.lineTo(radius, 0);
-    ctx.stroke();
-
-    ctx.fillStyle = "#201a16";
-    ctx.beginPath();
-    ctx.moveTo(radius, 0);
-    ctx.lineTo(radius - 14, -6);
-    ctx.lineTo(radius - 14, 6);
-    ctx.closePath();
-    ctx.fill();
-
-    ctx.restore();
-
-    ctx.fillStyle = "#201a16";
-    ctx.beginPath();
-    ctx.arc(centerX, centerY, ringWidth * 0.22, 0, TAU);
-    ctx.fill();
-
-    if (state.flash > 0) {
-      const intensity = state.flashMax > 0 ? state.flash / state.flashMax : 0;
-      ctx.strokeStyle = `rgba(${state.flashColor}, ${intensity})`;
-      ctx.lineWidth = ringWidth * 1.15;
-      ctx.beginPath();
-      ctx.arc(centerX, centerY, radius, 0, TAU);
-      ctx.stroke();
-    }
-  };
-
-  let lastTime = performance.now();
-  const tick = (time) => {
-    const delta = Math.min((time - lastTime) / 1000, 0.05);
-    lastTime = time;
-
-    if (state.messageTimer > 0) {
-      state.messageTimer = Math.max(0, state.messageTimer - delta);
-      if (state.messageTimer === 0 && state.running) messageEl.textContent = "";
-    }
-
-    if (state.running) {
-      if (state.pause > 0) {
-        state.pause = Math.max(0, state.pause - delta);
-      } else {
-        state.angle = normalizeAngle(state.angle + state.speed * delta);
-      }
-    }
-
-    if (state.flash > 0) state.flash = Math.max(0, state.flash - delta);
-
-    draw();
-    requestAnimationFrame(tick);
-  };
-
-  canvas.addEventListener("pointerdown", (event) => {
-    event.preventDefault();
-    handleAction();
-  });
-
-  window.addEventListener("keydown", (event) => {
-    if (event.code !== "Space" && event.key !== "Enter") return;
-    event.preventDefault();
-    handleAction();
-  });
-
-  restartBtn.addEventListener("click", () => {
-    resetRun();
-    startRun();
-  });
-
-  window.addEventListener("resize", resizeCanvas);
-
-  resizeCanvas();
-  updateHud();
-  draw();
-  requestAnimationFrame(tick);
-</script>
-</body>
-</html>
diff --git a/docker-compose.dev.yaml b/docker-compose.dev.yaml
new file mode 100644
index 0000000..da4d8ad
--- /dev/null
+++ b/docker-compose.dev.yaml
@@ -0,0 +1,34 @@
+# Dev-only stack: FastAPI backend (uvicorn --reload) + Vite frontend, source bind-mounted for hot reload.
+
+services:
+  backend:
+    image: python:3.12-slim
+    working_dir: /app
+    volumes:
+      - ./server:/app/server
+      - ./game:/app/game
+      - ./rl:/app/rl
+      - ./requirements.txt:/app/requirements.txt:ro
+    command: sh -c "pip install --no-cache-dir -r requirements.txt && uvicorn server.app:app --host 0.0.0.0 --port 8000 --reload"
+    ports:
+      - "8000:8000"
+    environment:
+      PYTHONDONTWRITEBYTECODE: "1"
+      PYTHONUNBUFFERED: "1"
+
+  frontend:
+    image: node:20-slim
+    working_dir: /app
+    volumes:
+      - ./web:/app
+      - web-node-modules:/app/node_modules
+    command: sh -c "if [ ! -x node_modules/.bin/vite ]; then npm ci; fi; npm run dev -- --host 0.0.0.0 --port 5173"
+    ports:
+      - "5173:5173"
+    environment:
+      VITE_API_PROXY_TARGET: "http://backend:8000"
+    depends_on:
+      - backend
+
+volumes:
+  web-node-modules:
diff --git a/rl/models/cuttle_rl_final.zip b/rl/models/cuttle_rl_final.zip
new file mode 100644
index 0000000..d45786d
Binary files /dev/null and b/rl/models/cuttle_rl_final.zip differ
diff --git a/web/vite.config.ts b/web/vite.config.ts
index 8d02698..78a7b32 100644
--- a/web/vite.config.ts
+++ b/web/vite.config.ts
@@ -1,18 +1,24 @@
 import { defineConfig } from 'vitest/config'
+import { loadEnv } from 'vite'
 import react from '@vitejs/plugin-react'
 
 // https://vite.dev/config/
-export default defineConfig({
-  plugins: [react()],
-  server: {
-    proxy: {
-      '/api': 'http://localhost:8000',
+export default defineConfig(({ mode }) => {
+  const env = loadEnv(mode, process.cwd(), 'VITE_')
+  const apiProxyTarget = env.VITE_API_PROXY_TARGET || 'http://localhost:8000'
+  // Overridable so docker-compose.dev.yaml can point /api at its backend service; defaults to localhost.
+  return {
+    plugins: [react()],
+    server: {
+      proxy: {
+        '/api': apiProxyTarget,
+      },
+    },
+    test: {
+      environment: 'jsdom',
+      setupFiles: './src/test/setup.ts',
+      globals: true,
+      include: ['tests/unit/**/*.spec.ts', 'tests/unit/**/*.spec.tsx'],
     },
-  },
-  test: {
-    environment: 'jsdom',
-    setupFiles: './src/test/setup.ts',
-    globals: true,
-    include: ['tests/unit/**/*.spec.ts', 'tests/unit/**/*.spec.tsx'],
-  },
+  }
 })