diff --git a/packages/core/src/elevenlabs/index.ts b/packages/core/src/elevenlabs/index.ts
index 977740358..c73aba9b7 100644
--- a/packages/core/src/elevenlabs/index.ts
+++ b/packages/core/src/elevenlabs/index.ts
@@ -17,3 +17,12 @@ export {
 export type { ElevenLabsVoice, SynthesizeOptions } from "./client.js";
 export { generateSoundEffect, clampSfxDuration, SFX_BOUNDS } from "./sfx.js";
 export type { GenerateSfxOptions, GenerateSfxResult } from "./sfx.js";
+export {
+  generateMusic,
+  generateMusicAndWait,
+  getMusicJob,
+  downloadMusic,
+  clampMusicDuration,
+  MUSIC_BOUNDS,
+} from "./music.js";
+export type { GenerateMusicOptions, MusicJob, MusicJobStatus } from "./music.js";
diff --git a/packages/core/src/elevenlabs/music.ts b/packages/core/src/elevenlabs/music.ts
new file mode 100644
index 000000000..269298e8e
--- /dev/null
+++ b/packages/core/src/elevenlabs/music.ts
@@ -0,0 +1,184 @@
+/**
+ * ElevenLabs Music client (Eleven v3 Music). Unlike SFX, which is synchronous
+ * (request → mp3 in one round-trip), music is an async job:
+ *
+ *   POST /v1/music     → { music_id, status: "processing" }
+ *   GET  /v1/music/:id → { status: "completed", audio_url }
+ *   GET  audio_url     → mp3 bytes
+ *
+ * Callers want either the bytes (most common) or the job id (for progress
+ * UIs). `generateMusicAndWait` does the full poll-then-download flow with
+ * geometric backoff. The studio route exposes the job id immediately so the
+ * UI can show "generating…" without freezing the request.
+ */
+
+import { ElevenLabsError } from "./client.js";
+
+const API_BASE = "https://api.elevenlabs.io/v1";
+
+/** Music length bounds. The API supports up to ~5min in practice; we cap
+ * shorter to avoid runaway generations on user typos. */
+export const MUSIC_BOUNDS = {
+  durationMin: 10,
+  durationMax: 300,
+  promptMaxChars: 1500,
+} as const;
+
+export type MusicJobStatus = "processing" | "completed" | "failed";
+
+export interface MusicJob {
+  id: string;
+  status: MusicJobStatus;
+  /** Set once status === "completed". Direct-download URL for the mp3. */
+  audioUrl?: string;
+  /** Reported by the API on failed jobs. */
+  errorMessage?: string;
+}
+
+export interface GenerateMusicOptions {
+  durationMs?: number;
+  outputFormat?: "mp3_44100_128" | "mp3_44100_192";
+}
+
+export function clampMusicDuration(durationSeconds: number): number {
+  if (!Number.isFinite(durationSeconds)) return 60;
+  return Math.max(MUSIC_BOUNDS.durationMin, Math.min(MUSIC_BOUNDS.durationMax, durationSeconds));
+}
+
+/**
+ * Submit a music-generation request. Returns the job id immediately so the
+ * caller can show progress. Caller must poll `getMusicJob` (or use
+ * `generateMusicAndWait`) to retrieve the audio.
+ */
+export async function generateMusic(
+  apiKey: string,
+  prompt: string,
+  opts: GenerateMusicOptions = {},
+): Promise<MusicJob> {
+  if (!prompt || !prompt.trim()) {
+    throw new ElevenLabsError("generateMusic: prompt is required");
+  }
+  const trimmed = prompt.trim();
+  if (trimmed.length > MUSIC_BOUNDS.promptMaxChars) {
+    throw new ElevenLabsError(
+      `generateMusic: prompt too long (max ${MUSIC_BOUNDS.promptMaxChars} chars)`,
+    );
+  }
+  const body: Record<string, unknown> = { prompt: trimmed };
+  if (typeof opts.durationMs === "number") {
+    body.music_length_ms = Math.round(
+      Math.max(
+        MUSIC_BOUNDS.durationMin * 1000,
+        Math.min(MUSIC_BOUNDS.durationMax * 1000, opts.durationMs),
+      ),
+    );
+  }
+  if (opts.outputFormat) body.output_format = opts.outputFormat;
+
+  const res = await fetch(`${API_BASE}/music`, {
+    method: "POST",
+    headers: {
+      "xi-api-key": apiKey,
+      "Content-Type": "application/json",
+      Accept: "application/json",
+    },
+    body: JSON.stringify(body),
+  });
+  if (!res.ok) {
+    let detail = "";
+    try {
+      const text = await res.text();
+      detail = text.length > 500 ? text.slice(0, 500) + "…" : text;
+    } catch {
+      /* ignore */
+    }
+    throw new ElevenLabsError(
+      `generateMusic: ${res.status} ${res.statusText}${detail ? ` — ${detail}` : ""}`,
+      res.status,
+    );
+  }
+  const json = (await res.json()) as {
+    music_id?: string;
+    status?: MusicJobStatus;
+    audio_url?: string;
+  };
+  if (!json.music_id) {
+    throw new ElevenLabsError("generateMusic: response missing music_id");
+  }
+  return {
+    id: json.music_id,
+    status: json.status ?? "processing",
+    ...(json.audio_url ? { audioUrl: json.audio_url } : {}),
+  };
+}
+
+export async function getMusicJob(apiKey: string, jobId: string): Promise<MusicJob> {
+  const res = await fetch(`${API_BASE}/music/${encodeURIComponent(jobId)}`, {
+    headers: { "xi-api-key": apiKey, Accept: "application/json" },
+  });
+  if (!res.ok) {
+    throw new ElevenLabsError(`getMusicJob: ${res.status} ${res.statusText}`, res.status);
+  }
+  const json = (await res.json()) as {
+    music_id?: string;
+    status?: MusicJobStatus;
+    audio_url?: string;
+    error_message?: string;
+  };
+  return {
+    id: json.music_id ?? jobId,
+    status: json.status ?? "processing",
+    ...(json.audio_url ? { audioUrl: json.audio_url } : {}),
+    ...(json.error_message ? { errorMessage: json.error_message } : {}),
+  };
+}
+
+/**
+ * Submit + poll until completed. Geometric backoff: 2s, 4s, 8s, max 30s.
+ * Total wait capped at `maxWaitMs` (default 5min). Throws ElevenLabsError on
+ * failure or timeout.
+ */
+export async function generateMusicAndWait(
+  apiKey: string,
+  prompt: string,
+  opts: GenerateMusicOptions & { maxWaitMs?: number; onProgress?: (job: MusicJob) => void } = {},
+): Promise<{ jobId: string; audioUrl: string }> {
+  const job = await generateMusic(apiKey, prompt, opts);
+  if (job.status === "completed" && job.audioUrl) {
+    return { jobId: job.id, audioUrl: job.audioUrl };
+  }
+  if (job.status === "failed") {
+    throw new ElevenLabsError(`generateMusic: job failed — ${job.errorMessage ?? "no detail"}`);
+  }
+  const maxWait = opts.maxWaitMs ?? 300_000;
+  const start = Date.now();
+  let delay = 2000;
+  while (Date.now() - start < maxWait) {
+    await new Promise((r) => setTimeout(r, delay));
+    delay = Math.min(delay * 2, 30_000);
+    const next = await getMusicJob(apiKey, job.id);
+    opts.onProgress?.(next);
+    if (next.status === "completed" && next.audioUrl) {
+      return { jobId: next.id, audioUrl: next.audioUrl };
+    }
+    if (next.status === "failed") {
+      throw new ElevenLabsError(`generateMusic: job failed — ${next.errorMessage ?? "no detail"}`);
+    }
+  }
+  throw new ElevenLabsError(
+    `generateMusic: timed out after ${maxWait}ms waiting for job ${job.id}`,
+  );
+}
+
+/**
+ * Download a completed job's mp3 bytes. The audio_url is signed and short-
+ * lived — call this immediately after `generateMusicAndWait` returns.
+ */
+export async function downloadMusic(audioUrl: string): Promise<Uint8Array> {
+  const res = await fetch(audioUrl);
+  if (!res.ok) {
+    throw new ElevenLabsError(`downloadMusic: ${res.status} ${res.statusText}`, res.status);
+  }
+  const bytes = new Uint8Array(await res.arrayBuffer());
+  return bytes;
+}
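
End-to-end usage of this client looks like the following sketch. The import path, prompt, and output location are illustrative assumptions, not part of the diff:

```ts
import { writeFileSync } from "node:fs";
// Assumed relative import; in-repo callers go through the package's index re-exports.
import { generateMusicAndWait, downloadMusic } from "./music.js";

async function makeUnderscore(apiKey: string): Promise<string> {
  const { jobId, audioUrl } = await generateMusicAndWait(
    apiKey,
    "Slow investigative underscore, muted strings, sparse piano",
    {
      durationMs: 45_000, // generateMusic clamps this into MUSIC_BOUNDS
      onProgress: (job) => console.log(`music ${job.id}: ${job.status}`),
    },
  );
  // The audio_url is signed and short-lived, so download before doing anything else.
  const bytes = await downloadMusic(audioUrl);
  const outPath = `assets/music/${jobId}.mp3`; // illustrative location
  writeFileSync(outPath, bytes);
  return outPath;
}
```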
diff --git a/packages/core/src/gemini/client.ts b/packages/core/src/gemini/client.ts
new file mode 100644
index 000000000..a595496c7
--- /dev/null
+++ b/packages/core/src/gemini/client.ts
@@ -0,0 +1,283 @@
+/**
+ * Gemini REST client — narrow surface for the two operations we actually use:
+ *   1. uploadFile(): push an mp4 / image to Gemini's Files API
+ *   2. generateStructured(): call generateContent with a function tool
+ *      and return the parsed input
+ *
+ * Mirrors the Anthropic client.ts shape so the studio routes have a uniform
+ * "callStructuredTool / callMultimodalStructured" surface for both providers.
+ *
+ * Why direct REST (no @google/genai SDK):
+ *  - The SDK pulls in a lot of code we don't need (gRPC fallbacks, Vertex AI
+ *    auth, batch APIs). For the two endpoints we use, fetch+JSON is ~80 lines.
+ *  - Lockstep version compatibility with Anthropic's pattern matters more
+ *    than SDK affordances we won't use.
+ */
+
+import { readFileSync, statSync } from "node:fs";
+import { basename } from "node:path";
+
+const API_BASE = "https://generativelanguage.googleapis.com/v1beta";
+const UPLOAD_BASE = "https://generativelanguage.googleapis.com/upload/v1beta";
+
+/** Default model for vision/video work. Flash is sufficient for retention
+ * review, scroll-test, and image analysis at our scope. Pro is reserved
+ * for multi-video comparison work that doesn't ship in this PR. */
+export const DEFAULT_GEMINI_MODEL = "gemini-2.5-flash";
+
+export class GeminiError extends Error {
+  status?: number;
+  constructor(message: string, status?: number) {
+    super(message);
+    this.name = "GeminiError";
+    this.status = status;
+  }
+}
+
+async function ensureOk(res: Response, label: string): Promise<void> {
+  if (res.ok) return;
+  let detail = "";
+  try {
+    const text = await res.text();
+    detail = text.length > 800 ? text.slice(0, 800) + "…" : text;
+  } catch {
+    /* ignore */
+  }
+  throw new GeminiError(
+    `${label}: ${res.status} ${res.statusText}${detail ? ` — ${detail}` : ""}`,
+    res.status,
+  );
+}
+
+// ── File upload ──────────────────────────────────────────────────────────────
+
+export interface UploadedFile {
+  /** "files/abc123" — used as `file_uri` in subsequent generateContent calls. */
+  uri: string;
+  /** Polled until "ACTIVE" before the file is usable in prompts. */
+  state: "PROCESSING" | "ACTIVE" | "FAILED";
+  mimeType: string;
+  name: string;
+  sizeBytes: number;
+}
+
+interface FilesApiResponse {
+  file?: {
+    name?: string;
+    uri?: string;
+    state?: "PROCESSING" | "ACTIVE" | "FAILED";
+    mimeType?: string;
+    sizeBytes?: string | number;
+  };
+}
+
+/**
+ * Upload a local file (mp4 / image) to Gemini's Files API. Uses the resumable
+ * protocol: one init request to negotiate, then one body POST. The studio
+ * server is on the trusted side of the project boundary, so we read the file
+ * synchronously — saves stream wiring we don't need.
+ *
+ * Caller must poll `getFile()` until state === "ACTIVE" before using the
+ * URI in a generateContent call. `uploadAndWait()` does that wait inline.
+ */
+export async function uploadFile(
+  apiKey: string,
+  filePath: string,
+  mimeType: string,
+): Promise<UploadedFile> {
+  const stat = statSync(filePath);
+  const sizeBytes = stat.size;
+  const displayName = basename(filePath);
+
+  // Step 1: init — get the upload URL.
+  const initRes = await fetch(`${UPLOAD_BASE}/files?key=${encodeURIComponent(apiKey)}`, {
+    method: "POST",
+    headers: {
+      "X-Goog-Upload-Protocol": "resumable",
+      "X-Goog-Upload-Command": "start",
+      "X-Goog-Upload-Header-Content-Length": String(sizeBytes),
+      "X-Goog-Upload-Header-Content-Type": mimeType,
+      "Content-Type": "application/json",
+    },
+    body: JSON.stringify({ file: { display_name: displayName } }),
+  });
+  await ensureOk(initRes, "uploadFile: init");
+  const uploadUrl = initRes.headers.get("X-Goog-Upload-URL");
+  if (!uploadUrl) {
+    throw new GeminiError("uploadFile: server did not return X-Goog-Upload-URL header");
+  }
+
+  // Step 2: upload the bytes. We POST the whole file at once — fine for the
+  // sub-100MB videos the studio renders.
+  const bytes = readFileSync(filePath);
+  const putRes = await fetch(uploadUrl, {
+    method: "POST",
+    headers: {
+      "Content-Length": String(sizeBytes),
+      "X-Goog-Upload-Offset": "0",
+      "X-Goog-Upload-Command": "upload, finalize",
+    },
+    body: new Uint8Array(bytes),
+  });
+  await ensureOk(putRes, "uploadFile: upload");
+  const json = (await putRes.json()) as FilesApiResponse;
+  if (!json.file?.uri) {
+    throw new GeminiError("uploadFile: response missing file.uri");
+  }
+  return {
+    uri: json.file.uri,
+    state: json.file.state ?? "PROCESSING",
+    mimeType: json.file.mimeType ?? mimeType,
+    name: json.file.name ?? "",
+    sizeBytes:
+      typeof json.file.sizeBytes === "number"
+        ? json.file.sizeBytes
+        : Number.parseInt(String(json.file.sizeBytes ?? sizeBytes), 10),
+  };
+}
+ */ +export async function uploadAndWait( + apiKey: string, + filePath: string, + mimeType: string, + opts: { maxWaitMs?: number } = {}, +): Promise { + const initial = await uploadFile(apiKey, filePath, mimeType); + if (initial.state === "ACTIVE") return initial; + if (initial.state === "FAILED") { + throw new GeminiError(`uploadFile: server reported FAILED for ${initial.name}`); + } + const maxWait = opts.maxWaitMs ?? 60_000; + const start = Date.now(); + let delay = 1000; + let last = initial; + while (Date.now() - start < maxWait) { + await new Promise((r) => setTimeout(r, delay)); + delay = Math.min(delay * 2, 30_000); + last = await getFile(apiKey, last.name); + if (last.state === "ACTIVE") return last; + if (last.state === "FAILED") { + throw new GeminiError(`uploadFile: server reported FAILED for ${last.name}`); + } + } + throw new GeminiError( + `uploadFile: timed out after ${maxWait}ms waiting for ${last.name} to reach ACTIVE`, + ); +} + +// ── Structured tool call ───────────────────────────────────────────────────── + +export interface ToolFunctionDeclaration { + name: string; + description: string; + parameters: Record; +} + +export interface GenerateContentUsage { + promptTokenCount?: number; + candidatesTokenCount?: number; + totalTokenCount?: number; +} + +interface GenerateContentResponse { + candidates?: Array<{ + content?: { + parts?: Array<{ + functionCall?: { + name: string; + args: unknown; + }; + text?: string; + }>; + }; + finishReason?: string; + }>; + usageMetadata?: GenerateContentUsage; +} + +export interface GeminiPart { + text?: string; + fileData?: { fileUri: string; mimeType: string }; + inlineData?: { mimeType: string; data: string }; // base64 +} + +/** + * Call Gemini's generateContent endpoint with a single function declaration. + * The model is forced to call the function; we parse and return its args. + * + * Mirrors callStructuredTool() from anthropic/client.ts so the storyline + * routes can swap providers per task without learning two prompt shapes. + */ +export async function generateStructured( + apiKey: string, + opts: { + model?: string; + parts: GeminiPart[]; + systemInstruction?: string; + tool: ToolFunctionDeclaration; + temperature?: number; + maxOutputTokens?: number; + }, +): Promise<{ result: T; usage: GenerateContentUsage }> { + const model = opts.model ?? DEFAULT_GEMINI_MODEL; + const url = `${API_BASE}/models/${encodeURIComponent(model)}:generateContent?key=${encodeURIComponent(apiKey)}`; + const body: Record = { + contents: [{ role: "user", parts: opts.parts }], + tools: [{ functionDeclarations: [opts.tool] }], + toolConfig: { + functionCallingConfig: { mode: "ANY", allowedFunctionNames: [opts.tool.name] }, + }, + generationConfig: { + temperature: opts.temperature ?? 0.4, + maxOutputTokens: opts.maxOutputTokens ?? 
+  if (opts.systemInstruction && opts.systemInstruction.trim().length > 0) {
+    body.systemInstruction = { parts: [{ text: opts.systemInstruction }] };
+  }
+
+  const res = await fetch(url, {
+    method: "POST",
+    headers: { "Content-Type": "application/json" },
+    body: JSON.stringify(body),
+  });
+  await ensureOk(res, "generateStructured");
+  const json = (await res.json()) as GenerateContentResponse;
+  const candidate = json.candidates?.[0];
+  const fnCall = candidate?.content?.parts?.find((p) => p.functionCall);
+  if (!fnCall?.functionCall || fnCall.functionCall.name !== opts.tool.name) {
+    throw new GeminiError(
+      `generateStructured: model did not return a "${opts.tool.name}" function call; finishReason=${candidate?.finishReason ?? "unknown"}`,
+    );
+  }
+  return {
+    result: fnCall.functionCall.args as T,
+    usage: json.usageMetadata ?? {},
+  };
+}
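
The two halves compose like this in a caller. A sketch only: the tool schema, prompt, and result shape below are illustrative, not part of the diff:

```ts
import { uploadAndWait, generateStructured } from "./client.js";

// Hypothetical result shape; the real review tools live in the studio routes.
interface RetentionReport {
  score: number;
  notes: string;
}

async function reviewRetention(apiKey: string, videoPath: string): Promise<RetentionReport> {
  // Blocks until the file reaches ACTIVE (throws on FAILED or timeout).
  const file = await uploadAndWait(apiKey, videoPath, "video/mp4");

  const { result, usage } = await generateStructured<RetentionReport>(apiKey, {
    parts: [
      { fileData: { fileUri: file.uri, mimeType: file.mimeType } },
      { text: "Review this video for retention. Where do viewers likely drop off?" },
    ],
    tool: {
      name: "report_retention",
      description: "Report a retention score and reviewer notes for the video.",
      parameters: {
        type: "object",
        properties: {
          score: { type: "number", description: "0-100 retention score" },
          notes: { type: "string" },
        },
        required: ["score", "notes"],
      },
    },
  });
  console.log(`retention review used ${usage.totalTokenCount ?? "?"} tokens`);
  return result;
}
```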
diff --git a/packages/core/src/gemini/env.ts b/packages/core/src/gemini/env.ts
new file mode 100644
index 000000000..cf7473e15
--- /dev/null
+++ b/packages/core/src/gemini/env.ts
@@ -0,0 +1,40 @@
+import {
+  loadKey,
+  getKeyStatus,
+  writeKeyToEnvFile,
+  type KeySource,
+  type KeyStatus,
+} from "../secrets/envKey.js";
+
+/**
+ * Gemini API key loader. Mirrors the Anthropic env loader so the studio
+ * key panel can present both keys with the same UX.
+ *
+ * Looked-up names in priority order:
+ *   1. process.env.GEMINI_API_KEY
+ *   2. <projectDir>/.env GEMINI_API_KEY
+ *   3. ~/.config/hyperframes/global.env GEMINI_API_KEY
+ *
+ * Google's docs sometimes use GOOGLE_API_KEY for the same key — we accept
+ * the canonical GEMINI_API_KEY here and let users alias if needed. Keeping
+ * to one name avoids the "I set the wrong env var" debugging trap.
+ */
+
+const KEY_NAME = "GEMINI_API_KEY";
+
+export type GeminiKeySource = KeySource;
+export type GeminiKeyStatus = KeyStatus;
+
+export function loadGeminiKey(projectDir?: string): string | null {
+  return loadKey(KEY_NAME, projectDir);
+}
+
+export function getGeminiKeyStatus(projectDir?: string): GeminiKeyStatus {
+  return getKeyStatus(KEY_NAME, projectDir);
+}
+
+export function writeGeminiKeyToEnvFile(envPath: string, value: string | null): void {
+  writeKeyToEnvFile(envPath, KEY_NAME, value);
+}
+
+export const GEMINI_KEY_NAME = KEY_NAME;
diff --git a/packages/core/src/gemini/index.ts b/packages/core/src/gemini/index.ts
new file mode 100644
index 000000000..46cf22901
--- /dev/null
+++ b/packages/core/src/gemini/index.ts
@@ -0,0 +1,21 @@
+export {
+  loadGeminiKey,
+  getGeminiKeyStatus,
+  writeGeminiKeyToEnvFile,
+  GEMINI_KEY_NAME,
+} from "./env.js";
+export type { GeminiKeySource, GeminiKeyStatus } from "./env.js";
+export {
+  uploadFile,
+  uploadAndWait,
+  getFile,
+  generateStructured,
+  GeminiError,
+  DEFAULT_GEMINI_MODEL,
+} from "./client.js";
+export type {
+  UploadedFile,
+  ToolFunctionDeclaration,
+  GenerateContentUsage,
+  GeminiPart,
+} from "./client.js";
diff --git a/packages/core/src/script/assemble.ts b/packages/core/src/script/assemble.ts
index 8412b9731..42bccb752 100644
--- a/packages/core/src/script/assemble.ts
+++ b/packages/core/src/script/assemble.ts
@@ -9,6 +9,7 @@ import type { PlannedScene, PlannedScript, SceneTransition } from "./types.js";
 import type { ImageEntry, ImageManifest } from "../images/index.js";
 import type { VisualDirectionPlan } from "./visualDirector.js";
 import { readSfxManifest, resolveSfxStartForScene, type SfxEntry } from "./sfx/manifest.js";
+import { readMusicManifest, resolveMusicSpan, type SceneSpan } from "./music/manifest.js";
 
 export interface AssembleOptions {
   projectDir: string;
@@ -87,6 +88,12 @@ export function assembleMaster(planned: PlannedScript, opts: AssembleOptions): A
     list.push(entry);
     sfxBySceneId.set(entry.sceneId, list);
   }
+
+  // Music manifest: read here, emit AFTER the scene loop so we know each
+  // scene's absolute cursor position. Music tracks span multiple scenes so
+  // they need the full scene-span table to compute start + declared duration.
+  const musicManifest = readMusicManifest(opts.projectDir);
+  const sceneSpansForMusic: SceneSpan[] = [];
   const sceneVisibility: Array<{
     id: string;
     start: number;
@@ -223,10 +230,28 @@ export function assembleMaster(planned: PlannedScript, opts: AssembleOptions): A
       transitionIn,
       transitionInMs,
     });
+    sceneSpansForMusic.push({ id: scene.id, start: cursor, duration: sceneTotal });
     cursor += sceneTotal;
   }
 
   const total = cursor;
+
+  // Music tracks land on track 2. Each track's window comes from
+  // resolveMusicSpan (start = first covered scene, duration = audio length
+  // capped to covered span). Volume + duck attributes go to the producer's
+  // audio mixer at render time.
+  for (const entry of musicManifest.entries) {
+    const span = resolveMusicSpan(entry, sceneSpansForMusic, total);
+    if (span.declaredDuration <= 0) continue;
+    const labelAttr = entry.label ? ` data-timeline-label="${escapeAttr(entry.label)}"` : "";
+    const volumeAttr =
+      typeof entry.volumeDb === "number" ? ` data-volume-db="${entry.volumeDb.toFixed(1)}"` : "";
+    const duckAttr =
+      typeof entry.duckDb === "number" ? ` data-music-duck-db="${entry.duckDb.toFixed(1)}"` : "";
+    audioTags.push(
+      `<audio data-track="2" src="${escapeAttr(entry.path)}" data-start="${span.start.toFixed(2)}" data-duration="${span.declaredDuration.toFixed(2)}"${labelAttr}${volumeAttr}${duckAttr}></audio>`,
+    );
+  }
 
   const title = planned.meta.title ? escapeText(planned.meta.title) : "HyperFrames Video";
   // The hyperframes runtime composes its own master from <audio> elements with
diff --git a/packages/core/src/script/music/manifest.test.ts b/packages/core/src/script/music/manifest.test.ts
new file mode 100644
index 000000000..fcbf2d117
--- /dev/null
+++ b/packages/core/src/script/music/manifest.test.ts
@@ -0,0 +1,76 @@
+import { describe, it, expect } from "vitest";
+import { resolveMusicSpan, type MusicEntry, type SceneSpan } from "./manifest";
+
+const baseEntry: Pick<MusicEntry, "scenesCovered" | "durationSeconds"> = {
+  scenesCovered: [],
+  durationSeconds: 60,
+};
+
+const SCENES: SceneSpan[] = [
+  { id: "s01", start: 0, duration: 5 },
+  { id: "s02", start: 5, duration: 8 },
+  { id: "s03", start: 13, duration: 6 },
+  { id: "s04", start: 19, duration: 4 },
+];
+const TOTAL = 23;
+
+describe("resolveMusicSpan", () => {
+  it("empty scenesCovered = full-video span, capped at video length", () => {
+    expect(resolveMusicSpan({ scenesCovered: [], durationSeconds: 30 }, SCENES, TOTAL)).toEqual({
+      start: 0,
+      declaredDuration: 23,
+    });
+  });
+
+  it("empty scenesCovered with audio shorter than total stays at audio length", () => {
+    expect(resolveMusicSpan({ scenesCovered: [], durationSeconds: 10 }, SCENES, TOTAL)).toEqual({
+      start: 0,
+      declaredDuration: 10,
+    });
+  });
+
+  it("single-scene cover spans that scene only", () => {
+    expect(resolveMusicSpan({ ...baseEntry, scenesCovered: ["s02"] }, SCENES, TOTAL)).toEqual({
+      start: 5,
+      declaredDuration: 8,
+    });
+  });
+
+  it("contiguous multi-scene cover spans first start to last end", () => {
+    // s02 starts at 5, s03 ends at 19 → start=5, duration=14
+    expect(
+      resolveMusicSpan({ scenesCovered: ["s02", "s03"], durationSeconds: 60 }, SCENES, TOTAL),
+    ).toEqual({ start: 5, declaredDuration: 14 });
+  });
+
+  it("non-contiguous cover (s01 + s04) spans the outer hull", () => {
+    // s01 starts at 0, s04 ends at 23 → start=0, duration=23
+    expect(
+      resolveMusicSpan({ scenesCovered: ["s01", "s04"], durationSeconds: 60 }, SCENES, TOTAL),
+    ).toEqual({ start: 0, declaredDuration: 23 });
+  });
+
+  it("scenesCovered referencing unknown ids falls back to full video", () => {
+    expect(
+      resolveMusicSpan({ scenesCovered: ["doesnt-exist"], durationSeconds: 30 }, SCENES, TOTAL),
+    ).toEqual({ start: 0, declaredDuration: 23 });
+  });
+
+  it("audio longer than covered scenes clips to covered duration", () => {
+    expect(
+      resolveMusicSpan({ scenesCovered: ["s01"], durationSeconds: 60 }, SCENES, TOTAL),
+    ).toEqual({ start: 0, declaredDuration: 5 });
+  });
+
+  it("audio shorter than covered scenes uses audio length", () => {
+    expect(
+      resolveMusicSpan({ scenesCovered: ["s01", "s02", "s03"], durationSeconds: 7 }, SCENES, TOTAL),
+    ).toEqual({ start: 0, declaredDuration: 7 });
+  });
+
+  it("scenesCovered out of order resolves correctly (uses min/max not first/last)", () => {
+    expect(
+      resolveMusicSpan({ scenesCovered: ["s04", "s02"], durationSeconds: 60 }, SCENES, TOTAL),
+    ).toEqual({ start: 5, declaredDuration: 18 });
+  });
+});
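
For reference, here is what a populated `music.manifest.json` looks like on disk, expressed as a typed literal rather than raw JSON. All values are made up:

```ts
import type { MusicManifest } from "./manifest.js";

// Illustrative manifest contents; ids, prompts, and levels are invented.
const exampleManifest: MusicManifest = {
  version: 1,
  entries: [
    {
      id: "music-0001",
      prompt: "Slow investigative underscore, muted strings, sparse piano",
      path: "assets/music/music-0001.mp3",
      durationSeconds: 42.5,
      scenesCovered: ["s02", "s03"],
      role: "underscore",
      label: "investigative bed",
      volumeDb: -6,
      duckDb: -12,
      createdAt: "2025-01-15T12:00:00.000Z",
    },
  ],
};
```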
diff --git a/packages/core/src/script/music/manifest.ts b/packages/core/src/script/music/manifest.ts
new file mode 100644
index 000000000..937f040db
--- /dev/null
+++ b/packages/core/src/script/music/manifest.ts
@@ -0,0 +1,157 @@
+import { existsSync, mkdirSync, readFileSync, writeFileSync } from "node:fs";
+import { dirname, join } from "node:path";
+
+/**
+ * Music manifest — lives at `<projectDir>/assets/music/music.manifest.json`.
+ * Mirrors the SFX manifest pattern with one structural difference: a music
+ * track spans MULTIPLE scenes (an underscore covers a whole act, a stinger
+ * covers a single transition). Anchoring is therefore a `scenesCovered: []`
+ * array instead of a single anchor.
+ *
+ * The assembler computes the absolute start/end on the master timeline by
+ * looking up the first and last scene's cumulative offsets. Each track's
+ * audio file lives at `assets/music/<id>.mp3` next to the manifest.
+ */
+
+export const MUSIC_DIR = "assets/music";
+export const MUSIC_MANIFEST = "music.manifest.json";
+export const MUSIC_MANIFEST_VERSION = 1;
+
+export type MusicRole = "underscore" | "stinger" | "intro" | "outro";
+
+export interface MusicEntry {
+  id: string;
+  /** Text prompt sent to ElevenLabs. Surfaced in the studio for context. */
+  prompt: string;
+  /** Path under the project root: `assets/music/<id>.mp3`. */
+  path: string;
+  /** Measured length of the file (seconds). The assembler uses this directly
+   * as `data-duration` so the timeline shows the real footprint. */
+  durationSeconds: number;
+  /** Ordered scene ids the track plays under. Empty list = whole video. */
+  scenesCovered: string[];
+  /** Loose tag for UI grouping. Doesn't affect playback. */
+  role: MusicRole;
+  /** Optional human label (e.g. "investigative bed"). Defaults to a prompt
+   * truncation when not supplied. */
+  label?: string;
+  /** Volume in dB. Default 0 (full). The producer's audio mixer reads
+   * data-volume-db to apply this at render time. */
+  volumeDb?: number;
+  /** Sidechain duck depth in dB applied during voiceover windows. -12 is the
+   * default for cinematic reels — voiceover stays clear without making the
+   * music feel cut. */
+  duckDb?: number;
+  /** ISO timestamp the entry was created. */
+  createdAt: string;
+}
+
+export interface MusicManifest {
+  version: number;
+  entries: MusicEntry[];
+}
+
+export function emptyManifest(): MusicManifest {
+  return { version: MUSIC_MANIFEST_VERSION, entries: [] };
+}
+
+export function readMusicManifest(projectDir: string): MusicManifest {
+  const path = join(projectDir, MUSIC_DIR, MUSIC_MANIFEST);
+  if (!existsSync(path)) return emptyManifest();
+  try {
+    const raw = JSON.parse(readFileSync(path, "utf-8")) as Partial<MusicManifest>;
+    if (!raw || typeof raw !== "object") return emptyManifest();
+    const entries = Array.isArray(raw.entries) ? raw.entries.filter(isValidEntry) : [];
+    return { version: MUSIC_MANIFEST_VERSION, entries };
+  } catch {
+    return emptyManifest();
+  }
+}
+
+export function writeMusicManifest(projectDir: string, manifest: MusicManifest): void {
+  const path = join(projectDir, MUSIC_DIR, MUSIC_MANIFEST);
+  mkdirSync(dirname(path), { recursive: true });
+  writeFileSync(path, JSON.stringify(manifest, null, 2) + "\n");
+}
+
+export function appendMusicEntry(projectDir: string, entry: MusicEntry): MusicManifest {
+  const manifest = readMusicManifest(projectDir);
+  manifest.entries.push(entry);
+  writeMusicManifest(projectDir, manifest);
+  return manifest;
+}
+
+export function removeMusicEntry(projectDir: string, entryId: string): MusicManifest {
+  const manifest = readMusicManifest(projectDir);
+  manifest.entries = manifest.entries.filter((e) => e.id !== entryId);
+  writeMusicManifest(projectDir, manifest);
+  return manifest;
+}
+
+function isValidEntry(value: unknown): value is MusicEntry {
+  if (!value || typeof value !== "object") return false;
+  const e = value as Record<string, unknown>;
+  return (
+    typeof e.id === "string" &&
+    typeof e.prompt === "string" &&
+    typeof e.path === "string" &&
+    typeof e.durationSeconds === "number" &&
+    Array.isArray(e.scenesCovered) &&
+    e.scenesCovered.every((s: unknown) => typeof s === "string") &&
+    typeof e.role === "string" &&
+    typeof e.createdAt === "string"
+  );
+}
+
+/**
+ * Compute a music track's absolute start time + the duration the assembler
+ * should declare on its `<audio>` tag.
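
The diff is cut off above mid-docstring: `resolveMusicSpan` itself and the `SceneSpan` interface it consumes are missing from this excerpt. Their behavior is fully pinned down by `manifest.test.ts`; below is a sketch that satisfies those tests, though the shipped implementation may differ in detail:

```ts
// Reconstructed sketch, not the shipped code; derived from manifest.test.ts.
export interface SceneSpan {
  id: string;
  start: number; // absolute seconds on the master timeline
  duration: number; // seconds
}

export function resolveMusicSpan(
  entry: Pick<MusicEntry, "scenesCovered" | "durationSeconds">,
  scenes: SceneSpan[],
  totalDuration: number,
): { start: number; declaredDuration: number } {
  const covered = scenes.filter((s) => entry.scenesCovered.includes(s.id));
  // Empty scenesCovered, or ids that match nothing, falls back to the whole video.
  if (covered.length === 0) {
    return { start: 0, declaredDuration: Math.min(entry.durationSeconds, totalDuration) };
  }
  // Outer hull of the covered scenes: min start to max end, so out-of-order
  // and non-contiguous lists resolve the same way.
  const start = Math.min(...covered.map((s) => s.start));
  const end = Math.max(...covered.map((s) => s.start + s.duration));
  return { start, declaredDuration: Math.min(entry.durationSeconds, end - start) };
}
```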