feat: separate UI choices from AI image (bypass vision)

HTML choice buttons now call /api/interact directly, bypassing the ~4s Vision roundtrip. Free-form background clicks still go through Vision as before.
This commit is contained in:
Qi Chen
2026-05-25 20:47:33 +08:00
committed by GitHub
parent bf8f356e37
commit d116c2e3b5
3 changed files with 314 additions and 99 deletions
+207 -9
View File
@@ -1,28 +1,124 @@
"use client";
import { useRef, useState } from "react";
import { useEffect, useRef, useState } from "react";
import type { StoryFrame } from "@yume/types";
export type Phase = "loading-first" | "ready" | "interacting";
const SHADOW =
"0 1px 0 rgba(45,24,16,0.05), 0 36px 64px -28px rgba(45,24,16,0.25), 0 8px 18px -6px rgba(45,24,16,0.10)";
// ── Typewriter hook ────────────────────────────────────────────────────
function useTypewriter(text: string, speed = 28): string {
const [displayed, setDisplayed] = useState("");
const textRef = useRef(text);
useEffect(() => {
// Reset immediately when the text changes
setDisplayed("");
textRef.current = text;
if (!text) return;
let i = 0;
const id = setInterval(() => {
i += 1;
setDisplayed(text.slice(0, i));
if (i >= text.length) clearInterval(id);
}, speed);
return () => clearInterval(id);
}, [text, speed]);
return displayed;
}
// ── Choice button ──────────────────────────────────────────────────────
function ChoiceButton({
index,
label,
disabled,
onClick,
}: {
index: number;
label: string;
disabled: boolean;
onClick: () => void;
}) {
return (
<button
type="button"
disabled={disabled}
onClick={onClick}
className="group relative flex-1 min-w-0 px-4 py-3 text-left transition-all duration-200
disabled:opacity-50 disabled:cursor-wait"
style={{
background: "rgba(20, 14, 8, 0.68)",
border: "1.5px solid rgba(180, 140, 80, 0.65)",
borderRadius: "6px",
backdropFilter: "blur(8px)",
WebkitBackdropFilter: "blur(8px)",
boxShadow: "0 2px 12px rgba(0,0,0,0.4), inset 0 1px 0 rgba(200,165,90,0.12)",
}}
>
{/* Hover shimmer overlay */}
<span
className="absolute inset-0 rounded-[5px] opacity-0 group-hover:opacity-100 transition-opacity duration-200 pointer-events-none"
style={{
background: "rgba(180,140,60,0.10)",
border: "1.5px solid rgba(200,165,90,0.85)",
}}
/>
<span className="relative flex items-baseline gap-2">
<span
className="shrink-0 font-serif text-[11px] num"
style={{ color: "rgba(195,155,75,0.9)" }}
>
{index + 1}.
</span>
<span
className="font-serif text-[13px] md:text-[14px] leading-snug"
style={{ color: "rgba(245,235,210,0.95)" }}
>
{label}
</span>
</span>
</button>
);
}
// ── Main component ─────────────────────────────────────────────────────
export function PlayCanvas({
imageBase64,
phase,
frame,
pendingClick,
onClick,
onSelectChoice,
fullViewport = false,
}: {
imageBase64: string | null;
phase: Phase;
frame: StoryFrame | null;
pendingClick: { x: number; y: number } | null;
onClick: (click: { x: number; y: number }) => void;
onSelectChoice?: (choiceId: string, label: string) => void;
fullViewport?: boolean;
}) {
const imgRef = useRef<HTMLImageElement>(null);
const [dims, setDims] = useState<{ w: number; h: number } | null>(null);
const choices = frame?.uiElements.filter((e) => e.kind === "choice") ?? [];
const dialogueText = frame
? [frame.speaker ? `${frame.speaker}${frame.line ?? ""}` : frame.line, frame.narration]
.filter(Boolean)
.join("\n")
: "";
const narrationOnly = !frame?.speaker && !frame?.line && !!frame?.narration;
const displayBody = frame?.speaker
? frame.line ?? ""
: frame?.narration ?? "";
const typedBody = useTypewriter(displayBody, 30);
function handleClick(e: React.MouseEvent<HTMLImageElement>) {
if (phase !== "ready" || !imgRef.current) return;
const rect = imgRef.current.getBoundingClientRect();
@@ -37,16 +133,13 @@ export function PlayCanvas({
const interactive = phase === "ready" && !!imageBase64;
const dimmed = phase === "interacting";
// 16:9 sizing — letterbox into available viewport
const sizeStyle = fullViewport
? { maxWidth: "100vw", maxHeight: "100dvh" }
: { maxWidth: "96vw", maxHeight: "calc(100dvh - 280px)" };
: { maxWidth: "96vw", maxHeight: "calc(100dvh - 200px)" };
// Placeholder needs an explicit width for aspect-video to compute height.
// Pick the largest 16:9 box that fits in the available viewport.
const placeholderWidth = fullViewport
? "min(100vw, calc(100dvh * 16 / 9))"
: "min(96vw, calc((100dvh - 280px) * 16 / 9))";
: "min(96vw, calc((100dvh - 200px) * 16 / 9))";
return (
<div
@@ -57,6 +150,7 @@ export function PlayCanvas({
className="relative inline-block"
style={{ boxShadow: fullViewport ? "none" : SHADOW }}
>
{/* ── Background image ── */}
<img
key={imageBase64.slice(-48)}
ref={imgRef}
@@ -68,17 +162,121 @@ export function PlayCanvas({
setDims({ w: img.naturalWidth, h: img.naturalHeight });
}}
draggable={false}
className={`block w-auto h-auto select-none animate-fade-in transition-opacity duration-700 ease-out ${interactive ? "cursor-pointer" : "cursor-wait"} ${dimmed ? "opacity-30" : "opacity-100"}`}
className={`block w-auto h-auto select-none animate-fade-in transition-opacity duration-700 ease-out ${
interactive ? "cursor-pointer" : "cursor-wait"
} ${dimmed ? "opacity-40" : "opacity-100"}`}
style={sizeStyle}
/>
{/* ── Top/bottom gradient vignette ── */}
{!fullViewport && (
<>
<div className="absolute inset-x-0 top-0 h-10 bg-gradient-to-b from-clay-900/12 to-transparent pointer-events-none" />
<div className="absolute inset-x-0 bottom-0 h-10 bg-gradient-to-t from-clay-900/12 to-transparent pointer-events-none" />
</>
)}
{/* ══════════════════════════════════════════════════════════
PREFAB UI OVERLAY — rendered on top of image
══════════════════════════════════════════════════════════ */}
{frame && (
<div className="absolute inset-0 flex flex-col justify-end pointer-events-none select-none">
{/* ── Choices row ── */}
{choices.length > 0 && (
<div
className="pointer-events-auto px-[3%] pb-[1.5%] flex gap-[1.5%] items-stretch"
>
{choices.map((choice, i) => (
<ChoiceButton
key={choice.id}
index={i}
label={choice.label}
disabled={phase !== "ready"}
onClick={() => onSelectChoice?.(choice.id, choice.label)}
/>
))}
</div>
)}
{/* ── Dialogue / narration box ── */}
{(frame.narration || frame.line) && (
<div
className="pointer-events-none mx-[2%] mb-[2%] px-[3%] py-[2.2%] relative"
style={{
background: "rgba(14, 10, 6, 0.72)",
border: "1.5px solid rgba(175, 138, 72, 0.60)",
borderRadius: "6px",
backdropFilter: "blur(10px)",
WebkitBackdropFilter: "blur(10px)",
boxShadow:
"0 4px 24px rgba(0,0,0,0.55), inset 0 1px 0 rgba(200,165,90,0.10)",
}}
>
{/* Inner golden corner decoration */}
<span
className="absolute top-[6px] left-[8px] text-[10px] opacity-40 pointer-events-none"
style={{ color: "rgba(195,155,75,1)" }}
aria-hidden
>
</span>
<span
className="absolute top-[6px] right-[8px] text-[10px] opacity-40 pointer-events-none"
style={{ color: "rgba(195,155,75,1)" }}
aria-hidden
>
</span>
{/* Speaker name tag */}
{frame.speaker && (
<p
className="font-serif text-[11px] md:text-[12px] smallcaps mb-[0.6em]"
style={{ color: "rgba(205,165,90,0.92)" }}
>
{frame.speaker}
</p>
)}
{/* Main text */}
<p
className="font-serif leading-[1.85] text-[13px] md:text-[15px]"
style={{ color: "rgba(245,235,210,0.95)" }}
>
{typedBody}
{/* Narration only — also show secondary line */}
{frame.speaker && frame.narration && (
<span
className="block mt-[0.5em] italic text-[12px] md:text-[13px]"
style={{ color: "rgba(200,185,155,0.78)" }}
>
{frame.narration}
</span>
)}
</p>
{/* Scroll hint ▼ */}
<span
className="absolute bottom-[6px] right-[10px] text-[10px] animate-slow-pulse"
style={{ color: "rgba(195,155,75,0.7)" }}
aria-hidden
>
</span>
</div>
)}
</div>
)}
{/* Loading/interacting dim overlay */}
{phase === "interacting" && (
<div className="absolute inset-0 flex items-center justify-center pointer-events-none">
<p className="text-[10px] smallcaps text-cream-50/70 animate-slow-pulse">
AI · · · · · · ·
</p>
</div>
)}
{/* Click ripple indicator */}
{pendingClick && (
<>
<div
@@ -133,7 +331,7 @@ export function PlayCanvas({
{dims ? `${dims.w} × ${dims.h} · png` : "—"}
</span>
<span className="text-[9px] smallcaps text-clay-400">
{phase === "ready" ? "任 · 意 · 点 · 击" : "···"}
{phase === "ready" ? (choices.length > 0 ? "选 · 择 · 一 · 项" : "任 · 意 · 点 · 击") : "···"}
</span>
</div>
)}