addbede929
- Move vercel.json to apps/web/ with correct route paths; cap scene route
maxDuration 120→60s for Hobby. Root vercel.json removed. Vercel project's
Root Directory must be set to apps/web (Deploy button URL passes this).
- Switch image transport from base64-in-JSON to Runware-hosted URLs:
generateImage now uses outputType=URL and returns {imageUrl, imageUuid};
StartResponse/SceneResponse carry imageUrl; VisionRequest carries
prevImageUrl (server re-fetches the bytes for click annotation). This
eliminates the 4.5MB serverless body-size risk.
- Painter and director prefer URL over UUID for referenceImages — the UUID
returned by Runware imageInference isn't always recognized in the refs
pipeline (surfaces as `failedToTransferImage`).
- Client preloads scene images via `new Image().decode()` before committing
to React state, so URL transitions render instantly; prefetched scenes
also warm the HTTP cache.
- jsonParser uses the jsonrepair package (replaces hand-rolled repair) and
adds a targeted preRepair regex for the missing-key-close-quote pattern
that jsonrepair couldn't disambiguate. Full raw model output dumped on
failure for diagnostic visibility.
- Default text provider switched to DeepSeek v4-flash via direct API
(significantly more stable JSON than MiMo v2.5-pro). VISION/TTS stay on
MiMo (DeepSeek has no multimodal / TTS offerings).
- next.config: drop dead experimental.serverActions.bodySizeLimit (no
server actions used).
- README: real Deploy button URL (zonghaoyuan/yume + root-directory=apps/web
+ TTS/MOCK_IMAGE in env list); refreshed env vars table with optional
TTS section.
Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
131 lines
4.5 KiB
TypeScript
131 lines
4.5 KiB
TypeScript
import type { ProviderConfig } from "@yume/types";
|
||
import { fetchWithRetry } from "./fetchWithRetry";
|
||
|
||
// Runware uses its own task-array protocol (not OpenAI-compatible).
|
||
// POST <baseUrl> with [{ taskType: "imageInference", ... }]; errors come
|
||
// back as a 200 with `errors[]`, so we have to inspect the body either way.
|
||
//
|
||
// referenceImages accepts UUIDs, public URLs, or base64. UUID is cheapest
|
||
// in transport cost; URL is next; base64 last resort. The FLUX.2 [klein] 9B
|
||
// KV variant (runware:400@6) accelerates multi-reference inference ~2.5× via
|
||
// its KV cache for reference latents (cached only within one inference run,
|
||
// not persisted across calls — hence the need to keep stable UUIDs/URLs for
|
||
// later reuse).
|
||
//
|
||
// We request outputType=URL so Runware persists the image and returns a CDN
|
||
// link the client can render directly. The same response also carries the
|
||
// image UUID, so we never need a separate uploadImage round-trip to anchor
|
||
// future referenceImages.
|
||
const DEFAULT_IMG2IMG_STRENGTH = 0.85;
|
||
const MAX_REFERENCE_IMAGES = 4;
|
||
|
||
type RunwareImageResult = {
|
||
imageURL?: string;
|
||
imageUUID?: string;
|
||
};
|
||
type RunwareError = {
|
||
code?: string;
|
||
message?: string;
|
||
parameter?: string;
|
||
};
|
||
type RunwareResponse = {
|
||
data?: RunwareImageResult[];
|
||
errors?: RunwareError[];
|
||
};
|
||
|
||
export type GenerateImageOptions = {
|
||
/**
|
||
* Reference image (UUID, public URL, or base64) for img2img. When set,
|
||
* FLUX preserves the seed image's composition and applies `strength` to
|
||
* deviate. NOTE: FLUX.2 [klein] 9B KV does NOT support seedImage — use
|
||
* `referenceImages` for visual continuity instead.
|
||
*/
|
||
seedImage?: string;
|
||
/**
|
||
* Reference images (UUIDs, URLs, or base64) to condition generation on —
|
||
* typically character portraits + the prior scene image. Runware caps at 4;
|
||
* we silently truncate beyond that.
|
||
*/
|
||
referenceImages?: string[];
|
||
/** 0–1, FLUX needs ≥ 0.8 to actually have an effect. */
|
||
strength?: number;
|
||
};
|
||
|
||
export type GenerateImageResult = {
|
||
/** Public CDN URL of the generated image (Runware-hosted). */
|
||
imageUrl: string;
|
||
/** Stable UUID for cheap re-reference in later `referenceImages`. */
|
||
imageUuid: string;
|
||
};
|
||
|
||
// ──────────────────────────────────────────────────────────────────────
|
||
// generateImage — text-to-image (default) or referenceImages-conditioned.
|
||
// Returns both the public URL (for client display + future references)
|
||
// and the UUID (cheapest reference form for subsequent calls).
|
||
// ──────────────────────────────────────────────────────────────────────
|
||
|
||
export async function generateImage(
|
||
config: ProviderConfig,
|
||
prompt: string,
|
||
options?: GenerateImageOptions,
|
||
): Promise<GenerateImageResult> {
|
||
const url = config.baseUrl.replace(/\/$/, "");
|
||
|
||
const task: Record<string, unknown> = {
|
||
taskType: "imageInference",
|
||
taskUUID: crypto.randomUUID(),
|
||
model: config.model,
|
||
positivePrompt: prompt,
|
||
width: 1792,
|
||
height: 1024,
|
||
steps: 4,
|
||
CFGScale: 3.5,
|
||
numberResults: 1,
|
||
outputType: "URL",
|
||
outputFormat: "PNG",
|
||
includeCost: false,
|
||
};
|
||
|
||
if (options?.seedImage) {
|
||
task.seedImage = options.seedImage;
|
||
task.strength = options.strength ?? DEFAULT_IMG2IMG_STRENGTH;
|
||
}
|
||
|
||
if (options?.referenceImages?.length) {
|
||
task.referenceImages = options.referenceImages.slice(0, MAX_REFERENCE_IMAGES);
|
||
}
|
||
|
||
const res = await fetchWithRetry(url, {
|
||
method: "POST",
|
||
headers: {
|
||
"Content-Type": "application/json",
|
||
Authorization: `Bearer ${config.apiKey}`,
|
||
},
|
||
body: JSON.stringify([task]),
|
||
});
|
||
|
||
const text = await res.text();
|
||
let json: RunwareResponse;
|
||
try {
|
||
json = JSON.parse(text) as RunwareResponse;
|
||
} catch {
|
||
throw new Error(`Image API error ${res.status}: ${text.slice(0, 500)}`);
|
||
}
|
||
|
||
if (json.errors?.length) {
|
||
const e = json.errors[0]!;
|
||
throw new Error(
|
||
`Runware error [${e.code ?? "unknown"}]: ${e.message ?? "no message"}` +
|
||
(e.parameter ? ` (parameter: ${e.parameter})` : ""),
|
||
);
|
||
}
|
||
|
||
const result = json.data?.[0];
|
||
const imageUrl = result?.imageURL;
|
||
const imageUuid = result?.imageUUID;
|
||
if (!imageUrl || !imageUuid) {
|
||
throw new Error(`No image URL/UUID in Runware response: ${text.slice(0, 300)}`);
|
||
}
|
||
return { imageUrl, imageUuid };
|
||
}
|