347ab297d5
自定义画风入口里加上传按钮:客户端把图缩到 512px webp(base64),传到新 路由 /api/parse-style-image,vision LLM 解析成英文 style prompt 回填 textarea; 图本身随 sessionStorage → /api/start → Session.styleReferenceImage 透传, painter.collectReferenceImages 把它置于 slot 0,整局每一幕都作为 reference 图锚定画风(brush / color / mood),比 priorScene 优先级更高。 Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com>
90 lines
2.4 KiB
TypeScript
90 lines
2.4 KiB
TypeScript
import type { ProviderConfig } from "@infiplot/types";
|
|
import { fetchWithRetry } from "./fetchWithRetry";
|
|
|
|
/**
 * Runs a vision request for an annotated screenshot and asks the model for a
 * JSON-object response.
 *
 * @param config - Provider settings, forwarded unchanged to `analyzeImageDataUrl`.
 * @param imageBase64 - Bare base64 image payload (no `data:` prefix); it is
 *   labelled as PNG here.
 * @param prompt - Instruction text sent alongside the image.
 * @returns Whatever string `analyzeImageDataUrl` resolves with.
 */
export async function interpretClick(
  config: ProviderConfig,
  imageBase64: string,
  prompt: string,
): Promise<string> {
  // The client-side Canvas annotator encodes as PNG, so the payload is tagged
  // with the PNG mime type before being handed to the generic vision helper.
  const pngDataUrl = "data:image/png;base64," + imageBase64;
  const requestOptions: { responseFormat: "json_object" } = {
    responseFormat: "json_object",
  };
  return analyzeImageDataUrl(config, pngDataUrl, prompt, requestOptions);
}
|
|
|
|
/**
 * General single-image vision call. Accepts a complete data URL (preserves
 * the source mime type, e.g. webp/jpeg) and lets the caller opt out of
 * `response_format: json_object` for free-form text responses.
 *
 * The request is a POST to `<config.baseUrl>/chat/completions` with a single
 * user message holding the prompt text and the image, `temperature: 0.2`,
 * and a Bearer `config.apiKey` header. It is sent through `fetchWithRetry`
 * with `retries: 0` and an abort signal that fires after 60 seconds.
 *
 * @param config - Provider settings; `baseUrl`, `model` and `apiKey` are read.
 * @param imageDataUrl - Full `data:` URL of the image to analyse.
 * @param prompt - Text instruction sent alongside the image.
 * @param opts - `responseFormat: "json_object"` adds
 *   `response_format: { type: "json_object" }` to the request body; any other
 *   value (or omission) leaves the field out.
 * @returns The `content` string of the first choice's message.
 * @throws Error when the HTTP status is not OK, when the body is not valid
 *   JSON, or when the first choice carries no string `content`. Errors raised
 *   by `fetchWithRetry` or by reading the body (including an abort on
 *   timeout) propagate unchanged.
 */
export async function analyzeImageDataUrl(
  config: ProviderConfig,
  imageDataUrl: string,
  prompt: string,
  opts: { responseFormat?: "json_object" | "text" } = {},
): Promise<string> {
  // Strip every trailing slash so the joined URL never contains "//chat".
  const url = `${config.baseUrl.replace(/\/+$/, "")}/chat/completions`;

  const body: Record<string, unknown> = {
    model: config.model,
    messages: [
      {
        role: "user",
        content: [
          { type: "text", text: prompt },
          { type: "image_url", image_url: { url: imageDataUrl } },
        ],
      },
    ],
    temperature: 0.2,
  };
  if (opts.responseFormat === "json_object") {
    body.response_format = { type: "json_object" };
  }

  const timeoutCtrl = new AbortController();
  const timeoutId = setTimeout(() => timeoutCtrl.abort(), 60_000);

  let res: Response;
  let text: string;
  try {
    res = await fetchWithRetry(url, {
      method: "POST",
      headers: {
        "Content-Type": "application/json",
        Authorization: `Bearer ${config.apiKey}`,
      },
      body: JSON.stringify(body),
      signal: timeoutCtrl.signal,
      retries: 0,
    });
    // Read the body while the abort timer is still armed: the timer must
    // bound the whole exchange, not just the arrival of response headers,
    // otherwise a stalled body stream would hang this call indefinitely.
    text = await res.text();
  } finally {
    clearTimeout(timeoutId);
  }

  if (!res.ok) {
    throw new Error(`Vision API error ${res.status}: ${text}`);
  }

  // Every level is optional (and the root may be `null`) because the payload
  // comes from an external service and has not been validated.
  let json: { choices?: { message?: { content?: unknown } }[] } | null;
  try {
    json = JSON.parse(text);
  } catch {
    throw new Error(`Vision API returned invalid JSON: ${text.slice(0, 500)}`);
  }

  // Guard against a null/non-object root, an empty choices array, or missing
  // message/content fields.
  const content = json?.choices?.[0]?.message?.content;
  if (typeof content !== "string") {
    throw new Error(
      `Vision API returned no content. Response: ${text.slice(0, 500)}`
    );
  }

  return content;
}
|