Files
infiplot-web/lib/engine/stream/index.ts
T
Zonghao Yuan 0e4c2ebef4 feat(engine): merge cloudflare-migration — paradigm D engine, BYOK proxy, story persistence (#95)
Squash-merge the cloudflare-migration branch (7 commits by Kai ki) into
staging with conflict resolution, feature integration, and bug fixes.

Engine:
- Paradigm D: single-stream Writer replacing dual-phase Plan/Beats
- Delete Architect agent; story bible generated via Writer <plan> tag
- Modular prompt architecture (segments/registry/builder)
- StreamRouter for tagged stream splitting (<plan>/<story>/<choices>)

Infrastructure:
- Cloudflare Workers deployment (wrangler.jsonc, OpenNext adapter)
- D1 database schema + Drizzle ORM (scaffolded, not yet active)
- R2 storage helpers (scaffolded, not yet active)
- Story persistence API routes + client-side persistence

BYOK (Bring Your Own Key):
- /api/llm/user-proxy with SSRF-protected LLM proxy (+ requireUser auth)
- CORS-aware fetch in ai-client: auto-detect CORS failure, fallback to
  server proxy transparently via OpenAI SDK custom fetch
- BYO config support added to classify-freeform and vision routes
- SettingsModal CORS privacy notice (keys never logged/stored)

SSE streaming:
- engineClient.ts: fetchSSE helper for progressive scene events
- startSession/requestScene accept optional emit callback
- Fix SSE error event field name (error → message) in scene/start routes

i18n integration:
- Wire buildLanguageDirective into paradigm D's prompt builder
- Update corsNotice i18n keys (zh-CN/en/ja) with CORS proxy privacy text
- Preserve Session.language + LanguageSwitcher from i18n commit

Co-authored-by: Kai ki <155355644+zbf1009@users.noreply.github.com>
Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
2026-06-18 18:05:38 +08:00

248 lines
8.7 KiB
TypeScript

import type {
BeatChoice,
WriterScenePlan,
StreamRouterHandlers,
StreamRouterResult,
} from "@infiplot/types";
import { parseJsonLoose } from "../jsonParser";
// ──────────────────────────────────────────────────────────────────────
// StreamRouter — tagged stream splitter for paradigm D.
//
// Consumes Writer's incremental textStream, recognizes <plan>/<story>/
// <choices> tag boundaries, and dispatches handlers at the right time:
// - </plan> closes → parse → onPlan (downstream media translators)
// - <story> incremental → onBeat (client progressive playback)
// - </story> closes → store raw prose → onStoryComplete
// - </choices> closes → parse → onChoices
//
// RELIABILITY RULE: the degrade path is designed BEFORE the main path.
// Any tag anomaly (missing / misordered / unclosed / timeout) → buffer
// everything, attempt best-effort slicing, or treat the whole output
// as raw prose. Returns degraded=true. Never throws.
// ──────────────────────────────────────────────────────────────────────
/** Name of a tagged section recognized in the Writer stream. */
type TagName =
  | "plan"
  | "story"
  | "choices";

/** Every recognized tag name, in the order they are probed when scanning. */
const TAG_NAMES: Array<TagName> = ["plan", "story", "choices"];
/** Build the opening marker for a section tag, e.g. `plan` → `<plan>`. */
function openTag(name: TagName): string {
  return "<" + name + ">";
}
/** Build the closing marker for a section tag, e.g. `plan` → `</plan>`. */
function closeTag(name: TagName): string {
  return "</" + name + ">";
}
/**
 * Parse `raw` with `parseJsonLoose`, converting a thrown parse error into
 * `undefined`.
 *
 * @param raw   Text to parse.
 * @param label Short name included in the warning logged on failure.
 * @returns The parsed value, or `undefined` when parsing threw.
 */
function tryParseJson<T>(raw: string, label: string): T | undefined {
  let parsed: T | undefined;
  try {
    parsed = parseJsonLoose<T>(raw);
  } catch (failure) {
    console.warn(`[StreamRouter] failed to parse ${label}:`, failure);
    parsed = undefined;
  }
  return parsed;
}
/**
 * Return the text between the first `<name>` and the first `</name>` that
 * follows it, or `undefined` when no such pair exists in `buffer`.
 *
 * The close tag is searched for starting after the opening tag, so a stray
 * close tag that appears earlier in the buffer does not hide a well-formed
 * pair that comes later.
 *
 * @param buffer Full text to search.
 * @param name   Tag whose content should be extracted.
 * @returns The content between the tags (possibly an empty string), or
 *          `undefined` if the opening tag is missing or never closed.
 */
function extractTagContent(buffer: string, name: TagName): string | undefined {
  const open = openTag(name);
  const start = buffer.indexOf(open);
  if (start === -1) return undefined;

  const contentStart = start + open.length;
  const end = buffer.indexOf(closeTag(name), contentStart);
  if (end === -1) return undefined;

  return buffer.slice(contentStart, end);
}
/**
 * Route a Writer tagged stream to handlers. Pure logic — no LLM calls.
 *
 * Uses a cursor-based state machine over a growing `fullBuffer`: after each
 * chunk, scan from `cursor` for tag boundaries. When no boundary is found the
 * cursor is left far enough back that a tag split across two chunks is
 * re-scanned once the rest of it arrives.
 *
 * Dispatch on the main path:
 * - `</plan>` found    → content is JSON-parsed → `onPlan`
 * - inside `<story>`   → newly arrived prose → `onBeat` (the last few chars
 *                        are held back in case they start `</story>`)
 * - `</story>` found   → verbatim prose → `onStoryComplete`
 * - `</choices>` found → content is JSON-parsed → `onChoices`
 *
 * Degrade path: if the plan was never dispatched, the story never completed,
 * or the timeout fired, `degraded` is set and the whole buffer is re-sliced
 * on a best-effort basis. Handler exceptions and stream errors are caught and
 * logged rather than propagated.
 *
 * @param textStream Incremental text chunks produced by the Writer.
 * @param handlers   Optional callbacks invoked as sections are recognized.
 * @param opts       `timeoutMs` bounds the total time spent consuming the
 *                   stream (defaults to 120 000 ms).
 * @returns The collected plan / choices / raw story prose plus the `degraded`
 *          flag. `beats` is left empty by this function.
 */
export async function routeTaggedStream(
  textStream: AsyncIterable<string>,
  handlers: StreamRouterHandlers,
  opts?: { timeoutMs?: number },
): Promise<StreamRouterResult> {
  const result: StreamRouterResult = {
    plan: undefined,
    beats: [],
    choices: undefined,
    rawStorySegment: undefined,
    degraded: false,
  };

  let fullBuffer = "";
  let cursor = 0;
  let currentTag: TagName | null = null;
  let tagContentStart = 0;
  let lastBeatEmitCursor = 0;
  let planDispatched = false;
  let storyCompleted = false;

  const timeoutMs = opts?.timeoutMs ?? 120_000;
  let timedOut = false;

  // Loop-invariant lengths, computed once instead of on every scan pass.
  const maxOpenLen = Math.max(...TAG_NAMES.map((n) => openTag(n).length));
  const maxCloseLen = Math.max(...TAG_NAMES.map((n) => closeTag(n).length));
  const storyCloseLen = closeTag("story").length;

  // Invoke a handler so that a throwing handler can never abort routing,
  // while still leaving a trace of the failure in the logs.
  function safeDispatch(label: string, dispatch: () => unknown): void {
    try {
      dispatch();
    } catch (err) {
      console.warn(`[StreamRouter] ${label} handler threw:`, err);
    }
  }

  function scan(): void {
    while (cursor < fullBuffer.length) {
      if (currentTag === null) {
        // Outside any tag — find whichever open tag appears first.
        let earliestIdx = Infinity;
        let earliestTag: TagName | null = null;
        for (const name of TAG_NAMES) {
          const idx = fullBuffer.indexOf(openTag(name), cursor);
          if (idx !== -1 && idx < earliestIdx) {
            earliestIdx = idx;
            earliestTag = name;
          }
        }
        if (earliestTag === null) {
          // No complete open tag found. Keep the cursor far enough back that
          // a split like "<pl" + "an>" is re-scanned when the next chunk
          // appends.
          cursor = Math.max(cursor, fullBuffer.length - maxOpenLen + 1);
          break;
        }
        currentTag = earliestTag;
        tagContentStart = earliestIdx + openTag(earliestTag).length;
        lastBeatEmitCursor = tagContentStart;
        cursor = tagContentStart;
        continue;
      }

      // Inside a tag — look for the close tag.
      const close = closeTag(currentTag);
      const closeIdx = fullBuffer.indexOf(close, cursor);
      if (closeIdx !== -1) {
        // Tag closed — extract and finalize.
        const content = fullBuffer.slice(tagContentStart, closeIdx);
        if (currentTag === "plan") {
          const parsed = tryParseJson<WriterScenePlan>(content, "plan");
          if (parsed) {
            result.plan = parsed;
            planDispatched = true;
            safeDispatch("onPlan", () => handlers.onPlan?.(parsed));
          } else {
            result.degraded = true;
          }
        } else if (currentTag === "story") {
          // Emit any remaining un-emitted prose text before finalizing.
          if (lastBeatEmitCursor < closeIdx) {
            const remaining = fullBuffer.slice(lastBeatEmitCursor, closeIdx);
            if (remaining.length) {
              safeDispatch("onBeat", () => handlers.onBeat?.(remaining));
            }
          }
          // The <story> segment is raw prose — NOT JSON. Store it verbatim;
          // the director feeds it to proseSplitter to produce Beat[].
          result.rawStorySegment = content;
          if (content.trim().length > 0) {
            storyCompleted = true;
            safeDispatch("onStoryComplete", () =>
              handlers.onStoryComplete?.(content),
            );
          } else {
            result.degraded = true;
          }
        } else if (currentTag === "choices") {
          const parsed = tryParseJson<BeatChoice[]>(content, "choices");
          if (parsed && Array.isArray(parsed)) {
            result.choices = parsed;
            safeDispatch("onChoices", () => handlers.onChoices?.(parsed));
          }
        }
        cursor = closeIdx + close.length;
        currentTag = null;
        continue;
      }

      // Close tag not yet in buffer — emit incremental prose if applicable.
      if (currentTag === "story" && lastBeatEmitCursor < fullBuffer.length) {
        const newText = fullBuffer.slice(lastBeatEmitCursor);
        // Hold back the trailing chars that could be the start of a
        // "</story>" still being streamed, so markup is never emitted as prose.
        const safeLen = Math.max(0, newText.length - storyCloseLen);
        if (safeLen > 0) {
          const safe = newText.slice(0, safeLen);
          safeDispatch("onBeat", () => handlers.onBeat?.(safe));
          lastBeatEmitCursor += safeLen;
        }
      }

      // Close tag not found — keep the cursor far enough back that a split
      // like "</pla" + "n>" can complete on the next chunk append.
      cursor = Math.max(cursor, fullBuffer.length - maxCloseLen + 1);
      break;
    }
  }

  const consume = async (): Promise<void> => {
    for await (const chunk of textStream) {
      // Once the timeout has fired the caller already has its result; stop
      // here so late chunks cannot fire handlers or mutate `result`.
      if (timedOut) break;
      fullBuffer += chunk;
      scan();
    }
    // Final scan over whatever is buffered once the stream has ended.
    if (!timedOut) scan();
  };

  let timer: ReturnType<typeof setTimeout> | undefined;
  const timeout = new Promise<never>((_resolve, reject) => {
    timer = setTimeout(() => {
      timedOut = true;
      reject(new Error("StreamRouter timeout"));
    }, timeoutMs);
  });

  try {
    await Promise.race([consume(), timeout]);
  } catch (err) {
    // Timeout or stream error — fall through to the degrade path. The timeout
    // case is reported below, so only stream failures are logged here.
    if (!timedOut) {
      console.warn("[StreamRouter] stream failed, degraded extraction attempted:", err);
    }
  } finally {
    // Always release the timer so a finished call leaves nothing pending.
    clearTimeout(timer);
  }

  // ── Degrade path ──────────────────────────────────────────────────
  if (!planDispatched || !storyCompleted || timedOut) {
    result.degraded = true;

    if (!planDispatched) {
      const planContent = extractTagContent(fullBuffer, "plan");
      if (planContent) {
        const parsed = tryParseJson<WriterScenePlan>(planContent, "plan:degraded");
        if (parsed) {
          result.plan = parsed;
          safeDispatch("onPlan", () => handlers.onPlan?.(parsed));
        }
      }
    }

    if (!storyCompleted) {
      // Best-effort, in order of preference:
      //   1. a complete <story>…</story> pair,
      //   2. everything after an opened-but-unclosed <story>,
      //   3. no story tag at all → the whole buffer as prose
      //      (the splitter degrades further if empty).
      const storyContent =
        extractTagContent(fullBuffer, "story") ??
        sliceUnclosedStory(fullBuffer) ??
        fullBuffer.trim();
      result.rawStorySegment = storyContent;
      if (storyContent.trim().length > 0) {
        safeDispatch("onStoryComplete", () =>
          handlers.onStoryComplete?.(storyContent),
        );
      }
    }

    if (!result.choices) {
      // NOTE(review): only `result.choices` is filled in here; `onChoices` is
      // not invoked on the degrade path — confirm this is intended.
      const choicesContent = extractTagContent(fullBuffer, "choices");
      if (choicesContent) {
        const parsed = tryParseJson<BeatChoice[]>(choicesContent, "choices:degraded");
        if (parsed && Array.isArray(parsed)) result.choices = parsed;
      }
    }

    if (timedOut) {
      console.warn(`[StreamRouter] timed out after ${timeoutMs}ms, degraded extraction attempted`);
    }
  }

  return result;
}

/**
 * Recover prose from a `<story>` section that was opened but has no usable
 * close tag (e.g. the stream was cut off mid-story).
 *
 * Returns the text after the first `<story>` marker, stopping at a following
 * `<choices>` marker if one is present so choice markup is not mixed into the
 * prose. Returns `undefined` when the buffer contains no `<story>` marker.
 */
function sliceUnclosedStory(buffer: string): string | undefined {
  const open = openTag("story");
  const openIdx = buffer.indexOf(open);
  if (openIdx === -1) return undefined;

  const proseStart = openIdx + open.length;
  const choicesIdx = buffer.indexOf(openTag("choices"), proseStart);
  return choicesIdx === -1
    ? buffer.slice(proseStart)
    : buffer.slice(proseStart, choicesIdx);
}