feat(engine): merge cloudflare-migration — paradigm D engine, BYOK proxy, story persistence (#95)

Squash-merge the cloudflare-migration branch (7 commits by Kai ki) into staging with conflict resolution, feature integration, and bug fixes.

Engine:
- Paradigm D: single-stream Writer replacing dual-phase Plan/Beats
- Delete Architect agent; story bible generated via Writer <plan> tag
- Modular prompt architecture (segments/registry/builder)
- StreamRouter for tagged stream splitting (<plan>/<story>/<choices>)

Infrastructure:
- Cloudflare Workers deployment (wrangler.jsonc, OpenNext adapter)
- D1 database schema + Drizzle ORM (scaffolded, not yet active)
- R2 storage helpers (scaffolded, not yet active)
- Story persistence API routes + client-side persistence

BYOK (Bring Your Own Key):
- /api/llm/user-proxy with SSRF-protected LLM proxy (+ requireUser auth)
- CORS-aware fetch in ai-client: auto-detect CORS failure, fallback to server proxy transparently via OpenAI SDK custom fetch
- BYO config support added to classify-freeform and vision routes
- SettingsModal CORS privacy notice (keys never logged/stored)

SSE streaming:
- engineClient.ts: fetchSSE helper for progressive scene events
- startSession/requestScene accept optional emit callback
- Fix SSE error event field name (error → message) in scene/start routes

i18n integration:
- Wire buildLanguageDirective into paradigm D's prompt builder
- Update corsNotice i18n keys (zh-CN/en/ja) with CORS proxy privacy text
- Preserve Session.language + LanguageSwitcher from i18n commit

Co-authored-by: Kai ki <155355644+zbf1009@users.noreply.github.com>
Co-authored-by: Claude Opus 4.6 <noreply@anthropic.com>
2026-06-18 18:05:38 +08:00
parent 05bd7e229c
commit 0e4c2ebef4
78 changed files with 7396 additions and 919 deletions
@@ -0,0 +1,247 @@
+import type {
+  BeatChoice,
+  WriterScenePlan,
+  StreamRouterHandlers,
+  StreamRouterResult,
+} from "@infiplot/types";
+import { parseJsonLoose } from "../jsonParser";
+
+// ──────────────────────────────────────────────────────────────────────
+//  StreamRouter — tagged stream splitter for paradigm D.
+//
+//  Consumes Writer's incremental textStream, recognizes <plan>/<story>/
+//  <choices> tag boundaries, and dispatches handlers at the right time:
+//    - </plan>  closes → parse → onPlan (downstream media translators)
+//    - <story>  incremental → onBeat (client progressive playback)
+//    - </story> closes → store raw prose → onStoryComplete
+//    - </choices> closes → parse → onChoices
+//
+//  RELIABILITY RULE: the degrade path is designed BEFORE the main path.
+//  Any tag anomaly (missing / misordered / unclosed / timeout) → buffer
+//  everything, attempt best-effort slicing, or treat the whole output
+//  as raw prose. Returns degraded=true. Never throws.
+// ──────────────────────────────────────────────────────────────────────
+
+type TagName = "plan" | "story" | "choices"; // the three tagged segments this router recognizes
+
+const TAG_NAMES: TagName[] = ["plan", "story", "choices"]; // iterated when searching for the next open tag and when sizing the partial-tag hold-back
+
+/** Build the opening marker for a segment, e.g. "plan" → "<plan>". */
+function openTag(name: TagName): string {
+  return "<" + name + ">";
+}
+/** Build the closing marker for a segment, e.g. "plan" → "</plan>". */
+function closeTag(name: TagName): string {
+  return "</" + name + ">";
+}
+
+/**
+ * Parse `raw` with the lenient JSON parser, turning a parse failure into
+ * `undefined` instead of an exception.
+ *
+ * @param raw - Text expected to contain JSON.
+ * @param label - Segment name used only in the warning message.
+ * @returns The parsed value, or `undefined` when parsing threw.
+ */
+function tryParseJson<T>(raw: string, label: string): T | undefined {
+  let value: T | undefined;
+  try {
+    value = parseJsonLoose<T>(raw);
+  } catch (cause) {
+    // Parsing is best-effort: report the failure and let the caller degrade.
+    console.warn(`[StreamRouter] failed to parse ${label}:`, cause);
+    value = undefined;
+  }
+  return value;
+}
+
+/**
+ * Return the text between the first `<name>` and the first `</name>` that
+ * follows it, or `undefined` when either marker is missing.
+ *
+ * The close tag is searched for only AFTER the open tag, so a stray close
+ * tag earlier in the buffer (misordered output) does not hide a valid
+ * open/close pair that appears later.
+ *
+ * @param buffer - Full accumulated Writer output.
+ * @param name - Segment to extract.
+ * @returns The raw segment content (possibly empty), or `undefined`.
+ */
+function extractTagContent(buffer: string, name: TagName): string | undefined {
+  const open = openTag(name);
+  const start = buffer.indexOf(open);
+  if (start === -1) return undefined;
+
+  const contentStart = start + open.length;
+  const end = buffer.indexOf(closeTag(name), contentStart);
+  if (end === -1) return undefined;
+
+  return buffer.slice(contentStart, end);
+}
+
+/**
+ * Route a Writer tagged stream to handlers. Pure logic — no LLM calls.
+ *
+ * Uses a cursor-based state machine over a growing fullBuffer: after each
+ * chunk, scan from `cursor` for tag boundaries. This naturally handles
+ * tags that split across chunk boundaries without double-buffering bugs.
+ *
+ * Reliability contract:
+ *  - Never rejects. A stream error or a timeout marks the result as
+ *    degraded and triggers best-effort extraction from what was buffered.
+ *  - Exceptions thrown by handlers are caught and logged, so a faulty
+ *    consumer cannot break routing.
+ *  - Once the timeout fires, no further chunks are scanned and no further
+ *    handlers fire from the streaming path; the timer is always cleared.
+ *  - Choices recovered in the degrade path are only placed on the result;
+ *    `onChoices` is not invoked there.
+ *
+ * @param textStream - Incremental Writer output.
+ * @param handlers - Optional callbacks (onPlan / onBeat / onStoryComplete / onChoices).
+ * @param opts - `timeoutMs` bounds total routing time; defaults to 120 000 ms.
+ * @returns Parsed plan, raw story prose and choices, plus the `degraded` flag.
+ */
+export async function routeTaggedStream(
+  textStream: AsyncIterable<string>,
+  handlers: StreamRouterHandlers,
+  opts?: { timeoutMs?: number },
+): Promise<StreamRouterResult> {
+  const result: StreamRouterResult = {
+    plan: undefined,
+    beats: [],
+    choices: undefined,
+    rawStorySegment: undefined,
+    degraded: false,
+  };
+
+  let fullBuffer = "";
+  let cursor = 0;
+  let currentTag: TagName | null = null;
+  let tagContentStart = 0;
+  let lastBeatEmitCursor = 0;
+  let planDispatched = false;
+  let storyCompleted = false;
+
+  const timeoutMs = opts?.timeoutMs ?? 120_000;
+  let timedOut = false;
+  let streamFailed = false;
+  let timer: ReturnType<typeof setTimeout> | undefined;
+
+  // Loop-invariant hold-back sizes: the longest open / close marker decides
+  // how many trailing characters must be re-scanned on the next chunk.
+  const maxOpenLen = Math.max(...TAG_NAMES.map((n) => openTag(n).length));
+  const maxCloseLen = Math.max(...TAG_NAMES.map((n) => closeTag(n).length));
+  const storyClose = closeTag("story");
+
+  // Invoke a handler without letting its exception escape; log instead of
+  // swallowing silently so consumer bugs stay visible.
+  function notify(label: string, call: () => unknown): void {
+    try {
+      call();
+    } catch (err) {
+      console.warn(`[StreamRouter] ${label} handler threw:`, err);
+    }
+  }
+
+  function scan(): void {
+    while (cursor < fullBuffer.length) {
+      if (currentTag === null) {
+        let earliestIdx = Infinity;
+        let earliestTag: TagName | null = null;
+
+        for (const name of TAG_NAMES) {
+          const idx = fullBuffer.indexOf(openTag(name), cursor);
+          if (idx !== -1 && idx < earliestIdx) {
+            earliestIdx = idx;
+            earliestTag = name;
+          }
+        }
+
+        if (earliestTag === null) {
+          // No complete open tag found. Back up cursor by the max possible
+          // partial tag length so a split like "<pl" + "an>" is re-scanned
+          // when the next chunk appends.
+          cursor = Math.max(cursor, fullBuffer.length - maxOpenLen + 1);
+          break;
+        }
+
+        currentTag = earliestTag;
+        tagContentStart = earliestIdx + openTag(earliestTag).length;
+        lastBeatEmitCursor = tagContentStart;
+        cursor = tagContentStart;
+        continue;
+      }
+
+      // Inside a tag — look for the close tag.
+      const close = closeTag(currentTag);
+      const closeIdx = fullBuffer.indexOf(close, cursor);
+
+      if (closeIdx !== -1) {
+        // Tag closed — extract and finalize.
+        const content = fullBuffer.slice(tagContentStart, closeIdx);
+
+        if (currentTag === "plan") {
+          const parsed = tryParseJson<WriterScenePlan>(content, "plan");
+          if (parsed) {
+            result.plan = parsed;
+            planDispatched = true;
+            notify("onPlan", () => handlers.onPlan?.(parsed));
+          } else {
+            result.degraded = true;
+          }
+        } else if (currentTag === "story") {
+          // Emit any remaining un-emitted prose text before finalizing.
+          if (lastBeatEmitCursor < closeIdx) {
+            const remaining = fullBuffer.slice(lastBeatEmitCursor, closeIdx);
+            if (remaining.length) {
+              notify("onBeat", () => handlers.onBeat?.(remaining));
+            }
+          }
+          // The <story> segment is raw prose — NOT JSON. Store it verbatim;
+          // the director feeds it to proseSplitter to produce Beat[].
+          result.rawStorySegment = content;
+          if (content.trim().length > 0) {
+            storyCompleted = true;
+            notify("onStoryComplete", () => handlers.onStoryComplete?.(content));
+          } else {
+            result.degraded = true;
+          }
+        } else if (currentTag === "choices") {
+          const parsed = tryParseJson<BeatChoice[]>(content, "choices");
+          if (parsed && Array.isArray(parsed)) {
+            result.choices = parsed;
+            notify("onChoices", () => handlers.onChoices?.(parsed));
+          }
+        }
+
+        cursor = closeIdx + close.length;
+        currentTag = null;
+        continue;
+      }
+
+      // Close tag not yet in buffer — emit incremental prose if applicable.
+      if (currentTag === "story" && lastBeatEmitCursor < fullBuffer.length) {
+        const newText = fullBuffer.slice(lastBeatEmitCursor);
+        // Don't emit partial close-tag lookalikes: hold back the last few
+        // chars that could be a partial "</story>" (max 8 chars).
+        const safeLen = Math.max(0, newText.length - storyClose.length);
+        if (safeLen > 0) {
+          const safe = newText.slice(0, safeLen);
+          notify("onBeat", () => handlers.onBeat?.(safe));
+          lastBeatEmitCursor += safeLen;
+        }
+      }
+
+      // Close tag not found — back up cursor by the max close-tag length
+      // (split like "</pla" + "n>" can complete on next chunk append).
+      cursor = Math.max(cursor, fullBuffer.length - maxCloseLen + 1);
+      break;
+    }
+  }
+
+  // Degrade helper: when the stream ended (or timed out) while the scanner
+  // was still inside <story>, recover the prose written so far instead of
+  // treating the whole buffer (including <plan> JSON) as prose. Flushes the
+  // held-back tail through onBeat so progressive consumers see it too.
+  function salvageUnclosedStory(): string | undefined {
+    if (currentTag !== "story") return undefined;
+
+    let end = fullBuffer.length;
+    const nextChoices = fullBuffer.indexOf(openTag("choices"), tagContentStart);
+    if (nextChoices !== -1) {
+      // The model skipped </story>; stop the prose where <choices> begins.
+      end = nextChoices;
+    } else {
+      // Drop a dangling partial close tag such as "</sto" left by truncation.
+      for (let k = storyClose.length - 1; k >= 2; k--) {
+        if (fullBuffer.endsWith(storyClose.slice(0, k))) {
+          end = fullBuffer.length - k;
+          break;
+        }
+      }
+    }
+
+    if (lastBeatEmitCursor < end) {
+      const tail = fullBuffer.slice(lastBeatEmitCursor, end);
+      notify("onBeat", () => handlers.onBeat?.(tail));
+      lastBeatEmitCursor = end;
+    }
+    return fullBuffer.slice(tagContentStart, end);
+  }
+
+  const consume = async (): Promise<void> => {
+    for await (const chunk of textStream) {
+      // After a timeout the caller already has its result: stop scanning so
+      // no handler fires late. Breaking also lets the iterator clean up.
+      if (timedOut) break;
+      fullBuffer += chunk;
+      scan();
+    }
+    // Final scan — flush any remaining buffer (handles close tags that
+    // arrived in the last chunk without a subsequent iteration).
+    if (!timedOut) scan();
+  };
+
+  try {
+    await Promise.race([
+      consume(),
+      new Promise<void>((_, reject) => {
+        timer = setTimeout(() => {
+          timedOut = true;
+          reject(new Error("StreamRouter timeout"));
+        }, timeoutMs);
+      }),
+    ]);
+  } catch (err) {
+    // Timeout or stream error — fall through to degrade path.
+    if (!timedOut) {
+      streamFailed = true;
+      console.warn("[StreamRouter] stream error, degraded extraction attempted:", err);
+    }
+  } finally {
+    // Always release the timer so it cannot outlive this call.
+    clearTimeout(timer);
+  }
+
+  // ── Degrade path ──────────────────────────────────────────────────
+  if (!planDispatched || !storyCompleted || timedOut || streamFailed) {
+    result.degraded = true;
+
+    if (!planDispatched) {
+      const planContent = extractTagContent(fullBuffer, "plan");
+      if (planContent) {
+        const parsed = tryParseJson<WriterScenePlan>(planContent, "plan:degraded");
+        if (parsed) {
+          result.plan = parsed;
+          notify("onPlan", () => handlers.onPlan?.(parsed));
+        }
+      }
+    }
+
+    if (!storyCompleted) {
+      // Best-effort, in order: a closed <story> pair; the prose of an
+      // unclosed <story>; finally the whole buffer as prose when no story
+      // tag exists at all (the splitter degrades further if empty).
+      const storyContent =
+        extractTagContent(fullBuffer, "story") ??
+        salvageUnclosedStory() ??
+        fullBuffer.trim();
+      result.rawStorySegment = storyContent;
+      if (storyContent.trim().length > 0) {
+        notify("onStoryComplete", () => handlers.onStoryComplete?.(storyContent));
+      }
+    }
+
+    if (!result.choices) {
+      const choicesContent = extractTagContent(fullBuffer, "choices");
+      if (choicesContent) {
+        const parsed = tryParseJson<BeatChoice[]>(choicesContent, "choices:degraded");
+        if (parsed && Array.isArray(parsed)) result.choices = parsed;
+      }
+    }
+
+    if (timedOut) {
+      console.warn(`[StreamRouter] timed out after ${timeoutMs}ms, degraded extraction attempted`);
+    }
+  }
+
+  return result;
+}
@@ -0,0 +1,160 @@
+import type {
+  WriterScenePlan,
+} from "@infiplot/types";
+import type { WriterBeatsOutput } from "../agents/writer";
+import {
+  coerceBeatsFromRaw,
+  coerceStoryStatePatch,
+  normalizeSpeakerName,
+  synthesizeFallbackBeats,
+} from "../agents/writer";
+import { parseJsonLoose } from "../jsonParser";
+
+// ──────────────────────────────────────────────────────────────────────
+//  proseSplitter — rule-based prose → Beat[] splitter.
+//
+//  The Writer now outputs continuous prose in the <story> segment instead
+//  of JSON beats. This module splits prose into RawBeat[] using lightweight
+//  markers (blank-line delimited paragraphs, <i> for inner monologue,
+//  Speaker：「quote」 for NPC dialogue), then feeds the result through the
+//  existing coerceBeatsFromRaw pipeline to get fully validated Beat[].
+//
+//  Zero extra LLM calls. Multiple degradation layers — never throws.
+// ──────────────────────────────────────────────────────────────────────
+
+type RawBeat = { // loosely-typed beat produced by classifyBlock before coerceBeatsFromRaw validates it
+  narration?: string; // set for blocks that are neither inner monologue nor dialogue
+  speaker?: string; // "你" for inner monologue, otherwise the normalized dialogue speaker name
+  line?: string; // the thought or spoken text, trimmed
+  lineDelivery?: string; // speakingTone of the matching plan.characterIntents entry, when one exists
+};
+
+// Match inner-monologue blocks: the whole block is one <i>...</i> pair (body may span lines); capture 1 is the inner text.
+const INNER_RE = /^\s*<i>([\s\S]+?)<\/i>\s*$/;
+
+// Match NPC dialogue: Speaker：「dialogue」 or Speaker:「dialogue」 (full-width or ASCII colon); capture 1 = speaker, capture 2 = quoted text.
+// Supports 「」『』"" quotes; opener and closer are separate character classes, so mismatched pairs also match. Speaker name is 1-20 non-whitespace chars.
+const DIALOGUE_RE =
+  /^\s*(\S{1,20})\s*[：:]\s*(?:[「『"]([\s\S]+?)[」』"])\s*$/;
+
+// Match the first <memory>{...}</memory> block anywhere in the story segment (no g flag, so only one occurrence); capture 1 is the raw payload.
+const MEMORY_RE = /<memory>([\s\S]+?)<\/memory>/;
+
+/**
+ * Pull the first <memory> block out of the story prose.
+ *
+ * The block is removed from the prose whether or not its payload parses;
+ * a payload that fails to parse or coerce only costs the patch.
+ *
+ * @param rawStory - Story segment as produced by the Writer.
+ * @returns `patch` (coerced payload, or `undefined` when absent or invalid)
+ *          and `cleanedProse` (the prose without the block; trimmed only
+ *          when a block was actually found).
+ */
+function extractMemoryBlock(rawStory: string): {
+  patch: ReturnType<typeof coerceStoryStatePatch>;
+  cleanedProse: string;
+} {
+  const found = MEMORY_RE.exec(rawStory);
+  if (found === null) {
+    return { patch: undefined, cleanedProse: rawStory };
+  }
+
+  const payload = found[1]!;
+  const proseWithoutMemory = rawStory.replace(MEMORY_RE, "").trim();
+
+  let patch: ReturnType<typeof coerceStoryStatePatch>;
+  try {
+    const decoded = parseJsonLoose<Record<string, unknown>>(payload);
+    patch = coerceStoryStatePatch(
+      decoded as Parameters<typeof coerceStoryStatePatch>[0],
+    );
+  } catch {
+    console.warn("[proseSplitter] failed to parse <memory> block, skipping");
+    patch = undefined;
+  }
+
+  return { patch, cleanedProse: proseWithoutMemory };
+}
+
+/**
+ * Turn one prose paragraph into a RawBeat.
+ *
+ * Checked in order: inner monologue (<i>…</i>), then NPC dialogue
+ * (Speaker：「quote」); anything else becomes plain narration.
+ *
+ * @param block - A single paragraph of story prose.
+ * @param plan - Scene plan; its characterIntents supply the line delivery.
+ * @returns The classified beat.
+ */
+function classifyBlock(
+  block: string,
+  plan: WriterScenePlan,
+): RawBeat {
+  const text = block.trim();
+
+  // Inner monologue is attributed to the player ("你").
+  const monologue = text.match(INNER_RE);
+  if (monologue !== null) {
+    return { speaker: "你", line: monologue[1]!.trim() };
+  }
+
+  const spoken = text.match(DIALOGUE_RE);
+  if (spoken === null) {
+    // Neither marker matched: plain narration.
+    return { narration: text };
+  }
+
+  const speaker = normalizeSpeakerName(spoken[1]!.trim());
+  const line = spoken[2]!.trim();
+  // Borrow the speaking tone planned for this character, if there is one.
+  const tone = plan.characterIntents?.find(
+    (entry) => entry.name === speaker,
+  )?.speakingTone;
+
+  return { speaker, line, lineDelivery: tone || undefined };
+}
+
+/**
+ * Convert the Writer's continuous prose into validated beats without any
+ * extra LLM call. Any unexpected failure falls back to synthesized beats,
+ * so this function never throws.
+ *
+ * @param rawStory - The raw prose from the <story> segment.
+ * @param plan - The parsed WriterScenePlan (from <plan> segment).
+ * @returns WriterBeatsOutput with Beat[] + optional StoryStatePatch.
+ */
+export function splitProseToBeats(
+  rawStory: string,
+  plan: WriterScenePlan,
+): WriterBeatsOutput {
+  try {
+    // Step 1 — peel off the <memory> block (story-state patch).
+    const memory = extractMemoryBlock(rawStory);
+
+    // Step 2 — paragraphs are separated by blank lines; drop empty ones.
+    const paragraphs: string[] = [];
+    for (const piece of memory.cleanedProse.split(/\n\s*\n/)) {
+      const text = piece.trim();
+      if (text.length > 0) paragraphs.push(text);
+    }
+
+    if (paragraphs.length === 0) {
+      console.warn("[proseSplitter] empty prose after cleanup, using fallback");
+      return {
+        beats: synthesizeFallbackBeats(plan),
+        storyStatePatch: memory.patch,
+      };
+    }
+
+    // Step 3 — classify each paragraph; a failing classifier degrades that
+    // paragraph to narration instead of aborting the whole scene.
+    const rawBeats: RawBeat[] = [];
+    for (const paragraph of paragraphs) {
+      let beat: RawBeat;
+      try {
+        beat = classifyBlock(paragraph, plan);
+      } catch {
+        beat = { narration: paragraph };
+      }
+      rawBeats.push(beat);
+    }
+
+    // Step 4 — reuse the existing coerce pipeline (id assignment, POV
+    // normalization, entry alignment, exit guarantee, uniqueness).
+    const { beats, storyStatePatch } = coerceBeatsFromRaw(rawBeats, plan);
+    return {
+      beats,
+      storyStatePatch: memory.patch ?? storyStatePatch,
+    };
+  } catch (err) {
+    console.error("[proseSplitter] unexpected error, using fallback:", err);
+    return {
+      beats: synthesizeFallbackBeats(plan),
+      storyStatePatch: undefined,
+    };
+  }
+}