. * 📖 No markdown dependency — keeps the dashboard zero-dep. Shared by every * 📖 playground so code looks identical everywhere. * @param {string} text * @returns {React.ReactNode} */ function renderAssistantText(text) { /* 📖 Empty or missing text renders nothing. */ if (!text) return null /* 📖 Split on fenced code blocks; the capturing group keeps each fenced segment in the resulting array alongside the plain-text segments. */ const parts = text.split(/(```[\s\S]*?```)/g) return parts.map((part, idx) => { /* 📖 A segment is treated as code only when it both starts and ends with a fence: group 1 is the optional language tag, group 2 is the fenced body. */ const codeMatch = part.match(/^```([a-zA-Z0-9_-]+)?\n?([\s\S]*?)```$/) if (codeMatch) { return (

          {codeMatch[2].replace(/\n$/, '')}

) } return {part} }) } /** Formats a number rounded to one decimal place as a string via toFixed(1) (e.g. 3.14 gives '3.1'). Returns the placeholder '—' whenever Number.isFinite(n) is false, i.e. for NaN, ±Infinity, and any value that is not of type number. * @param {number} n — value to format. * @returns {string} one-decimal string, or '—'. */ function round1(n) { return Number.isFinite(n) ? (Math.round(n * 10) / 10).toFixed(1) : '—' } /** * Shared playground chat core. See file header. * * @param {Object} props * @param {string} props.model — 'fcm' (auto-router) or 'providerKey/modelId' (direct). * @param {boolean} [props.disabled=false] — disable the input + send button (e.g. daemon down). * @param {'full'|'mini'} [props.variant='mini'] — density/size of the UI. * @param {boolean} [props.stream=true] — request SSE streaming vs. one-shot JSON. * @param {string} [props.placeholder] — input placeholder. * @param {string} [props.targetLabel] — override the "addressed model" label shown under the * user bubble. The RouterView passes its Primary pick here so the user sees which model the * priority-first router will try first. When omitted, the addressed model is derived from `model`. * @param {string[]} [props.suggestions] — clickable chips in the empty state. * @param {string} [props.emptyTitle] — empty-state title. * @param {string} [props.emptyHint] — empty-state hint line. * @param {React.ReactNode} [props.emptyIcon] — empty-state icon. * @param {React.ReactNode} [props.children] — optional extra node rendered above the transcript * (used by PlaygroundView to host its daemon-start panel / pre-prompt hint). * @param {(summary:{count:number,totalTokens:number,lastMeta?:object}) => void} [props.onTurnComplete] * — fired after every turn so hosts can update their own chrome (token counters, etc.). * @param {React.Ref} ref — imperative handle exposing { clear(), focus(), getMessages() }. */ const PlaygroundChat = forwardRef(function PlaygroundChat({ model, disabled = false, variant = 'mini', stream = true, placeholder, targetLabel, suggestions = [], emptyTitle, emptyHint, emptyIcon, children, onTurnComplete, }, ref) { // 📖 Each message: { id, role, content, target?, meta?, error?, aborted?, pending? 
} // 📖 meta = { provider, model, latencyMs, tokens, tps } const [messages, setMessages] = useState([]) const [input, setInput] = useState('') const [loading, setLoading] = useState(false) const [copiedIdx, setCopiedIdx] = useState(null) const abortRef = useRef(null) const inputRef = useRef(null) const transcriptRef = useRef(null) // 📖 Ref mirror of `messages` so the imperative handle (below) can read the // 📖 live transcript without being recreated on every message change. const messagesRef = useRef([]) useImperativeHandle(ref, () => ({ /** Stop any in-flight stream and clear the transcript. */ clear: () => { if (abortRef.current) { abortRef.current.abort(); abortRef.current = null } setLoading(false) setMessages([]) }, focus: () => inputRef.current?.focus(), // 📖 `getMessages` is a stable ref read, so the handle never has to be // 📖 recreated when messages change. getMessages: () => messagesRef.current, }), []) // 📖 Keep the ref mirror in sync with the state transcript. useEffect(() => { messagesRef.current = messages }, [messages]) // 📖 Notify the host after a turn SETTLES (token counters etc.). Gated on // 📖 the last message being finalized (meta / error / aborted) so it doesn't // 📖 fire on every streamed token — only once per completed exchange. useEffect(() => { if (typeof onTurnComplete !== 'function') return const last = messages[messages.length - 1] if (!last || last.pending) return // still streaming const settled = last.role === 'assistant' && (!!last.meta || last.error || last.aborted) if (!settled) return const totalTokens = messages.reduce((sum, m) => sum + (m.meta?.tokens || 0), 0) onTurnComplete({ count: messages.length, totalTokens, lastMeta: last.meta }) }, [messages, onTurnComplete]) // 📖 Auto-scroll the transcript to the bottom as content streams in. 
useEffect(() => { const el = transcriptRef.current if (el) el.scrollTop = el.scrollHeight }, [messages, loading]) const stop = useCallback(() => { if (abortRef.current) { abortRef.current.abort(); abortRef.current = null } setLoading(false) }, []) const sendMessage = useCallback(async (overrideText) => { const text = (typeof overrideText === 'string' ? overrideText : input).trim() if (!text || loading || disabled) return setInput('') // 📖 Build the addressed-model label for the USER bubble. const targetKey = targetLabel || (model === 'fcm' ? 'fcm' : model) const userMsg = { id: `u-${Date.now()}`, role: 'user', content: text, ts: Date.now(), target: targetKey } const assistantId = `a-${Date.now()}` const assistantMsg = { id: assistantId, role: 'assistant', content: '', pending: true } const transcript = [...messages, userMsg] setMessages([...transcript, assistantMsg]) setLoading(true) const controller = new AbortController() abortRef.current = controller const startedAt = Date.now() // 📖 Patch helpers: update the in-flight assistant bubble in place. const patchAssistant = (patch) => setMessages((prev) => prev.map((m) => ( m.id === assistantId ? { ...m, ...patch } : m ))) // 📖 Served-model resolution. The daemon (fcm route) forwards the real // 📖 served model through the `x-fcm-router-model` response header; for // 📖 direct routing there is no such header, so the served model is the // 📖 requested one. We resolve the header lazily once we have the resp. let servedKey = null const resolveServed = (resp) => { const headerKey = resp.headers.get('x-fcm-router-model') servedKey = headerKey || (model !== 'fcm' ? 
model : null) return parseModelKey(servedKey) || { provider: model, model: '' } } const body = { model: model || 'fcm', messages: transcript.map(({ role, content }) => ({ role, content })), stream, temperature: 0.7, } try { const resp = await fetch('/api/playground/chat', { method: 'POST', headers: { 'Content-Type': 'application/json' }, body: JSON.stringify(body), signal: controller.signal, }) if (!resp.ok) { const errBody = await resp.json().catch(() => null) const errMsg = extractErrorMessage(errBody) || `Request failed (${resp.status})` patchAssistant({ pending: false, error: errMsg }) return } if (stream) { // ── SSE streaming path ───────────────────────────────────────── const reader = resp.body?.getReader() if (!reader) throw new Error('No stream reader available') const decoder = new TextDecoder() let buffer = '' let acc = '' let served = resolveServed(resp) let tokens = 0 let servedKnown = !!servedKey while (true) { const { value, done } = await reader.read() if (done) break buffer += decoder.decode(value, { stream: true }) // 📖 Split on blank-line SSE boundaries; keep the trailing partial. const events = buffer.split(/\n\n/) buffer = events.pop() || '' for (const event of events) { const lines = event.split(/\n/) for (const line of lines) { if (!line.startsWith('data:')) continue const payload = line.slice(5).trim() if (payload === '[DONE]') continue try { const json = JSON.parse(payload) const delta = json?.choices?.[0]?.delta?.content if (typeof delta === 'string' && delta) { acc += delta patchAssistant({ content: acc, pending: false }) } // 📖 Tokens: the final chunk carries usage. Prefer completion // 📖 tokens (matches what was generated) over total. 
const usage = json?.usage if (usage) { if (typeof usage.completion_tokens === 'number') tokens = usage.completion_tokens else if (typeof usage.total_tokens === 'number') tokens = usage.total_tokens } // 📖 Some daemons/proxies also forward the served model in the // 📖 body — accept it as a fallback to the header. if (!servedKnown && json?.x_routed_via) { served = { provider: json.x_routed_via, model: json.x_routed_model || '' } servedKnown = true } } catch { // 📖 Ignore non-JSON keep-alive frames. } } } } const latencyMs = Date.now() - startedAt const tps = tokens > 0 && latencyMs > 0 ? tokens / (latencyMs / 1000) : null patchAssistant({ pending: false, meta: { provider: served.provider, model: served.model, latencyMs, tokens, tps, }, }) } else { // ── One-shot JSON path ───────────────────────────────────────── const json = await resp.json().catch(() => null) const content = json?.choices?.[0]?.message?.content || '' const usage = json?.usage || {} const tokens = typeof usage.completion_tokens === 'number' ? usage.completion_tokens : (usage.total_tokens || 0) const served = resolveServed(resp) const latencyMs = Date.now() - startedAt const tps = tokens > 0 && latencyMs > 0 ? tokens / (latencyMs / 1000) : null patchAssistant({ pending: false, content, meta: { provider: served.provider, model: served.model, latencyMs, tokens, tps, }, }) } } catch (err) { if (err?.name === 'AbortError') { patchAssistant({ pending: false, aborted: true }) } else { patchAssistant({ pending: false, error: err?.message || String(err) }) } } finally { setLoading(false) abortRef.current = null } }, [input, loading, disabled, messages, model, stream, targetLabel, onTurnComplete]) const handleKeyDown = useCallback((e) => { // 📖 Enter sends, Shift+Enter inserts a newline (full variant only). 
if (e.key === 'Enter' && !e.shiftKey && variant === 'full') { e.preventDefault() void sendMessage() } else if (e.key === 'Enter' && variant === 'mini') { e.preventDefault() void sendMessage() } }, [sendMessage, variant]) const copyMessage = useCallback(async (idx, content) => { try { await navigator.clipboard.writeText(content || '') setCopiedIdx(idx) setTimeout(() => setCopiedIdx(null), 1500) } catch {} }, []) // 📖 Tiny auto-grow for the textarea so 'full' expands with long prompts. const handleInputChange = useCallback((e) => { setInput(e.target.value) if (variant === 'full') { const el = e.target el.style.height = 'auto' el.style.height = `${Math.min(el.scrollHeight, 180)}px` } }, [variant]) const variantClass = variant === 'full' ? styles.full : styles.mini return (

{children}

{messages.length === 0 ? (

{emptyIcon &&

{emptyIcon}

} {emptyTitle &&

{emptyTitle}

} {emptyHint &&

{emptyHint}

} {suggestions.length > 0 && (

{suggestions.map((s) => ( ))}

)}

) : ( messages.map((m, idx) => (

{m.role} {m.role === 'assistant' && m.content && ( )}

{m.role === 'assistant' ? ( <> {m.content ? renderAssistantText(m.content) : null} {loading && idx === messages.length - 1 && m.pending && !m.aborted && ( )} {!m.content && m.pending && …} ) : ( m.content )}

{/* ── Metadata row under the USER bubble: addressed model ── */} {m.role === 'user' && m.target && (

{m.target}

)} {/* ── Metadata row under the ASSISTANT bubble: served model + ms + tok + t/s ── */} {m.role === 'assistant' && !m.pending && m.meta && (

{m.meta.provider && ( {m.meta.provider}{m.meta.model ? `/${m.meta.model}` : ''} )} {m.meta.latencyMs != null && ( {Math.round(m.meta.latencyMs)}ms )} {m.meta.tokens > 0 && ( {m.meta.tokens} tok )} {m.meta.tps != null && m.meta.tps > 0 && ( {round1(m.meta.tps)} t/s )}

)} {m.role === 'assistant' && m.error && (

{m.error}

)} {m.role === 'assistant' && m.aborted && !m.error && (

stopped

)}

)) )}