Component · May 28, 2026

AI message panel

A product-shaped AI response panel with streaming text, stop and regenerate controls, live status, and expandable citation chips.

ai
streaming
accessibility
interaction

AI message panel

Launch readiness

Generating

Summarize the dashboard accessibility risks before launch.

0 / 91 tokens

component.tsx

'use client'

import { useEffect, useMemo, useRef, useState, useSyncExternalStore } from 'react'

type StreamStatus = 'streaming' | 'stopped' | 'done'

interface Citation {
  id: string
  marker: string
  title: string
  source: string
  quote: string
}

const USER_PROMPT = 'Summarize the dashboard accessibility risks before launch.'

const ASSISTANT_RESPONSE =
  'The launch risk is concentrated in three places: virtualized rows need a stable focus model, chart summaries need text equivalents, and automated locale formatting needs RTL review before it reaches production. I would ship once keyboard navigation, polite announcements, and citation traceability pass review. [1] [2]'

const RESPONSE_TOKENS = ASSISTANT_RESPONSE.split(/(?<=\s)|(?=\s)/).filter(Boolean)

const CITATIONS = [
  {
    id: 'grid-focus',
    marker: '1',
    title: 'Grid focus model',
    source: 'Dashboard accessibility review',
    quote: 'A virtualized grid must keep active row state stable even when offscreen rows unmount.',
  },
  {
    id: 'locale-rtl',
    marker: '2',
    title: 'Locale QA note',
    source: 'International launch checklist',
    quote:
      'RTL QA should validate direction, punctuation, numeric formatting, and focus order together.',
  },
] as const satisfies readonly Citation[]

type CitationId = (typeof CITATIONS)[number]['id']
const REDUCED_MOTION_QUERY = '(prefers-reduced-motion: reduce)'

function tokenDelay(token: string, reducedMotion: boolean): number {
  if (reducedMotion) return 12

  const base = 26 + Math.random() * 34
  const pause = /[.!?]$/.test(token.trim()) ? 180 : 0
  return base + pause
}

function subscribeToMotionPreference(onStoreChange: () => void): () => void {
  const media = window.matchMedia(REDUCED_MOTION_QUERY)
  media.addEventListener('change', onStoreChange)
  return () => media.removeEventListener('change', onStoreChange)
}

function getMotionPreference(): boolean {
  return window.matchMedia(REDUCED_MOTION_QUERY).matches
}

function getServerMotionPreference(): boolean {
  return false
}

function usePrefersReducedMotion(): boolean {
  return useSyncExternalStore(
    subscribeToMotionPreference,
    getMotionPreference,
    getServerMotionPreference,
  )
}

export default function AiMessagePanel() {
  const reducedMotion = usePrefersReducedMotion()
  const [status, setStatus] = useState<StreamStatus>('streaming')
  const [displayed, setDisplayed] = useState('')
  const [tokenIndex, setTokenIndex] = useState(0)
  const [expandedCitationId, setExpandedCitationId] = useState<CitationId | null>('grid-focus')
  const scrollRef = useRef<HTMLDivElement | null>(null)

  const expandedCitation = useMemo(
    () => CITATIONS.find((citation) => citation.id === expandedCitationId) ?? null,
    [expandedCitationId],
  )

  useEffect(() => {
    if (status !== 'streaming') return

    if (reducedMotion) {
      const timer = setTimeout(() => {
        setTokenIndex(RESPONSE_TOKENS.length)
        setDisplayed(ASSISTANT_RESPONSE)
        setStatus('done')
      }, 80)
      return () => clearTimeout(timer)
    }

    const token = RESPONSE_TOKENS[tokenIndex]
    if (token === undefined) {
      return
    }

    const timer = setTimeout(
      () => {
        setDisplayed((current) => current + token)
        setTokenIndex((current) => current + 1)
        if (tokenIndex + 1 >= RESPONSE_TOKENS.length) {
          setStatus('done')
        }
      },
      tokenDelay(token, reducedMotion),
    )

    return () => clearTimeout(timer)
  }, [reducedMotion, status, tokenIndex])

  useEffect(() => {
    if (!scrollRef.current) return
    scrollRef.current.scrollTop = scrollRef.current.scrollHeight
  }, [displayed, expandedCitationId])

  function stopStream() {
    setStatus('stopped')
  }

  function regenerate() {
    setTokenIndex(0)
    setDisplayed('')
    setExpandedCitationId('grid-focus')
    setStatus('streaming')
  }

  return (
    <div className="mx-auto w-full max-w-md overflow-hidden rounded-(--radius-card) border border-(--color-border) bg-(--color-surface) text-sm">
      <style>{`
        @keyframes ai-cursor-blink {
          0%, 100% { opacity: 1; }
          50% { opacity: 0; }
        }

        @media (prefers-reduced-motion: reduce) {
          .ai-cursor { animation: none !important; }
        }
      `}</style>

      <div className="flex items-baseline justify-between gap-3 border-b border-(--color-border) px-5 py-4">
        <p className="text-(--color-fg)">Launch readiness</p>
        <span className="font-mono text-[10px] tracking-[0.14em] text-(--color-fg-subtle) uppercase">
          {status === 'streaming' ? 'Generating' : status === 'done' ? 'Complete' : 'Stopped'}
        </span>
      </div>

      <div
        ref={scrollRef}
        className="scrollbar-thin max-h-[320px] space-y-5 overflow-y-auto bg-(--color-bg) px-5 py-6"
      >
        <section
          aria-label="User message"
          className="ml-auto max-w-[82%] rounded-(--radius-card) rounded-tr-md border border-(--color-border-strong) bg-(--color-surface-hover) px-4 py-3 leading-relaxed text-(--color-fg)"
        >
          {USER_PROMPT}
        </section>

        <section aria-label="Assistant message" className="max-w-[94%]">
          <p
            aria-live="polite"
            // aria-busy true while streaming suppresses per-token announcements
            // (~every 50ms); on completion it flips false so the finished
            // response is announced once as a single polite update.
            aria-busy={status === 'streaming'}
            className="min-h-24 leading-relaxed text-(--color-fg)"
          >
            {displayed}
            {status === 'streaming' ? (
              <span
                aria-hidden="true"
                className="ai-cursor ml-0.5 inline-block h-4 w-1 translate-y-0.5 rounded-full bg-(--color-accent)"
                style={{ animation: 'ai-cursor-blink 860ms steps(1) infinite' }}
              />
            ) : null}
          </p>

          <div className="mt-5 flex flex-wrap gap-2" aria-label="Citations">
            {CITATIONS.map((citation) => {
              const expanded = expandedCitationId === citation.id
              return (
                <button
                  key={citation.id}
                  type="button"
                  onClick={() => setExpandedCitationId(expanded ? null : citation.id)}
                  aria-expanded={expanded}
                  className="rounded-md border px-2.5 py-1 font-mono text-[10px] transition-colors data-[on=true]:border-(--color-border-strong) data-[on=true]:bg-(--color-surface) data-[on=true]:text-(--color-fg) data-[on=false]:border-(--color-border) data-[on=false]:text-(--color-fg-subtle) data-[on=false]:hover:text-(--color-fg-muted)"
                  data-on={expanded}
                >
                  [{citation.marker}] {citation.title}
                </button>
              )
            })}
          </div>

          {expandedCitation ? (
            <aside className="mt-3 rounded-(--radius-card) border border-(--color-border) bg-(--color-surface) px-4 py-3">
              <p className="text-xs leading-relaxed text-(--color-fg-muted)">
                {expandedCitation.quote}
              </p>
              <p className="mt-2.5 font-mono text-[10px] tracking-[0.12em] text-(--color-fg-subtle) uppercase">
                {expandedCitation.source}
              </p>
            </aside>
          ) : null}
        </section>
      </div>

      <div className="flex flex-wrap items-center justify-between gap-3 border-t border-(--color-border) px-5 py-4">
        <span
          className="font-mono text-[10px] text-(--color-fg-subtle)"
          aria-live="polite"
          // The running "n / m tokens" count ticks every token; aria-busy holds
          // announcements until streaming ends, then the final summary is read once.
          aria-busy={status === 'streaming'}
        >
          {status === 'streaming'
            ? `${tokenIndex} / ${RESPONSE_TOKENS.length} tokens`
            : status === 'done'
              ? `${RESPONSE_TOKENS.length} tokens · ${CITATIONS.length} sources`
              : `Stopped at ${tokenIndex} tokens`}
        </span>
        <div className="flex gap-2">
          {status === 'streaming' ? (
            <button
              type="button"
              onClick={stopStream}
              className="rounded-md border border-(--color-border) px-3 py-1.5 text-xs text-(--color-fg-muted) transition-colors hover:text-(--color-fg)"
            >
              Stop
            </button>
          ) : null}
          <button
            type="button"
            onClick={regenerate}
            className="rounded-md border border-(--color-border-strong) bg-(--color-surface-hover) px-3 py-1.5 text-xs text-(--color-fg) transition-colors hover:border-(--color-accent)"
          >
            Regenerate
          </button>
        </div>
      </div>
    </div>
  )
}

My earlier ai-stream demo was about pacing: how token timing changes the way a generated answer feels. This panel takes the same idea one step closer to real product UI. The message has a user prompt, a streamed assistant answer, controls for stopping and regenerating, and citations that expand inline so the reader doesn't get sent away from the answer.

The citations aren't decorative. Each chip has a marker that matches the assistant text, an expanded state, and a short source excerpt. In production that source would need a durable document id and a permission check, but the interaction is the same: you can check the model's claim right when you're deciding whether to trust it.

Accessibility shapes the streaming behavior. The answer uses a polite live region so screen readers can announce changes without interrupting the current task. The status label says whether the response is generating, complete, or stopped, and the controls stay ordinary buttons instead of custom divs with click handlers.

Motion is restrained on purpose. The small activity meter and cursor give sighted users a state signal during generation, but prefers-reduced-motion removes the pulsing and shortens the token delay so it doesn't turn into a forced animation.

I18n formatting playgroundi18n

Virtualized tabledata

Command paletteaccessibility

AI message panel

AI message panel

Related